Skip to content

Commit ec02197

Browse files
matrix small/large model with few/many files
Signed-off-by: Spencer Schrock <[email protected]>
1 parent 70a2781 commit ec02197

File tree

1 file changed

+11
-14
lines changed

1 file changed

+11
-14
lines changed

benchmarks/run.sh

Lines changed: 11 additions & 14 deletions
Original file line number | Diff line number | Diff line change
@@ -6,20 +6,17 @@ OUTPUT_DIR=$2
66
REVISION=$3
77
FILENAME_BASE=$OUTPUT_DIR/$(date --utc +%Y%m%d%H%M%S)_$REVISION
88

9-
for SIZE in 32 48 128; do
10-
MODEL=${SIZE}gb
11-
MODEL_PATH=$MODEL_DIR/$MODEL
12-
mkdir -p MODEL_PATH
13-
14-
# simulate a handful of small metadata files in the repository
15-
hatch run bench.py3.11:generate dir --root "$MODEL_PATH" -n 8 16384
16-
# followed by model shards which are 8GiB each
17-
N=$((${SIZE}/8))
18-
SIZE_BYTES=$(($SIZE * 1024 * 1024 * 1024))
19-
hatch run bench.py3.11:generate dir --root "$MODEL_PATH" -n "$N" "$SIZE_BYTES"
20-
21-
hatch run bench.py3.11:python benchmarks/time_serialize.py "$MODEL_PATH" \
22-
--output="${FILENAME_BASE}_${MODEL}.json"
9+
for SIZE in 32 256; do
10+
for FILES in 64 512; do
11+
MODEL=${SIZE}gb_${FILES}files
12+
MODEL_PATH=$MODEL_DIR/$MODEL
13+
mkdir -p "$MODEL_PATH"
14+
SIZE_BYTES=$((SIZE * 1024 * 1024 * 1024))
15+
hatch run bench.py3.11:generate dir --root "$MODEL_PATH" -n "$FILES" "$SIZE_BYTES"
16+
hatch run bench.py3.11:python benchmarks/time_serialize.py "$MODEL_PATH" \
17+
--output="${FILENAME_BASE}_${MODEL}.json"
18+
rm -r "${MODEL_PATH}"
19+
done
2320
done
2421

2522

0 commit comments

Comments
 (0)