Skip to content

Commit c965f4c

Browse files
authored
update bert config (tinygrad#9555)
BEAM 4->5 for green, 2% faster; use AMD driver instead of AM for red, 5% faster
1 parent d734e24 commit c965f4c

File tree

2 files changed

+5
-1
lines changed

2 files changed

+5
-1
lines changed

examples/mlperf/training_submission_v5.0/tinycorp/benchmarks/bert/implementations/tinybox_green/run_and_time.sh

+1 -1
Original file line numberDiff line numberDiff line change
@@ -5,7 +5,7 @@ export MODEL="bert"
55
export SUBMISSION_PLATFORM="tinybox_green"
66
export DEFAULT_FLOAT="HALF" SUM_DTYPE="HALF" GPUS=6 BS=96 EVAL_BS=96
77

8-
export BEAM=4 BEAM_UOPS_MAX=3000 BEAM_UPCAST_MAX=256 BEAM_LOCAL_MAX=1024 BEAM_MIN_PROGRESS=5
8+
export BEAM=5 BEAM_UOPS_MAX=3000 BEAM_UPCAST_MAX=256 BEAM_LOCAL_MAX=1024 BEAM_MIN_PROGRESS=5
99
export IGNORE_JIT_FIRST_BEAM=1
1010
export BASEDIR="/raid/datasets/wiki"
1111

examples/mlperf/training_submission_v5.0/tinycorp/benchmarks/bert/implementations/tinybox_red/run_and_time.sh

+4
Original file line numberDiff line numberDiff line change
@@ -17,7 +17,11 @@ DATETIME=$(date "+%m%d%H%M")
1717
LOGFILE="bert_red_${DATETIME}_${SEED}.log"
1818

1919
# init
20+
sudo rmmod amdgpu || true
2021
BENCHMARK=10 INITMLPERF=1 RESET_STEP=1 BEAM_LOG_SURPASS_MAX=1 python3 examples/mlperf/model_train.py | tee $LOGFILE
2122

2223
# run
24+
# TODO: AMD driver hangs during init, but is 5% faster per step in real run.
25+
sudo modprobe amdgpu
2326
PARALLEL=0 RUNMLPERF=1 python3 examples/mlperf/model_train.py | tee -a $LOGFILE
27+
sudo rmmod amdgpu || true

0 commit comments

Comments
 (0)