File tree: 3 files changed, +4 -4 lines changed
TensorFlow/LanguageModeling/BERT/scripts: 3 files changed, +4 -4 lines changed
Original file line number | Diff line number | Diff line change
@@ -22,7 +22,7 @@ learning_rate_phase1=${4:-"7.5e-4"}
22 22 learning_rate_phase2=${5:-"5e-4"}
23 23 precision=${6:-"fp16"}
24 24 use_xla=${7:-"true"}
25 - num_gpus=${8:-1}
25 + num_gpus=${8:-8}
26 26 warmup_steps_phase1=${9:-"2000"}
27 27 warmup_steps_phase2=${10:-"200"}
28 28 train_steps=${11:-7820}
Original file line number | Diff line number | Diff line change
@@ -22,7 +22,7 @@ learning_rate_phase1=${4:-"7.5e-4"}
22 22 learning_rate_phase2=${5:-"5e-4"}
23 23 precision=${6:-"fp16"}
24 24 use_xla=${7:-"true"}
25 - num_gpus=${8:-1}
25 + num_gpus=${8:-2}
26 26 warmup_steps_phase1=${9:-"2000"}
27 27 warmup_steps_phase2=${10:-"200"}
28 28 train_steps=${11:-7820}
60 60
61 61 mpi=""
62 62 if [ $num_gpus -gt 1 ] ; then
63 - mpi="mpiexec --allow-run-as-root -np $num_gpus --bind-to socket"
63 + mpi="mpiexec --allow-run-as-root -np $num_gpus --bind-to socket --oversubscribe "
64 64 fi
65 65
66 66 # PHASE 1
Original file line number | Diff line number | Diff line change
@@ -22,7 +22,7 @@ learning_rate_phase1=${4:-"7.5e-4"}
22 22 learning_rate_phase2=${5:-"5e-4"}
23 23 precision=${6:-"fp16"}
24 24 use_xla=${7:-"true"}
25 - num_gpus=${8:-1}
25 + num_gpus=${8:-2}
26 26 warmup_steps_phase1=${9:-"2000"}
27 27 warmup_steps_phase2=${10:-"200"}
28 28 train_steps=${11:-7820}
You can’t perform that action at this time.
0 commit comments