Skip to content

Commit aaf5084

Browse files
committed
updates
1 parent b12c7dd commit aaf5084

File tree

3 files changed

+4
-4
lines changed

3 files changed

+4
-4
lines changed

TensorFlow/LanguageModeling/BERT/scripts/run_pretraining_lamb.sh

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -22,7 +22,7 @@ learning_rate_phase1=${4:-"7.5e-4"}
2222
learning_rate_phase2=${5:-"5e-4"}
2323
precision=${6:-"fp16"}
2424
use_xla=${7:-"true"}
25-
num_gpus=${8:-1}
25+
num_gpus=${8:-8}
2626
warmup_steps_phase1=${9:-"2000"}
2727
warmup_steps_phase2=${10:-"200"}
2828
train_steps=${11:-7820}

TensorFlow/LanguageModeling/BERT/scripts/run_pretraining_lamb_phase1.sh

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -22,7 +22,7 @@ learning_rate_phase1=${4:-"7.5e-4"}
2222
learning_rate_phase2=${5:-"5e-4"}
2323
precision=${6:-"fp16"}
2424
use_xla=${7:-"true"}
25-
num_gpus=${8:-1}
25+
num_gpus=${8:-2}
2626
warmup_steps_phase1=${9:-"2000"}
2727
warmup_steps_phase2=${10:-"200"}
2828
train_steps=${11:-7820}
@@ -60,7 +60,7 @@ fi
6060

6161
mpi=""
6262
if [ $num_gpus -gt 1 ] ; then
63-
mpi="mpiexec --allow-run-as-root -np $num_gpus --bind-to socket"
63+
mpi="mpiexec --allow-run-as-root -np $num_gpus --bind-to socket --oversubscribe"
6464
fi
6565

6666
#PHASE 1

TensorFlow/LanguageModeling/BERT/scripts/run_pretraining_lamb_phase2.sh

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -22,7 +22,7 @@ learning_rate_phase1=${4:-"7.5e-4"}
2222
learning_rate_phase2=${5:-"5e-4"}
2323
precision=${6:-"fp16"}
2424
use_xla=${7:-"true"}
25-
num_gpus=${8:-1}
25+
num_gpus=${8:-2}
2626
warmup_steps_phase1=${9:-"2000"}
2727
warmup_steps_phase2=${10:-"200"}
2828
train_steps=${11:-7820}

0 commit comments

Comments
 (0)