From 035464b6a0cea2e6fe6c5de956f07f8c305b3c55 Mon Sep 17 00:00:00 2001 From: r-sarma <126173968+r-sarma@users.noreply.github.com> Date: Fri, 8 Dec 2023 20:52:36 +0530 Subject: [PATCH] Update general_startscript --- experimental/trainer/general_startscript | 7 +++---- 1 file changed, 3 insertions(+), 4 deletions(-) diff --git a/experimental/trainer/general_startscript b/experimental/trainer/general_startscript index a39d034f..455466b4 100755 --- a/experimental/trainer/general_startscript +++ b/experimental/trainer/general_startscript @@ -26,7 +26,7 @@ strategy='DS' # parameters debug=false # do debug bs=32 # batch-size -epochs=4 # epochs +epochs=1 # epochs lr=0.01 # learning rate # AT @@ -68,13 +68,13 @@ if [ "$SLURM_CPUS_PER_TASK" > 0 ] ; then export OMP_NUM_THREADS=$SLURM_CPUS_PER_TASK fi -COMMAND="general_trainer.py" +COMMAND="general_trainer_v2.py" #launch if [[ $strategy == *"HVD"* ]]; then EXEC="$COMMAND \ - --strat $strategy \ + --strategy $strategy \ --batch-size $bs \ --epochs $epochs \ --lr $lr \ @@ -133,4 +133,3 @@ else $EXEC --deepspeed_mpi --deepspeed_config DS_config.json fi -