fix script again

This commit is contained in:
Meeeeee6623 2021-09-20 23:20:01 -04:00
parent b0de218fcc
commit dbf04bae44

View file

@ -1,14 +1,17 @@
# nvidia-docker run --rm -it --ipc=host -v /work/chauhans/imagenet:/imagenet rn50_tf1
for (( n = 0; i < 3; n++ )); do
for (( i = 0; i < 91; i++ )); do
for (( n = 0; i < 3; n++ ));
do
mkdir /imagenet/TensorFlow/run_"${i}"/model
for (( i = 0; i < 91; i++ ));
do
mkdir /imagenet/TensorFlow/run_"${n}"/epoch_"${i}"/
echo "Created Folder epoch_${i}"
mpiexec --allow-run-as-root --bind-to socket -np 2 python3 main.py --arch=resnet50 --mode=train_and_evaluate \
--num_iter="${i}" --batch_size=192 --warmup_steps=0 --lr_warmup_epochs=0 --model_dir=/imagenet/TensorFlow/model \
--num_iter="${i}" --batch_size=192 --warmup_steps=0 --lr_warmup_epochs=0 --model_dir=/imagenet/TensorFlow/run_"${i}"/model \
--data_dir=/imagenet/tfrecords --data_idx_dir=/imagenet/dali_idx \
--results_dir=/imagenet/TensorFlow/run_"${n}"/epoch_"${i}"/ \
--export_dir=/imagenet/TensorFlow/model --weight_init=fan_in --amp --log_filename run_"${n}"epoch_"${i}".json
--export_dir=/imagenet/TensorFlow/run_"${i}"/model --weight_init=fan_in --amp --log_filename run_"${n}"epoch_"${i}".json
echo "Epoch ${i} done"
done
echo "Run ${n} done"