Update tests for multi-gpu training

author: Roman Grundkiewicz <rgrundkiewicz@gmail.com> 2020-10-21 14:58:25 +0300
committer: Roman Grundkiewicz <rgrundkiewicz@gmail.com> 2020-10-21 14:58:25 +0300
commit: 0ca3c2877f205170db6260ef379162bccfea35f1 (patch)
tree: 2f474dcc983976a245359d00d3850dfe0f465514 /tests
parent: b7f466c361d593a247fc866ad25ef4458cfb597e (diff)
6 files changed, 8 insertions, 4 deletions
diff --git a/tests/training/multi-gpu/test_async_sgd_runs.sh b/tests/training/multi-gpu/test_async_sgd_runs.sh
index 1094cd2..5043548 100644
--- a/tests/training/multi-gpu/test_async_sgd_runs.sh
+++ b/tests/training/multi-gpu/test_async_sgd_runs.sh
@@ -13,7 +13,7 @@ rm -rf async_sgd async_sgd.log
 mkdir -p async_sgd
 
 $MRT_MARIAN/marian \
-    --no-shuffle --seed 1111 --maxi-batch 1 --maxi-batch-sort none --dim-emb 128 --dim-rnn 256 \
+    --no-shuffle --seed 1111 --maxi-batch 1 --maxi-batch-sort none --dim-emb 128 --dim-rnn 256 --cost-type ce-mean \
     --devices 0 1 \
     -m async_sgd/model.npz -t $MRT_DATA/europarl.de-en/corpus.bpe.{en,de} -v vocab.en.yml vocab.de.yml \
     --disp-freq 20 --after-batches 400 \
diff --git a/tests/training/multi-gpu/test_sync_sgd.sh b/tests/training/multi-gpu/test_sync_sgd.sh
index ac2d009..ca29645 100644
--- a/tests/training/multi-gpu/test_sync_sgd.sh
+++ b/tests/training/multi-gpu/test_sync_sgd.sh
@@ -15,7 +15,7 @@ mkdir -p sync_sgd
 $MRT_MARIAN/marian \
     --no-shuffle --seed 777 --mini-batch 4 --maxi-batch 1 --maxi-batch-sort none \
     --dim-rnn 64 --dim-emb 32 --learn-rate 0.001 --clip-norm 0 \
-    --devices 0 1 --sync-sgd --optimizer sgd \
+    --devices 0 1 --sync-sgd --optimizer sgd --cost-type ce-mean \
     -m sync_sgd/model.full.npz -t $MRT_DATA/europarl.de-en/corpus.bpe.{en,de} -v vocab.en.yml vocab.de.yml \
     --disp-freq 10 --after-batches 100 \
     --log sync_sgd.log
diff --git a/tests/training/multi-gpu/test_sync_sgd_1gpu.sh b/tests/training/multi-gpu/test_sync_sgd_1gpu.sh
index e3a8255..2b9c72b 100644
--- a/tests/training/multi-gpu/test_sync_sgd_1gpu.sh
+++ b/tests/training/multi-gpu/test_sync_sgd_1gpu.sh
@@ -10,7 +10,7 @@ mkdir -p sync_sgd_1gpu
 $MRT_MARIAN/marian \
     --no-shuffle --seed 888 --mini-batch 4 --maxi-batch 1 --maxi-batch-sort none \
     --dim-rnn 64 --dim-emb 32 --learn-rate 0.1 \
-    --devices 0 --sync-sgd --optimizer sgd \
+    --devices 0 --sync-sgd --optimizer sgd --cost-type ce-mean \
     -m sync_sgd_1gpu/model.npz -t $MRT_DATA/europarl.de-en/corpus.bpe.{en,de} -v vocab.en.yml vocab.de.yml \
     --disp-freq 5 --save-freq 10 --after-batches 20 \
     --log sync_sgd_1gpu.log
diff --git a/tests/training/multi-gpu/test_sync_sgd_1gpu_expsmooth.sh b/tests/training/multi-gpu/test_sync_sgd_1gpu_expsmooth.sh
index 510aa26..d1d77d3 100644
--- a/tests/training/multi-gpu/test_sync_sgd_1gpu_expsmooth.sh
+++ b/tests/training/multi-gpu/test_sync_sgd_1gpu_expsmooth.sh
@@ -10,7 +10,7 @@ mkdir -p sync_sgd_1gpu_expsmooth
 $MRT_MARIAN/marian \
     --no-shuffle --seed 888 --mini-batch 4 --maxi-batch 1 --maxi-batch-sort none \
     --dim-rnn 64 --dim-emb 32 --learn-rate 0.1 \
-    --devices 0 --sync-sgd --optimizer sgd --exponential-smoothing \
+    --devices 0 --sync-sgd --optimizer sgd --exponential-smoothing --cost-type ce-mean \
     -m sync_sgd_1gpu_expsmooth/model.npz -t $MRT_DATA/europarl.de-en/corpus.bpe.{en,de} -v vocab.en.yml vocab.de.yml \
     --disp-freq 5 --save-freq 10 --after-batches 20 \
     --log sync_sgd_1gpu_expsmooth.log
diff --git a/tests/training/restarting/test_sgd_for_two_epochs.sh b/tests/training/restarting/test_sgd_for_two_epochs.sh
index abef975..ad92b5f 100644
--- a/tests/training/restarting/test_sgd_for_two_epochs.sh
+++ b/tests/training/restarting/test_sgd_for_two_epochs.sh
@@ -8,6 +8,8 @@ rm -rf sgd_2e sgd_1st_epoch.log sgd_2nd_epoch.log
 mkdir -p sgd_2e
 
 extra_opts="--no-shuffle --seed 1111 --maxi-batch 1 --maxi-batch-sort none --mini-batch 32 --optimizer sgd"
+# Added because the default options have changed
+extra_opts="$extra_opts --cost-type ce-mean --disp-label-counts false"
 
 
 # Uncomment to prepare the expected output
diff --git a/tests/training/restarting/test_sgd_for_two_epochs_sync.sh b/tests/training/restarting/test_sgd_for_two_epochs_sync.sh
index 4808894..d3ee295 100644
--- a/tests/training/restarting/test_sgd_for_two_epochs_sync.sh
+++ b/tests/training/restarting/test_sgd_for_two_epochs_sync.sh
@@ -8,6 +8,8 @@ rm -rf sgd_sync_2e sgd_sync_*_epoch.log
 mkdir -p sgd_sync_2e
 
 extra_opts="--no-shuffle --seed 1111 --maxi-batch 1 --maxi-batch-sort none --mini-batch 32 --optimizer sgd --sync-sgd"
+# Added because the default options have changed
+extra_opts="$extra_opts --cost-type ce-mean --disp-label-counts false"
 
 
 # Uncomment to prepare the expected output
author	Roman Grundkiewicz <rgrundkiewicz@gmail.com>	2020-10-21 14:58:25 +0300
committer	Roman Grundkiewicz <rgrundkiewicz@gmail.com>	2020-10-21 14:58:25 +0300
commit	0ca3c2877f205170db6260ef379162bccfea35f1 (patch)
tree	2f474dcc983976a245359d00d3850dfe0f465514 /tests
parent	b7f466c361d593a247fc866ad25ef4458cfb597e (diff)