diff options
author | Roman Grundkiewicz <rgrundkiewicz@gmail.com> | 2020-10-21 14:58:25 +0300 |
---|---|---|
committer | Roman Grundkiewicz <rgrundkiewicz@gmail.com> | 2020-10-21 14:58:25 +0300 |
commit | 0ca3c2877f205170db6260ef379162bccfea35f1 (patch) | |
tree | 2f474dcc983976a245359d00d3850dfe0f465514 /tests | |
parent | b7f466c361d593a247fc866ad25ef4458cfb597e (diff) |
Update tests for multi-gpu training
Diffstat (limited to 'tests')
6 files changed, 8 insertions, 4 deletions
diff --git a/tests/training/multi-gpu/test_async_sgd_runs.sh b/tests/training/multi-gpu/test_async_sgd_runs.sh index 1094cd2..5043548 100644 --- a/tests/training/multi-gpu/test_async_sgd_runs.sh +++ b/tests/training/multi-gpu/test_async_sgd_runs.sh @@ -13,7 +13,7 @@ rm -rf async_sgd async_sgd.log mkdir -p async_sgd $MRT_MARIAN/marian \ - --no-shuffle --seed 1111 --maxi-batch 1 --maxi-batch-sort none --dim-emb 128 --dim-rnn 256 \ + --no-shuffle --seed 1111 --maxi-batch 1 --maxi-batch-sort none --dim-emb 128 --dim-rnn 256 --cost-type ce-mean \ --devices 0 1 \ -m async_sgd/model.npz -t $MRT_DATA/europarl.de-en/corpus.bpe.{en,de} -v vocab.en.yml vocab.de.yml \ --disp-freq 20 --after-batches 400 \ diff --git a/tests/training/multi-gpu/test_sync_sgd.sh b/tests/training/multi-gpu/test_sync_sgd.sh index ac2d009..ca29645 100644 --- a/tests/training/multi-gpu/test_sync_sgd.sh +++ b/tests/training/multi-gpu/test_sync_sgd.sh @@ -15,7 +15,7 @@ mkdir -p sync_sgd $MRT_MARIAN/marian \ --no-shuffle --seed 777 --mini-batch 4 --maxi-batch 1 --maxi-batch-sort none \ --dim-rnn 64 --dim-emb 32 --learn-rate 0.001 --clip-norm 0 \ - --devices 0 1 --sync-sgd --optimizer sgd \ + --devices 0 1 --sync-sgd --optimizer sgd --cost-type ce-mean \ -m sync_sgd/model.full.npz -t $MRT_DATA/europarl.de-en/corpus.bpe.{en,de} -v vocab.en.yml vocab.de.yml \ --disp-freq 10 --after-batches 100 \ --log sync_sgd.log diff --git a/tests/training/multi-gpu/test_sync_sgd_1gpu.sh b/tests/training/multi-gpu/test_sync_sgd_1gpu.sh index e3a8255..2b9c72b 100644 --- a/tests/training/multi-gpu/test_sync_sgd_1gpu.sh +++ b/tests/training/multi-gpu/test_sync_sgd_1gpu.sh @@ -10,7 +10,7 @@ mkdir -p sync_sgd_1gpu $MRT_MARIAN/marian \ --no-shuffle --seed 888 --mini-batch 4 --maxi-batch 1 --maxi-batch-sort none \ --dim-rnn 64 --dim-emb 32 --learn-rate 0.1 \ - --devices 0 --sync-sgd --optimizer sgd \ + --devices 0 --sync-sgd --optimizer sgd --cost-type ce-mean \ -m sync_sgd_1gpu/model.npz -t $MRT_DATA/europarl.de-en/corpus.bpe.{en,de} -v vocab.en.yml vocab.de.yml \ --disp-freq 5 --save-freq 10 --after-batches 20 \ --log sync_sgd_1gpu.log diff --git a/tests/training/multi-gpu/test_sync_sgd_1gpu_expsmooth.sh b/tests/training/multi-gpu/test_sync_sgd_1gpu_expsmooth.sh index 510aa26..d1d77d3 100644 --- a/tests/training/multi-gpu/test_sync_sgd_1gpu_expsmooth.sh +++ b/tests/training/multi-gpu/test_sync_sgd_1gpu_expsmooth.sh @@ -10,7 +10,7 @@ mkdir -p sync_sgd_1gpu_expsmooth $MRT_MARIAN/marian \ --no-shuffle --seed 888 --mini-batch 4 --maxi-batch 1 --maxi-batch-sort none \ --dim-rnn 64 --dim-emb 32 --learn-rate 0.1 \ - --devices 0 --sync-sgd --optimizer sgd --exponential-smoothing \ + --devices 0 --sync-sgd --optimizer sgd --exponential-smoothing --cost-type ce-mean \ -m sync_sgd_1gpu_expsmooth/model.npz -t $MRT_DATA/europarl.de-en/corpus.bpe.{en,de} -v vocab.en.yml vocab.de.yml \ --disp-freq 5 --save-freq 10 --after-batches 20 \ --log sync_sgd_1gpu_expsmooth.log diff --git a/tests/training/restarting/test_sgd_for_two_epochs.sh b/tests/training/restarting/test_sgd_for_two_epochs.sh index abef975..ad92b5f 100644 --- a/tests/training/restarting/test_sgd_for_two_epochs.sh +++ b/tests/training/restarting/test_sgd_for_two_epochs.sh @@ -8,6 +8,8 @@ rm -rf sgd_2e sgd_1st_epoch.log sgd_2nd_epoch.log mkdir -p sgd_2e extra_opts="--no-shuffle --seed 1111 --maxi-batch 1 --maxi-batch-sort none --mini-batch 32 --optimizer sgd" +# Added because default options has changes +extra_opts="$extra_opts --cost-type ce-mean --disp-label-counts false" # Uncomment to prepare the expected output diff --git a/tests/training/restarting/test_sgd_for_two_epochs_sync.sh b/tests/training/restarting/test_sgd_for_two_epochs_sync.sh index 4808894..d3ee295 100644 --- a/tests/training/restarting/test_sgd_for_two_epochs_sync.sh +++ b/tests/training/restarting/test_sgd_for_two_epochs_sync.sh @@ -8,6 +8,8 @@ rm -rf sgd_sync_2e sgd_sync_*_epoch.log mkdir -p sgd_sync_2e extra_opts="--no-shuffle --seed 1111 --maxi-batch 1 --maxi-batch-sort none --mini-batch 32 --optimizer sgd --sync-sgd" +# Added because default options has changes +extra_opts="$extra_opts --cost-type ce-mean --disp-label-counts false" # Uncomment to prepare the expected output |