diff options
Diffstat (limited to 'tests/interface/input-tsv/test_tsv_train_restore_from_stdin.sh')
-rw-r--r-- | tests/interface/input-tsv/test_tsv_train_restore_from_stdin.sh | 4 |
1 files changed, 2 insertions, 2 deletions
diff --git a/tests/interface/input-tsv/test_tsv_train_restore_from_stdin.sh b/tests/interface/input-tsv/test_tsv_train_restore_from_stdin.sh index 4783e76..f8953ef 100644 --- a/tests/interface/input-tsv/test_tsv_train_restore_from_stdin.sh +++ b/tests/interface/input-tsv/test_tsv_train_restore_from_stdin.sh @@ -11,12 +11,12 @@ test -e vocab.de.yml || $MRT_MARIAN/marian-vocab < train.bpe.de > vocab.de.yml test -e vocab.en.yml || $MRT_MARIAN/marian-vocab < train.bpe.en > vocab.en.yml # TODO: Weight decaying in Adam is disabled, because it gives unstable results on GPU -extra_opts="--no-shuffle --seed 2222 --maxi-batch 1 --maxi-batch-sort none --mini-batch 16 --dim-emb 128 --dim-rnn 256 --disp-freq 2 --type s2s --sync-sgd --optimizer sgd" +extra_opts="--no-shuffle --seed 2222 --maxi-batch 1 --maxi-batch-sort none --mini-batch 16 --dim-emb 128 --dim-rnn 256 --disp-freq 2 --type s2s --sync-sgd --optimizer sgd --cost-type ce-mean" # Step 1: Train a model in one go, up to the update no. 70, and save training logs #$MRT_MARIAN/marian \ #-m restore_stdin/model_full.npz -t train.bpe.{en,de} -v vocab.en.yml vocab.de.yml \ - #--after-batches 60 $extra_opts \ + #--cost-type ce-mean --after-batches 60 $extra_opts \ #--log restore_stdin.log #test -e restore_stdin/model_full.npz |