diff options
author | Roman Grundkiewicz <rgrundkiewicz@gmail.com> | 2020-11-12 22:23:12 +0300 |
---|---|---|
committer | Roman Grundkiewicz <rgrundkiewicz@gmail.com> | 2020-11-12 22:23:12 +0300 |
commit | 8766bda24335590fb1ddade32e4e22f9788bc5f9 (patch) | |
tree | 3ddf112d78e49161dbe3bda9c84e6f5019e17416 /tests | |
parent | d6984d545a883ec74406e048f0db0abf581294cf (diff) |
Use clip-norm 0 in training/models/
Diffstat (limited to 'tests')
-rw-r--r-- | tests/training/models/lm/lm-transformer.expected | 10 | ||||
-rw-r--r-- | tests/training/models/lm/lm-transformer.scores.expected | 20 | ||||
-rw-r--r-- | tests/training/models/lm/lm.expected | 10 | ||||
-rw-r--r-- | tests/training/models/lm/lm.scores.expected | 20 | ||||
-rw-r--r-- | tests/training/models/lm/test_lm-transformer.sh | 2 | ||||
-rw-r--r-- | tests/training/models/lm/test_lm.sh | 2 | ||||
-rw-r--r-- | tests/training/models/multi-source/multi-s2s.expected | 10 | ||||
-rw-r--r-- | tests/training/models/multi-source/multi-transformer.expected | 10 | ||||
-rw-r--r-- | tests/training/models/multi-source/test_multi-s2s.sh | 2 | ||||
-rw-r--r-- | tests/training/models/multi-source/test_multi-transformer.sh | 2 | ||||
-rw-r--r-- | tests/training/models/transformer/test_transformer.sh | 2 | ||||
-rw-r--r-- | tests/training/models/transformer/transformer.expected | 20 |
12 files changed, 55 insertions, 55 deletions
diff --git a/tests/training/models/lm/lm-transformer.expected b/tests/training/models/lm/lm-transformer.expected index a5e9556..593d94e 100644 --- a/tests/training/models/lm/lm-transformer.expected +++ b/tests/training/models/lm/lm-transformer.expected @@ -1,5 +1,5 @@ -405.95352173 -277.85601807 -198.49377441 -135.86233521 -74.85224152 +406.14587402 +279.24975586 +201.01249695 +139.34625244 +78.13222504 diff --git a/tests/training/models/lm/lm-transformer.scores.expected b/tests/training/models/lm/lm-transformer.scores.expected index d40b653..ed3599e 100644 --- a/tests/training/models/lm/lm-transformer.scores.expected +++ b/tests/training/models/lm/lm-transformer.scores.expected @@ -1,10 +1,10 @@ --90.117882 --179.877197 --81.371750 --204.165802 --636.969482 --131.934113 --359.475616 --56.732944 --68.373947 --100.774132 +-94.390747 +-187.140671 +-85.050323 +-211.180054 +-645.849121 +-136.817657 +-366.460815 +-57.487789 +-72.613792 +-102.306747 diff --git a/tests/training/models/lm/lm.expected b/tests/training/models/lm/lm.expected index c6b5c74..dc0ae65 100644 --- a/tests/training/models/lm/lm.expected +++ b/tests/training/models/lm/lm.expected @@ -1,5 +1,5 @@ -410.02645874 -306.52648926 -233.58132935 -167.19117737 -91.86805725 +410.03164673 +306.58309937 +233.76004028 +167.80232239 +92.23210144 diff --git a/tests/training/models/lm/lm.scores.expected b/tests/training/models/lm/lm.scores.expected index 9ea8ae4..b42cd9b 100644 --- a/tests/training/models/lm/lm.scores.expected +++ b/tests/training/models/lm/lm.scores.expected @@ -1,10 +1,10 @@ --114.927658 --208.074463 --102.252083 --244.505508 --677.256836 --154.783279 --411.580017 --58.307816 --89.968994 --111.055710 +-114.125137 +-206.581238 +-101.570534 +-242.844177 +-673.484863 +-153.583893 +-409.248169 +-57.871357 +-89.267410 +-110.574005 diff --git a/tests/training/models/lm/test_lm-transformer.sh b/tests/training/models/lm/test_lm-transformer.sh index 476c2e2..aa2188c 100644 --- a/tests/training/models/lm/test_lm-transformer.sh +++ b/tests/training/models/lm/test_lm-transformer.sh @@ -14,7 +14,7 @@ rm -rf lm-transformer lm-transformer.log mkdir -p lm-transformer $MRT_MARIAN/marian \ - --seed 1111 --no-shuffle \ + --seed 1111 --no-shuffle --clip-norm 0 \ --type lm-transformer --dim-emb 128 --dim-rnn 256 --cost-type ce-mean \ -m lm-transformer/model.npz -t $MRT_DATA/europarl.de-en/corpus.bpe.en -v vocab.en.yml \ --disp-freq 20 --after-batches 100 \ diff --git a/tests/training/models/lm/test_lm.sh b/tests/training/models/lm/test_lm.sh index 91f94d4..f55e860 100644 --- a/tests/training/models/lm/test_lm.sh +++ b/tests/training/models/lm/test_lm.sh @@ -14,7 +14,7 @@ rm -rf lm lm.log mkdir -p lm $MRT_MARIAN/marian \ - --seed 1111 --no-shuffle \ + --seed 1111 --no-shuffle --clip-norm 0 \ --type lm --dim-emb 128 --dim-rnn 256 --cost-type ce-mean \ -m lm/model.npz -t $MRT_DATA/europarl.de-en/corpus.bpe.en -v vocab.en.yml \ --disp-freq 20 --after-batches 100 \ diff --git a/tests/training/models/multi-source/multi-s2s.expected b/tests/training/models/multi-source/multi-s2s.expected index 61608c4..2258c02 100644 --- a/tests/training/models/multi-source/multi-s2s.expected +++ b/tests/training/models/multi-source/multi-s2s.expected @@ -1,5 +1,5 @@ -388.14068604 -279.26577759 -198.44155884 -137.92988586 -75.97171021 +388.15350342 +278.90570068 +197.63183594 +137.78120422 +76.32478333 diff --git a/tests/training/models/multi-source/multi-transformer.expected b/tests/training/models/multi-source/multi-transformer.expected index 35c5e4b..538ed15 100644 --- a/tests/training/models/multi-source/multi-transformer.expected +++ b/tests/training/models/multi-source/multi-transformer.expected @@ -1,5 +1,5 @@ -382.23056030 -264.14666748 -193.33871460 -133.58370972 -71.43719482 +382.69680786 +265.52267456 +196.04469299 +138.10417175 +75.06012726 diff --git a/tests/training/models/multi-source/test_multi-s2s.sh b/tests/training/models/multi-source/test_multi-s2s.sh index a1ceef1..52c3ded 100644 --- a/tests/training/models/multi-source/test_multi-s2s.sh +++ b/tests/training/models/multi-source/test_multi-s2s.sh @@ -14,7 +14,7 @@ rm -rf multi-s2s multi-s2s.log mkdir -p multi-s2s $MRT_MARIAN/marian \ - --seed 1111 --no-shuffle \ + --seed 1111 --no-shuffle --clip-norm 0 \ --type multi-s2s --dim-emb 128 --dim-rnn 256 --cost-type ce-mean \ -m multi-s2s/model.npz -t train.bpe.{en,xx,de} -v vocab.en.yml vocab.xx.yml vocab.de.yml \ --disp-freq 20 --after-batches 100 \ diff --git a/tests/training/models/multi-source/test_multi-transformer.sh b/tests/training/models/multi-source/test_multi-transformer.sh index 425ebdc..e41d918 100644 --- a/tests/training/models/multi-source/test_multi-transformer.sh +++ b/tests/training/models/multi-source/test_multi-transformer.sh @@ -14,7 +14,7 @@ rm -rf multi-transformer multi-transformer.log mkdir -p multi-transformer $MRT_MARIAN/marian \ - --seed 1111 --no-shuffle \ + --seed 1111 --no-shuffle --clip-norm 0 \ --type multi-transformer --dim-emb 128 --dim-rnn 256 --cost-type ce-mean \ -m multi-transformer/model.npz -t train.bpe.{en,xx,de} -v vocab.en.yml vocab.xx.yml vocab.de.yml \ --disp-freq 20 --after-batches 100 \ diff --git a/tests/training/models/transformer/test_transformer.sh b/tests/training/models/transformer/test_transformer.sh index b1ad881..41870a4 100644 --- a/tests/training/models/transformer/test_transformer.sh +++ b/tests/training/models/transformer/test_transformer.sh @@ -7,7 +7,7 @@ set -e rm -rf transformer transformer*.log mkdir -p transformer -opts="--no-shuffle --seed 1111 --mini-batch 32 --maxi-batch 1 --maxi-batch-sort none --optimizer sgd --dim-emb 64 --dim-rnn 128 --cost-type ce-mean" +opts="--no-shuffle --clip-norm 0 --seed 1111 --mini-batch 32 --maxi-batch 1 --maxi-batch-sort none --optimizer sgd --dim-emb 64 --dim-rnn 128 --cost-type ce-mean" $MRT_MARIAN/marian \ --type transformer -m transformer/model.npz -t $MRT_DATA/europarl.de-en/corpus.bpe.{en,de} -v vocab.en.yml vocab.de.yml \ diff --git a/tests/training/models/transformer/transformer.expected b/tests/training/models/transformer/transformer.expected index 50d85ee..28778b1 100644 --- a/tests/training/models/transformer/transformer.expected +++ b/tests/training/models/transformer/transformer.expected @@ -1,10 +1,10 @@ -236.04219055 -260.96929932 -254.12194824 -257.51263428 -253.00631714 -248.38674927 -245.93569946 -240.78047180 -248.01782227 -252.18527222 +226.79606628 +235.31921387 +219.17929077 +216.75386047 +210.01785278 +203.72079468 +198.40823364 +190.92230225 +195.92117310 +199.06428528 |