From a05a7f0099b17f798ddd15ae36d51796b89219d6 Mon Sep 17 00:00:00 2001 From: Roman Grundkiewicz Date: Fri, 13 Nov 2020 09:46:18 -0800 Subject: Use clip-norm 0 in training/cost-functions --- tests/training/cost-functions/ce-mean.expected | 16 ++++++++-------- tests/training/cost-functions/ce-sum.expected | 16 ++++++++-------- tests/training/cost-functions/perplexity.expected | 16 ++++++++-------- tests/training/cost-functions/test_ce-mean-words.sh | 2 +- tests/training/cost-functions/test_ce-mean.sh | 2 +- tests/training/cost-functions/test_ce-sum.sh | 2 +- tests/training/cost-functions/test_perplexity.sh | 2 +- 7 files changed, 28 insertions(+), 28 deletions(-) (limited to 'tests') diff --git a/tests/training/cost-functions/ce-mean.expected b/tests/training/cost-functions/ce-mean.expected index 99dcb2e..d2284ad 100644 --- a/tests/training/cost-functions/ce-mean.expected +++ b/tests/training/cost-functions/ce-mean.expected @@ -1,8 +1,8 @@ -150.17980957 -263.68411255 -100.49322510 -253.63926697 -274.96899414 -145.67076111 -207.88955688 -245.54043579 +150.17977905 +263.68469238 +100.50036621 +253.64115906 +274.95046997 +145.69451904 +207.82330322 +245.20465088 diff --git a/tests/training/cost-functions/ce-sum.expected b/tests/training/cost-functions/ce-sum.expected index 211f95e..bf94e75 100644 --- a/tests/training/cost-functions/ce-sum.expected +++ b/tests/training/cost-functions/ce-sum.expected @@ -1,8 +1,8 @@ -9616.72363281 -16924.73828125 -6485.94677734 -16367.00390625 -17824.65820312 -9517.77148438 -13688.55371094 -16464.12500000 +9611.53320312 +16874.39843750 +6437.13916016 +16230.42187500 +17589.32421875 +9352.28906250 +13412.98730469 +16044.14746094 diff --git a/tests/training/cost-functions/perplexity.expected b/tests/training/cost-functions/perplexity.expected index 454d690..e72030a 100644 --- a/tests/training/cost-functions/perplexity.expected +++ b/tests/training/cost-functions/perplexity.expected @@ -1,8 +1,8 @@ -4855.37011719 -4845.00927734 -4863.23437500 -4840.18750000 -4846.01660156 -4849.56250000 -4848.35107422 -4839.06152344 +4833.17675781 +4724.25634766 +4562.26855469 +4509.33154297 +4332.39013672 +4184.27783203 +4086.94750977 +3897.33496094 diff --git a/tests/training/cost-functions/test_ce-mean-words.sh b/tests/training/cost-functions/test_ce-mean-words.sh index 7c875ff..b9bb8f5 100644 --- a/tests/training/cost-functions/test_ce-mean-words.sh +++ b/tests/training/cost-functions/test_ce-mean-words.sh @@ -14,7 +14,7 @@ rm -rf ce-mean-words ce-mean-words.log mkdir -p ce-mean-words $MRT_MARIAN/marian \ - --cost-type ce-mean-words \ + --cost-type ce-mean-words --clip-norm 0 \ --seed 9999 --sync-sgd \ -m ce-mean-words/model.npz -t $MRT_DATA/train.max50.{en,de} -v vocab.en.yml vocab.de.yml \ --disp-freq 2 --after-epochs 1 \ diff --git a/tests/training/cost-functions/test_ce-mean.sh b/tests/training/cost-functions/test_ce-mean.sh index c4109b1..e1b08d2 100644 --- a/tests/training/cost-functions/test_ce-mean.sh +++ b/tests/training/cost-functions/test_ce-mean.sh @@ -14,7 +14,7 @@ rm -rf ce-mean ce-mean.log mkdir -p ce-mean $MRT_MARIAN/marian \ - --cost-type ce-mean \ + --cost-type ce-mean --clip-norm 0 \ --seed 9999 --sync-sgd \ -m ce-mean/model.npz -t $MRT_DATA/train.max50.{en,de} -v vocab.en.yml vocab.de.yml \ --disp-freq 2 --after-epochs 1 \ diff --git a/tests/training/cost-functions/test_ce-sum.sh b/tests/training/cost-functions/test_ce-sum.sh index f22f137..a3cfb04 100644 --- a/tests/training/cost-functions/test_ce-sum.sh +++ b/tests/training/cost-functions/test_ce-sum.sh @@ -14,7 +14,7 @@ rm -rf ce-sum ce-sum.log mkdir -p ce-sum $MRT_MARIAN/marian \ - --cost-type ce-sum --disp-label-counts false \ + --cost-type ce-sum --disp-label-counts false --clip-norm 0 \ --seed 9999 --optimizer sgd --sync-sgd \ -m ce-sum/model.npz -t $MRT_DATA/train.max50.{en,de} -v vocab.en.yml vocab.de.yml \ --disp-freq 2 --after-epochs 1 \ diff --git a/tests/training/cost-functions/test_perplexity.sh b/tests/training/cost-functions/test_perplexity.sh index 7a790fd..83dfb36 100644 --- a/tests/training/cost-functions/test_perplexity.sh +++ b/tests/training/cost-functions/test_perplexity.sh @@ -14,7 +14,7 @@ rm -rf perplexity perplexity.log mkdir -p perplexity $MRT_MARIAN/marian \ - --cost-type perplexity \ + --cost-type perplexity --clip-norm 0 \ --seed 9999 --optimizer sgd --sync-sgd \ -m perplexity/model.npz -t $MRT_DATA/train.max50.{en,de} -v vocab.en.yml vocab.de.yml \ --disp-freq 2 --after-epochs 1 \ -- cgit v1.2.3