Welcome to mirror list, hosted at ThFree Co, Russian Federation.

test_templated_valid_translation_output.sh « validation « training « tests - github.com/marian-nmt/marian-regression-tests.git - Unnamed repository; edit this file 'description' to name the repository.
summaryrefslogtreecommitdiff
blob: 2f4204c70c36ab4912f24c8669506d76cdc093f1 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
#!/bin/bash

#####################################################################
# SUMMARY: Templated file names for translation outputs
# AUTHOR: snukky
#####################################################################

# Runs a short Marian training (--after-batches 150, --valid-freq 40) with
# the 'translation' validation metric and checks that every validation run
# wrote a non-empty output file whose name was built from the
# --valid-translation-output template.
#
# Required environment:
#   MRT_MARIAN  directory containing the 'marian' binary
#   MRT_DATA    directory containing europarl.de-en/corpus.bpe.{en,de}
#
# valid.bpe.en and valid.bpe.de are read from the current directory and are
# not created here (presumably they are shipped next to this test).

# Trace commands. Enabled here rather than in the shebang so that tracing
# also works when the script is started as 'bash <script>'.
set -x

# Exit on error and on use of an unset variable
set -eu

# Fail early with a clear message instead of trying to run '/marian'
: "${MRT_MARIAN:?MRT_MARIAN must point to the directory with the marian binary}"
: "${MRT_DATA:?MRT_DATA must point to the regression test data directory}"

# Remove temporary files
rm -rf -- template_translation template_translation.log vocab.small.*.yml valid-translation-output-*.out
mkdir -p template_translation

# Prepare training data if it doesn't exist.
# A file is regenerated when it is missing OR empty, and a partially written
# file is removed on failure, so that an aborted run cannot leave behind an
# empty corpus that later runs would silently reuse.
for lang in en de; do
    if [[ ! -s "train.bpe.${lang}" ]]; then
        if ! head -n 3000 "${MRT_DATA}/europarl.de-en/corpus.bpe.${lang}" > "train.bpe.${lang}"; then
            rm -f -- "train.bpe.${lang}"
            echo "Cannot prepare train.bpe.${lang} from ${MRT_DATA}" >&2
            exit 1
        fi
    fi
done


# Run Marian using --valid-translation-output with templates.
# The template is quoted so that {E}, {B}, {U} and {T} reach Marian
# literally; train.bpe.{en,de} and valid.bpe.{en,de} are intentionally left
# unquoted so that Bash expands them into two file names each.
"${MRT_MARIAN}/marian" \
    --no-shuffle --seed 2222 --optimizer sgd --dim-emb 64 --dim-rnn 128 \
    -m template_translation/model.npz -t train.bpe.{en,de} \
    -v vocab.small.en.yml vocab.small.de.yml \
    --mini-batch 32 --disp-freq 20 --valid-freq 40 --after-batches 150 \
    --valid-sets valid.bpe.{en,de} \
    --valid-metrics translation \
    --valid-translation-output 'valid-translation-output-epoch-{E}-batch-{B}-updates-{U}-tokens-{T}.out' \
    --valid-log template_translation.log

test -e template_translation.log

# Check if validation outputs have expected names.
# One non-empty file is expected per validation run (updates 40, 80, 120);
# the epoch, batch and token numbers are fixed by the seed and the data.
expected_outputs=(
    valid-translation-output-epoch-1-batch-40-updates-40-tokens-41764.out
    valid-translation-output-epoch-1-batch-80-updates-80-tokens-60798.out
    valid-translation-output-epoch-2-batch-39-updates-120-tokens-101878.out
)
for output in "${expected_outputs[@]}"; do
    if [[ ! -s "${output}" ]]; then
        echo "Missing or empty validation output: ${output}" >&2
        exit 1
    fi
done


# Exit with success code
exit 0