diff options
author | bgottesman <bgottesman@1f5c12ca-751b-0410-a591-d2e778427230> | 2011-08-08 17:21:05 +0400 |
---|---|---|
committer | bgottesman <bgottesman@1f5c12ca-751b-0410-a591-d2e778427230> | 2011-08-08 17:21:05 +0400 |
commit | 9d9977bc6f8e52c9c3a0ea20fa15eede98661de2 (patch) | |
tree | 91acda0e6ff1ec9631f103841389b6bdecb76058 /regression-testing | |
parent | c030dae094632972ea1d69c03735d10a57f2c1e9 (diff) |
add TODO tests for detokenization of Chinese and Japanese
git-svn-id: https://mosesdecoder.svn.sourceforge.net/svnroot/mosesdecoder/trunk@4131 1f5c12ca-751b-0410-a591-d2e778427230
Diffstat (limited to 'regression-testing')
-rw-r--r-- | regression-testing/run-test-detokenizer.t | 39 |
1 file changed, 37 insertions, 2 deletions
diff --git a/regression-testing/run-test-detokenizer.t b/regression-testing/run-test-detokenizer.t index aaea9c768..f9cc3423a 100644 --- a/regression-testing/run-test-detokenizer.t +++ b/regression-testing/run-test-detokenizer.t @@ -112,6 +112,41 @@ Frau Präsidentin! Frau Díez González und ich hatten einige Anfragen EXP ); +# A (failing) simple Chinese test +{ +my $testCase = +&addDetokenizerTest("TEST_CHINESE_EASY", undef, +<<'TOK' +这 是 一个 简单 的的 汉语 句子 。 +TOK +, +<<'EXP' +这是一个简单的的汉语句子。 +EXP +); + +$testCase->setExpectedToFail("Chinese detokenization is not implemented yet."); +} + +# A (failing) simple Japanese test +{ +my $testCase = +&addDetokenizerTest("TEST_JAPANESE_EASY", undef, +<<'TOK' +どう しょ う か な 。 +どこ で 食べ たい 。 +TOK +, +<<'EXP' +どうしょうかな。 +どこで食べたい。 +EXP +); + +$testCase->setExpectedToFail("Japanese detokenization is not implemented yet."); +} + + ###################################### # Now run those babies ... ###################################### @@ -159,7 +194,7 @@ sub runDetokenizerTest { close TRUTH; &runTest($testCase->getName(), $testOutputDir, $tokenizedFile, sub { - return defined($testCase->getLanguage())? [$detokenizer, "-l", $testCase->getLanguage()] : [$detokenizer]; + return defined($testCase->getLanguage()) ? [$detokenizer, "-l", $testCase->getLanguage()] : [$detokenizer]; }, sub { &verifyIdentical($testCase->getName(), $expectedFile, catfile($testOutputDir, "stdout.txt")) }, 1, $testCase->getFailureExplanation()); @@ -250,7 +285,7 @@ sub new { _name => shift, _language => shift, _tokenizedText => shift, - _rightAnswer => shift, + _rightAnswer => shift, _failureExplanation => undef }; |