Welcome to mirror list, hosted at ThFree Co, Russian Federation.

github.com/moses-smt/mosesdecoder.git - Unnamed repository; edit this file 'description' to name the repository.
summary | refs | log | tree | commit | diff
diff options
context:
space:
mode:
author: bgottesman <bgottesman@1f5c12ca-751b-0410-a591-d2e778427230> 2011-08-08 17:21:05 +0400
committer: bgottesman <bgottesman@1f5c12ca-751b-0410-a591-d2e778427230> 2011-08-08 17:21:05 +0400
commit: 9d9977bc6f8e52c9c3a0ea20fa15eede98661de2 (patch)
tree: 91acda0e6ff1ec9631f103841389b6bdecb76058 /regression-testing
parent: c030dae094632972ea1d69c03735d10a57f2c1e9 (diff)
add TODO tests for detokenization of Chinese and Japanese
git-svn-id: https://mosesdecoder.svn.sourceforge.net/svnroot/mosesdecoder/trunk@4131 1f5c12ca-751b-0410-a591-d2e778427230
Diffstat (limited to 'regression-testing')
-rw-r--r-- regression-testing/run-test-detokenizer.t | 39
1 files changed, 37 insertions, 2 deletions
diff --git a/regression-testing/run-test-detokenizer.t b/regression-testing/run-test-detokenizer.t
index aaea9c768..f9cc3423a 100644
--- a/regression-testing/run-test-detokenizer.t
+++ b/regression-testing/run-test-detokenizer.t
@@ -112,6 +112,41 @@ Frau Präsidentin! Frau Díez González und ich hatten einige Anfragen
EXP
);
+# A (failing) simple Chinese test
+{
+my $testCase =
+&addDetokenizerTest("TEST_CHINESE_EASY", undef,
+<<'TOK'
+这 是 一个 简单 的的 汉语 句子 。
+TOK
+,
+<<'EXP'
+这是一个简单的的汉语句子。
+EXP
+);
+
+$testCase->setExpectedToFail("Chinese detokenization is not implemented yet.");
+}
+
+# A (failing) simple Japanese test
+{
+my $testCase =
+&addDetokenizerTest("TEST_JAPANESE_EASY", undef,
+<<'TOK'
+どう しょ う か な 。
+どこ で 食べ たい 。
+TOK
+,
+<<'EXP'
+どうしょうかな。
+どこで食べたい。
+EXP
+);
+
+$testCase->setExpectedToFail("Japanese detokenization is not implemented yet.");
+}
+
+
######################################
# Now run those babies ...
######################################
@@ -159,7 +194,7 @@ sub runDetokenizerTest {
close TRUTH;
&runTest($testCase->getName(), $testOutputDir, $tokenizedFile, sub {
- return defined($testCase->getLanguage())? [$detokenizer, "-l", $testCase->getLanguage()] : [$detokenizer];
+ return defined($testCase->getLanguage()) ? [$detokenizer, "-l", $testCase->getLanguage()] : [$detokenizer];
}, sub {
&verifyIdentical($testCase->getName(), $expectedFile, catfile($testOutputDir, "stdout.txt"))
}, 1, $testCase->getFailureExplanation());
@@ -250,7 +285,7 @@ sub new {
_name => shift,
_language => shift,
_tokenizedText => shift,
- _rightAnswer => shift,
+ _rightAnswer => shift,
_failureExplanation => undef
};