Welcome to mirror list, hosted at ThFree Co, Russian Federation.

github.com/moses-smt/mosesdecoder.git - Unnamed repository; edit this file 'description' to name the repository.
summary | refs | log | tree | commit | diff
diff options
context:
space:
mode:
author: Barry Haddow <barry.haddow@gmail.com> 2019-11-08 18:36:22 +0300
committer: Barry Haddow <barry.haddow@gmail.com> 2019-11-08 18:36:22 +0300
commit: 74d54b54c32dfebcbdc5f4447ce755e3e0232655 (patch)
tree: d31bced34e87d843a0e52866d489055a8e635940 /scripts/ems/support
parent: 103707002699a1e114a2f45c1ef1c2b20a981964 (diff)
2 letter codes
Diffstat (limited to 'scripts/ems/support')
-rwxr-xr-x scripts/ems/support/split-sentences.perl 4
1 file changed, 2 insertions, 2 deletions
diff --git a/scripts/ems/support/split-sentences.perl b/scripts/ems/support/split-sentences.perl
index 38d56e0d6..40de88fdf 100755
--- a/scripts/ems/support/split-sentences.perl
+++ b/scripts/ems/support/split-sentences.perl
@@ -126,10 +126,10 @@ sub preprocess {
my $sentence_start = "\\p{IsUpper}0-9";
$sentence_start .= "\\p{Block: Devanagari}\\p{Block: Devanagari_Extended}" if ($language eq "hi" || $language eq "mr");
$sentence_start .= "\\p{Block: Gujarati}" if $language eq "gu";
- $sentence_start .= "\\p{Block: Bengali}" if ($language eq "asm" || $language eq "bn" || $language eq "mni");
+ $sentence_start .= "\\p{Block: Bengali}" if ($language eq "as" || $language eq "bn" || $language eq "mni");
$sentence_start .= "\\p{Block: Kannada}" if $language eq "kn";
$sentence_start .= "\\p{Block: Malayalam}" if $language eq "ml";
- $sentence_start .= "\\p{Block: Oriya}" if $language eq "ory";
+ $sentence_start .= "\\p{Block: Oriya}" if $language eq "or";
$sentence_start .= "\\p{Block: Gurmukhi}" if $language eq "pa";
$sentence_start .= "\\p{Block: Tamil}" if $language eq "ta";
$sentence_start .= "\\p{Block: Telugu}" if $language eq "te";