Welcome to mirror list, hosted at ThFree Co, Russian Federation.

github.com/moses-smt/mosesdecoder.git - Unnamed repository; edit this file 'description' to name the repository.
summary | refs | log | tree | commit | diff
diff options
context:
space:
mode:
author Barry Haddow <barry.haddow@gmail.com> 2019-11-08 18:36:22 +0300
committer Barry Haddow <barry.haddow@gmail.com> 2019-11-08 18:36:22 +0300
commit 74d54b54c32dfebcbdc5f4447ce755e3e0232655 (patch)
tree d31bced34e87d843a0e52866d489055a8e635940
parent 103707002699a1e114a2f45c1ef1c2b20a981964 (diff)
2 letter codes
-rwxr-xr-x scripts/ems/support/split-sentences.perl 4
-rw-r--r-- scripts/share/nonbreaking_prefixes/nonbreaking_prefix.as (renamed from scripts/share/nonbreaking_prefixes/nonbreaking_prefix.asm) 0
-rw-r--r-- scripts/share/nonbreaking_prefixes/nonbreaking_prefix.or (renamed from scripts/share/nonbreaking_prefixes/nonbreaking_prefix.ory) 0
3 files changed, 2 insertions, 2 deletions
diff --git a/scripts/ems/support/split-sentences.perl b/scripts/ems/support/split-sentences.perl
index 38d56e0d6..40de88fdf 100755
--- a/scripts/ems/support/split-sentences.perl
+++ b/scripts/ems/support/split-sentences.perl
@@ -126,10 +126,10 @@ sub preprocess {
my $sentence_start = "\\p{IsUpper}0-9";
$sentence_start .= "\\p{Block: Devanagari}\\p{Block: Devanagari_Extended}" if ($language eq "hi" || $language eq "mr");
$sentence_start .= "\\p{Block: Gujarati}" if $language eq "gu";
- $sentence_start .= "\\p{Block: Bengali}" if ($language eq "asm" || $language eq "bn" || $language eq "mni");
+ $sentence_start .= "\\p{Block: Bengali}" if ($language eq "as" || $language eq "bn" || $language eq "mni");
$sentence_start .= "\\p{Block: Kannada}" if $language eq "kn";
$sentence_start .= "\\p{Block: Malayalam}" if $language eq "ml";
- $sentence_start .= "\\p{Block: Oriya}" if $language eq "ory";
+ $sentence_start .= "\\p{Block: Oriya}" if $language eq "or";
$sentence_start .= "\\p{Block: Gurmukhi}" if $language eq "pa";
$sentence_start .= "\\p{Block: Tamil}" if $language eq "ta";
$sentence_start .= "\\p{Block: Telugu}" if $language eq "te";
diff --git a/scripts/share/nonbreaking_prefixes/nonbreaking_prefix.asm b/scripts/share/nonbreaking_prefixes/nonbreaking_prefix.as
index 866ee158a..866ee158a 100644
--- a/scripts/share/nonbreaking_prefixes/nonbreaking_prefix.asm
+++ b/scripts/share/nonbreaking_prefixes/nonbreaking_prefix.as
diff --git a/scripts/share/nonbreaking_prefixes/nonbreaking_prefix.ory b/scripts/share/nonbreaking_prefixes/nonbreaking_prefix.or
index 8442c0b77..8442c0b77 100644
--- a/scripts/share/nonbreaking_prefixes/nonbreaking_prefix.ory
+++ b/scripts/share/nonbreaking_prefixes/nonbreaking_prefix.or