Welcome to mirror list, hosted at ThFree Co, Russian Federation.

github.com/moses-smt/mosesdecoder.git - Unnamed repository; edit this file 'description' to name the repository.
summary | refs | log | tree | commit | diff
diff options
context:
space:
mode:
Diffstat (limited to 'scripts/training/wrappers')
-rwxr-xr-x scripts/training/wrappers/adam-suffix-array/suffix-array-create.sh 3
-rwxr-xr-x scripts/training/wrappers/adam-suffix-array/suffix-array-extract.sh 3
-rwxr-xr-x scripts/training/wrappers/berkeleyparsed2mosesxml.perl 3
-rwxr-xr-x scripts/training/wrappers/berkeleyparsed2mosesxml_PTB.perl 3
-rwxr-xr-x scripts/training/wrappers/conll2mosesxml.py 3
-rwxr-xr-x scripts/training/wrappers/filter-excluded-lines.perl 3
-rwxr-xr-x scripts/training/wrappers/find-unparseable.perl 3
-rwxr-xr-x scripts/training/wrappers/mada-wrapper.perl 3
-rwxr-xr-x scripts/training/wrappers/madamira-tok.perl 3
-rwxr-xr-x scripts/training/wrappers/madamira-wrapper.perl 3
-rwxr-xr-x scripts/training/wrappers/make-factor-brown-cluster-mkcls.perl 3
-rwxr-xr-x scripts/training/wrappers/make-factor-de-lemma.perl 3
-rwxr-xr-x scripts/training/wrappers/make-factor-de-morph.perl 3
-rwxr-xr-x scripts/training/wrappers/make-factor-de-pos.perl 3
-rwxr-xr-x scripts/training/wrappers/make-factor-en-porter.perl 3
-rwxr-xr-x scripts/training/wrappers/make-factor-en-pos.mxpost.perl 3
-rwxr-xr-x scripts/training/wrappers/make-factor-pos.tree-tagger.perl 3
-rwxr-xr-x scripts/training/wrappers/make-factor-stem.perl 3
-rwxr-xr-x scripts/training/wrappers/make-factor-suffix.perl 3
-rwxr-xr-x scripts/training/wrappers/morfessor-wrapper.perl 3
-rwxr-xr-x scripts/training/wrappers/mosesxml2berkeleyparsed.perl 3
-rwxr-xr-x scripts/training/wrappers/mosesxml2brackets.py 5
-rwxr-xr-x scripts/training/wrappers/parse-de-berkeley.perl 3
-rwxr-xr-x scripts/training/wrappers/parse-de-bitpar.perl 3
-rwxr-xr-x scripts/training/wrappers/parse-en-collins.perl 3
-rwxr-xr-x scripts/training/wrappers/parse-en-egret.perl 3
-rwxr-xr-x scripts/training/wrappers/parse-en-senna.perl 3
-rwxr-xr-x scripts/training/wrappers/parse-en-stanford.py 12
-rwxr-xr-x scripts/training/wrappers/senna2brackets.py 33
-rwxr-xr-x scripts/training/wrappers/syntax-hyphen-splitting.perl 3
-rwxr-xr-x scripts/training/wrappers/tagger-german-chunk.perl 3
31 files changed, 116 insertions, 18 deletions
diff --git a/scripts/training/wrappers/adam-suffix-array/suffix-array-create.sh b/scripts/training/wrappers/adam-suffix-array/suffix-array-create.sh
index 238a53349..5db5e9aa9 100755
--- a/scripts/training/wrappers/adam-suffix-array/suffix-array-create.sh
+++ b/scripts/training/wrappers/adam-suffix-array/suffix-array-create.sh
@@ -1,4 +1,7 @@
#!/bin/bash
+#
+# This file is part of moses. Its use is licensed under the GNU Lesser General
+# Public License version 2.1 or, at your option, any later version.
# execute: ~/workspace/bin/moses-smt/scripts/training/wrappers/suffix-array-create.sh $SA_EXEC_DIR $SOURCE_CORPUS $TARGET_CORPUS $ALIGNMENT $SA_OUTPUT
diff --git a/scripts/training/wrappers/adam-suffix-array/suffix-array-extract.sh b/scripts/training/wrappers/adam-suffix-array/suffix-array-extract.sh
index 8c255b1b6..128ccaa9e 100755
--- a/scripts/training/wrappers/adam-suffix-array/suffix-array-extract.sh
+++ b/scripts/training/wrappers/adam-suffix-array/suffix-array-extract.sh
@@ -1,4 +1,7 @@
#!/bin/bash
+#
+# This file is part of moses. Its use is licensed under the GNU Lesser General
+# Public License version 2.1 or, at your option, any later version.
# execute: ~/workspace/bin/moses-smt/scripts/training/wrappers/adam-suffix-array/suffix-array-extract.sh $SA_EXEC_DIR $MODEL_DIR $INPUT_FILE $OUTPUT_DIR
diff --git a/scripts/training/wrappers/berkeleyparsed2mosesxml.perl b/scripts/training/wrappers/berkeleyparsed2mosesxml.perl
index 232cfefab..9c376200c 100755
--- a/scripts/training/wrappers/berkeleyparsed2mosesxml.perl
+++ b/scripts/training/wrappers/berkeleyparsed2mosesxml.perl
@@ -1,4 +1,7 @@
#!/usr/bin/env perl
+#
+# This file is part of moses. Its use is licensed under the GNU Lesser General
+# Public License version 2.1 or, at your option, any later version.
use warnings;
use strict;
diff --git a/scripts/training/wrappers/berkeleyparsed2mosesxml_PTB.perl b/scripts/training/wrappers/berkeleyparsed2mosesxml_PTB.perl
index 9e8c30d42..b8ba146c9 100755
--- a/scripts/training/wrappers/berkeleyparsed2mosesxml_PTB.perl
+++ b/scripts/training/wrappers/berkeleyparsed2mosesxml_PTB.perl
@@ -1,4 +1,7 @@
#!/usr/bin/env perl
+#
+# This file is part of moses. Its use is licensed under the GNU Lesser General
+# Public License version 2.1 or, at your option, any later version.
use warnings;
use strict;
diff --git a/scripts/training/wrappers/conll2mosesxml.py b/scripts/training/wrappers/conll2mosesxml.py
index 761037488..6473166d9 100755
--- a/scripts/training/wrappers/conll2mosesxml.py
+++ b/scripts/training/wrappers/conll2mosesxml.py
@@ -1,6 +1,9 @@
#!/usr/bin/env python
# -*- coding: utf-8 -*-
# Author: Rico Sennrich
+#
+# This file is part of moses. Its use is licensed under the GNU Lesser General
+# Public License version 2.1 or, at your option, any later version.
"""
Takes a file in the CoNLL dependency format (from the CoNLL-X shared task on
diff --git a/scripts/training/wrappers/filter-excluded-lines.perl b/scripts/training/wrappers/filter-excluded-lines.perl
index dff104dba..508ab8a06 100755
--- a/scripts/training/wrappers/filter-excluded-lines.perl
+++ b/scripts/training/wrappers/filter-excluded-lines.perl
@@ -1,4 +1,7 @@
#!/usr/bin/env perl
+#
+# This file is part of moses. Its use is licensed under the GNU Lesser General
+# Public License version 2.1 or, at your option, any later version.
use warnings;
use strict;
diff --git a/scripts/training/wrappers/find-unparseable.perl b/scripts/training/wrappers/find-unparseable.perl
index 00009e2e9..fd0664f1d 100755
--- a/scripts/training/wrappers/find-unparseable.perl
+++ b/scripts/training/wrappers/find-unparseable.perl
@@ -1,4 +1,7 @@
#!/usr/bin/env perl
+#
+# This file is part of moses. Its use is licensed under the GNU Lesser General
+# Public License version 2.1 or, at your option, any later version.
use warnings;
use strict;
diff --git a/scripts/training/wrappers/mada-wrapper.perl b/scripts/training/wrappers/mada-wrapper.perl
index f2cf14f40..d4124e34c 100755
--- a/scripts/training/wrappers/mada-wrapper.perl
+++ b/scripts/training/wrappers/mada-wrapper.perl
@@ -1,4 +1,7 @@
#!/usr/bin/env perl
+#
+# This file is part of moses. Its use is licensed under the GNU Lesser General
+# Public License version 2.1 or, at your option, any later version.
use warnings;
use strict;
diff --git a/scripts/training/wrappers/madamira-tok.perl b/scripts/training/wrappers/madamira-tok.perl
index 37e70079e..e9f19d53a 100755
--- a/scripts/training/wrappers/madamira-tok.perl
+++ b/scripts/training/wrappers/madamira-tok.perl
@@ -1,4 +1,7 @@
#!/usr/bin/env perl
+#
+# This file is part of moses. Its use is licensed under the GNU Lesser General
+# Public License version 2.1 or, at your option, any later version.
use warnings;
use strict;
diff --git a/scripts/training/wrappers/madamira-wrapper.perl b/scripts/training/wrappers/madamira-wrapper.perl
index 6535b6187..05ec44d7d 100755
--- a/scripts/training/wrappers/madamira-wrapper.perl
+++ b/scripts/training/wrappers/madamira-wrapper.perl
@@ -1,4 +1,7 @@
#!/usr/bin/env perl
+#
+# This file is part of moses. Its use is licensed under the GNU Lesser General
+# Public License version 2.1 or, at your option, any later version.
use warnings;
use strict;
diff --git a/scripts/training/wrappers/make-factor-brown-cluster-mkcls.perl b/scripts/training/wrappers/make-factor-brown-cluster-mkcls.perl
index 1e3a1ce3f..a8ce5f24e 100755
--- a/scripts/training/wrappers/make-factor-brown-cluster-mkcls.perl
+++ b/scripts/training/wrappers/make-factor-brown-cluster-mkcls.perl
@@ -1,4 +1,7 @@
#!/usr/bin/env perl
+#
+# This file is part of moses. Its use is licensed under the GNU Lesser General
+# Public License version 2.1 or, at your option, any later version.
use warnings;
use strict;
diff --git a/scripts/training/wrappers/make-factor-de-lemma.perl b/scripts/training/wrappers/make-factor-de-lemma.perl
index db978317e..0b93002a9 100755
--- a/scripts/training/wrappers/make-factor-de-lemma.perl
+++ b/scripts/training/wrappers/make-factor-de-lemma.perl
@@ -1,4 +1,7 @@
#!/usr/bin/perl -w
+#
+# This file is part of moses. Its use is licensed under the GNU Lesser General
+# Public License version 2.1 or, at your option, any later version.
use strict;
use Encode;
diff --git a/scripts/training/wrappers/make-factor-de-morph.perl b/scripts/training/wrappers/make-factor-de-morph.perl
index 366a5a76d..d09196745 100755
--- a/scripts/training/wrappers/make-factor-de-morph.perl
+++ b/scripts/training/wrappers/make-factor-de-morph.perl
@@ -1,4 +1,7 @@
#!/usr/bin/env perl
+#
+# This file is part of moses. Its use is licensed under the GNU Lesser General
+# Public License version 2.1 or, at your option, any later version.
use warnings;
use strict;
diff --git a/scripts/training/wrappers/make-factor-de-pos.perl b/scripts/training/wrappers/make-factor-de-pos.perl
index 495517352..585323bd4 100755
--- a/scripts/training/wrappers/make-factor-de-pos.perl
+++ b/scripts/training/wrappers/make-factor-de-pos.perl
@@ -1,4 +1,7 @@
#!/usr/bin/env perl
+#
+# This file is part of moses. Its use is licensed under the GNU Lesser General
+# Public License version 2.1 or, at your option, any later version.
use warnings;
use strict;
diff --git a/scripts/training/wrappers/make-factor-en-porter.perl b/scripts/training/wrappers/make-factor-en-porter.perl
index 749dc1318..7ae5fd0b3 100755
--- a/scripts/training/wrappers/make-factor-en-porter.perl
+++ b/scripts/training/wrappers/make-factor-en-porter.perl
@@ -1,4 +1,7 @@
#!/usr/bin/perl -w
+#
+# This file is part of moses. Its use is licensed under the GNU Lesser General
+# Public License version 2.1 or, at your option, any later version.
use strict;
use FindBin qw($RealBin);
diff --git a/scripts/training/wrappers/make-factor-en-pos.mxpost.perl b/scripts/training/wrappers/make-factor-en-pos.mxpost.perl
index 4aa66bac6..2bff8e329 100755
--- a/scripts/training/wrappers/make-factor-en-pos.mxpost.perl
+++ b/scripts/training/wrappers/make-factor-en-pos.mxpost.perl
@@ -1,4 +1,7 @@
#!/usr/bin/env perl
+#
+# This file is part of moses. Its use is licensed under the GNU Lesser General
+# Public License version 2.1 or, at your option, any later version.
use warnings;
use strict;
diff --git a/scripts/training/wrappers/make-factor-pos.tree-tagger.perl b/scripts/training/wrappers/make-factor-pos.tree-tagger.perl
index 0ad04d4de..1e8ccd0ee 100755
--- a/scripts/training/wrappers/make-factor-pos.tree-tagger.perl
+++ b/scripts/training/wrappers/make-factor-pos.tree-tagger.perl
@@ -1,4 +1,7 @@
#!/usr/bin/env perl
+#
+# This file is part of moses. Its use is licensed under the GNU Lesser General
+# Public License version 2.1 or, at your option, any later version.
use warnings;
use strict;
diff --git a/scripts/training/wrappers/make-factor-stem.perl b/scripts/training/wrappers/make-factor-stem.perl
index 662f1d882..9bde7648f 100755
--- a/scripts/training/wrappers/make-factor-stem.perl
+++ b/scripts/training/wrappers/make-factor-stem.perl
@@ -1,4 +1,7 @@
#!/usr/bin/env perl
+#
+# This file is part of moses. Its use is licensed under the GNU Lesser General
+# Public License version 2.1 or, at your option, any later version.
use warnings;
use strict;
diff --git a/scripts/training/wrappers/make-factor-suffix.perl b/scripts/training/wrappers/make-factor-suffix.perl
index 6a59254e4..015df3874 100755
--- a/scripts/training/wrappers/make-factor-suffix.perl
+++ b/scripts/training/wrappers/make-factor-suffix.perl
@@ -1,4 +1,7 @@
#!/usr/bin/env perl
+#
+# This file is part of moses. Its use is licensed under the GNU Lesser General
+# Public License version 2.1 or, at your option, any later version.
use warnings;
use strict;
diff --git a/scripts/training/wrappers/morfessor-wrapper.perl b/scripts/training/wrappers/morfessor-wrapper.perl
index c65a2cebc..0269045a0 100755
--- a/scripts/training/wrappers/morfessor-wrapper.perl
+++ b/scripts/training/wrappers/morfessor-wrapper.perl
@@ -1,4 +1,7 @@
#!/usr/bin/env perl
+#
+# This file is part of moses. Its use is licensed under the GNU Lesser General
+# Public License version 2.1 or, at your option, any later version.
use warnings;
use strict;
diff --git a/scripts/training/wrappers/mosesxml2berkeleyparsed.perl b/scripts/training/wrappers/mosesxml2berkeleyparsed.perl
index e929658ff..02bc7b88e 100755
--- a/scripts/training/wrappers/mosesxml2berkeleyparsed.perl
+++ b/scripts/training/wrappers/mosesxml2berkeleyparsed.perl
@@ -1,4 +1,7 @@
#!/usr/bin/env perl
+#
+# This file is part of moses. Its use is licensed under the GNU Lesser General
+# Public License version 2.1 or, at your option, any later version.
use warnings;
use strict;
diff --git a/scripts/training/wrappers/mosesxml2brackets.py b/scripts/training/wrappers/mosesxml2brackets.py
index 6ff1d20c9..6b90aa256 100755
--- a/scripts/training/wrappers/mosesxml2brackets.py
+++ b/scripts/training/wrappers/mosesxml2brackets.py
@@ -1,8 +1,11 @@
#!/usr/bin/env python
# -*- coding: utf-8 -*-
# Author: Rico Sennrich
+#
+# This file is part of moses. Its use is licensed under the GNU Lesser General
+# Public License version 2.1 or, at your option, any later version.
-# convert trees in moses XML format to PTB-style bracketed format
+"""Convert trees in moses XML format to PTB-style bracketed format."""
from __future__ import print_function, unicode_literals
import sys
diff --git a/scripts/training/wrappers/parse-de-berkeley.perl b/scripts/training/wrappers/parse-de-berkeley.perl
index 596fb3eff..f605a37ae 100755
--- a/scripts/training/wrappers/parse-de-berkeley.perl
+++ b/scripts/training/wrappers/parse-de-berkeley.perl
@@ -1,4 +1,7 @@
#!/usr/bin/env perl
+#
+# This file is part of moses. Its use is licensed under the GNU Lesser General
+# Public License version 2.1 or, at your option, any later version.
use warnings;
use strict;
diff --git a/scripts/training/wrappers/parse-de-bitpar.perl b/scripts/training/wrappers/parse-de-bitpar.perl
index 1bbcf5329..0d5346058 100755
--- a/scripts/training/wrappers/parse-de-bitpar.perl
+++ b/scripts/training/wrappers/parse-de-bitpar.perl
@@ -1,4 +1,7 @@
#!/usr/bin/env perl
+#
+# This file is part of moses. Its use is licensed under the GNU Lesser General
+# Public License version 2.1 or, at your option, any later version.
use warnings;
use strict;
diff --git a/scripts/training/wrappers/parse-en-collins.perl b/scripts/training/wrappers/parse-en-collins.perl
index 252d3d2b7..c9a960912 100755
--- a/scripts/training/wrappers/parse-en-collins.perl
+++ b/scripts/training/wrappers/parse-en-collins.perl
@@ -1,4 +1,7 @@
#!/usr/bin/env perl
+#
+# This file is part of moses. Its use is licensed under the GNU Lesser General
+# Public License version 2.1 or, at your option, any later version.
use warnings;
use strict;
diff --git a/scripts/training/wrappers/parse-en-egret.perl b/scripts/training/wrappers/parse-en-egret.perl
index 9f434063b..e97bc1ae0 100755
--- a/scripts/training/wrappers/parse-en-egret.perl
+++ b/scripts/training/wrappers/parse-en-egret.perl
@@ -1,4 +1,7 @@
#!/usr/bin/env perl
+#
+# This file is part of moses. Its use is licensed under the GNU Lesser General
+# Public License version 2.1 or, at your option, any later version.
use warnings;
use strict;
diff --git a/scripts/training/wrappers/parse-en-senna.perl b/scripts/training/wrappers/parse-en-senna.perl
index f271633ea..2df46284b 100755
--- a/scripts/training/wrappers/parse-en-senna.perl
+++ b/scripts/training/wrappers/parse-en-senna.perl
@@ -1,4 +1,7 @@
#!/usr/bin/env perl
+#
+# This file is part of moses. Its use is licensed under the GNU Lesser General
+# Public License version 2.1 or, at your option, any later version.
use strict;
use warnings;
diff --git a/scripts/training/wrappers/parse-en-stanford.py b/scripts/training/wrappers/parse-en-stanford.py
index 7d8be4bcf..06b027e55 100755
--- a/scripts/training/wrappers/parse-en-stanford.py
+++ b/scripts/training/wrappers/parse-en-stanford.py
@@ -1,11 +1,17 @@
#!/usr/bin/python
# -*- coding: utf-8 -*-
# Author: Rico Sennrich
+#
+# This file is part of moses. Its use is licensed under the GNU Lesser General
+# Public License version 2.1 or, at your option, any later version.
-# (hacky) wrapper around Stanford CoreNLP to produce CoNLL dependency format.
-# assumes tokenized and sentence-split text.
+"""
+(Hacky) wrapper around Stanford CoreNLP to produce CoNLL dependency format.
+Assumes tokenized and sentence-split text.
-# to get Moses XML format, first projectivize the trees, then use conll2mosesxml.py.
+To get Moses XML format, first projectivize the trees, then use
+conll2mosesxml.py.
+"""
from __future__ import print_function, unicode_literals
import os
diff --git a/scripts/training/wrappers/senna2brackets.py b/scripts/training/wrappers/senna2brackets.py
index 4fc71ed44..a81100277 100755
--- a/scripts/training/wrappers/senna2brackets.py
+++ b/scripts/training/wrappers/senna2brackets.py
@@ -1,19 +1,24 @@
#!/usr/bin/env python
-
-# Read SENNA output (from stdin), extract the parse trees, and write them in
-# PTB-style bracketed format (to stdout).
-#
-# The SENNA output is assumed to contain tokens in the first column, POS tags
-# in the second column, and PSG fragments in the final column.
-#
-# It is also assumed that SENNA was run through the parse-en-senna.perl wrapper,
-# which:
#
-# - Substitutes the special "SENTENCE_TOO_LONG" token for sentences that
-# exceed SENNA's hardcoded limit.
-#
-# - Replaces the bracket-like tokens "-LRB-", "-RRB-", etc. with "(", ")",
-# etc.
+# This file is part of moses. Its use is licensed under the GNU Lesser General
+# Public License version 2.1 or, at your option, any later version.
+
+"""
+Read SENNA output (from stdin), extract the parse trees, and write them in
+PTB-style bracketed format (to stdout).
+
+The SENNA output is assumed to contain tokens in the first column, POS tags
+in the second column, and PSG fragments in the final column.
+
+It is also assumed that SENNA was run through the parse-en-senna.perl wrapper,
+which:
+
+ - Substitutes the special "SENTENCE_TOO_LONG" token for sentences that
+ exceed SENNA's hardcoded limit.
+
+ - Replaces the bracket-like tokens "-LRB-", "-RRB-", etc. with "(", ")",
+ etc.
+"""
import optparse
import os
diff --git a/scripts/training/wrappers/syntax-hyphen-splitting.perl b/scripts/training/wrappers/syntax-hyphen-splitting.perl
index 653b410d0..1a260df10 100755
--- a/scripts/training/wrappers/syntax-hyphen-splitting.perl
+++ b/scripts/training/wrappers/syntax-hyphen-splitting.perl
@@ -1,4 +1,7 @@
#!/usr/bin/env perl
+#
+# This file is part of moses. Its use is licensed under the GNU Lesser General
+# Public License version 2.1 or, at your option, any later version.
use warnings;
use strict;
diff --git a/scripts/training/wrappers/tagger-german-chunk.perl b/scripts/training/wrappers/tagger-german-chunk.perl
index c57031889..0b707a579 100755
--- a/scripts/training/wrappers/tagger-german-chunk.perl
+++ b/scripts/training/wrappers/tagger-german-chunk.perl
@@ -1,4 +1,7 @@
#!/usr/bin/env perl
+#
+# This file is part of moses. Its use is licensed under the GNU Lesser General
+# Public License version 2.1 or, at your option, any later version.
use warnings;
use strict;