Welcome to mirror list, hosted at ThFree Co, Russian Federation.

RuleExtractionOptions.h « phrase-extract - github.com/moses-smt/mosesdecoder.git - Unnamed repository; edit this file 'description' to name the repository.
summary | refs | log | tree | commit | diff
blob: b38258470b3ed340f1aa280a5e6a7d98077b62e5 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
/***********************************************************************
  Moses - factored phrase-based language decoder
  Copyright (C) 2010 University of Edinburgh

  This library is free software; you can redistribute it and/or
  modify it under the terms of the GNU Lesser General Public
  License as published by the Free Software Foundation; either
  version 2.1 of the License, or (at your option) any later version.

  This library is distributed in the hope that it will be useful,
  but WITHOUT ANY WARRANTY; without even the implied warranty of
  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
  Lesser General Public License for more details.

  You should have received a copy of the GNU Lesser General Public
  License along with this library; if not, write to the Free Software
  Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA  02110-1301  USA
 ***********************************************************************/

#pragma once
#ifndef RULEEXTRACTIONOPTIONS_H_INCLUDED_
#define RULEEXTRACTIONOPTIONS_H_INCLUDED_

namespace MosesTraining
{

/**
 * Plain bundle of settings for rule extraction.
 *
 * All members are public (struct default access). The default constructor
 * gives every member a value; its initializer list is written in declaration
 * order, which is also the order in which the members are initialized.
 * The default for each member is noted next to its declaration.
 */
struct RuleExtractionOptions {
  // ---- integer settings ----
  int maxSpan;                 // default: 10
  int minHoleSource;           // default: 2
  int minHoleTarget;           // default: 1
  int minWords;                // default: 1
  int maxSymbolsTarget;        // default: 999
  int maxSymbolsSource;        // default: 5
  int maxNonTerm;              // default: 2
  int maxScope;                // default: 999

  // ---- boolean switches ----
  bool onlyDirectFlag;         // default: false
  bool glueGrammarFlag;        // default: false
  bool unknownWordLabelFlag;   // default: false
  bool onlyOutputSpanInfo;     // default: false
  bool noFileLimit;            // default: false
  bool properConditioning;     // default: false
  bool nonTermFirstWord;       // default: true
  bool nonTermConsecTarget;    // default: true
  bool nonTermConsecSource;    // default: false
  bool requireAlignedWord;     // default: true
  bool sourceSyntax;           // default: false
  bool targetSyntax;           // default: false
  bool duplicateRules;         // default: true
  bool fractionalCounting;     // default: true
  bool pcfgScore;              // default: false
  bool gzOutput;               // default: false
  bool unpairedExtractFormat;  // default: false
  bool conditionOnTargetLhs;   // default: false
  bool boundaryRules;          // default: false
  bool flexScoreFlag;          // default: false

  /**
   * Sets every option to its default value.
   *
   * Notes carried over from earlier revisions of this list: minHoleSize(1),
   * minSubPhraseSize(1) (minimum size of a remaining lexical phrase) and
   * zipFiles(false) existed only as commented-out entries; none of them is a
   * member of this struct.
   */
  RuleExtractionOptions() :
    maxSpan(10),
    minHoleSource(2),
    minHoleTarget(1),
    minWords(1),
    maxSymbolsTarget(999),
    maxSymbolsSource(5),
    maxNonTerm(2),
    maxScope(999),
    onlyDirectFlag(false),
    glueGrammarFlag(false),
    unknownWordLabelFlag(false),
    onlyOutputSpanInfo(false),
    noFileLimit(false),
    properConditioning(false),
    nonTermFirstWord(true),
    nonTermConsecTarget(true),
    nonTermConsecSource(false),
    requireAlignedWord(true),
    sourceSyntax(false),
    targetSyntax(false),
    duplicateRules(true),
    fractionalCounting(true),
    pcfgScore(false),
    gzOutput(false),
    unpairedExtractFormat(false),
    conditionOnTargetLhs(false),
    boundaryRules(false),
    flexScoreFlag(false)
  {
  }
};

}

#endif