|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
#pragma once |
|
|
|
namespace MosesTraining |
|
{ |
|
|
|
/**
 * @brief Plain settings record for rule extraction.
 *
 * All fields are public and writable. The default constructor assigns every
 * field the value noted next to its declaration; nothing is left
 * uninitialized. The precise meaning of each option is defined by the code
 * that reads it (not visible in this header), so the notes below record only
 * the defaults.
 *
 * NOTE: the declaration order below is also the initialization order used by
 * the constructor; keep the two in sync when adding fields.
 */
struct RuleExtractionOptions {
  // ---- integer limits --------------------------------------------------
  int maxSpan;           ///< default: 10
  int minHoleSource;     ///< default: 2
  int minHoleTarget;     ///< default: 1
  int minWords;          ///< default: 1
  int maxSymbolsTarget;  ///< default: 999
  int maxSymbolsSource;  ///< default: 5
  int maxNonTerm;        ///< default: 2
  int maxScope;          ///< default: 999

  // ---- boolean switches ------------------------------------------------
  bool onlyDirectFlag;              ///< default: false
  bool glueGrammarFlag;             ///< default: false
  bool unknownWordLabelFlag;        ///< default: false
  bool onlyOutputSpanInfo;          ///< default: false
  bool noFileLimit;                 ///< default: false
  bool properConditioning;          ///< default: false
  bool nonTermFirstWord;            ///< default: true
  bool nonTermConsecTarget;         ///< default: true
  bool nonTermConsecSource;         ///< default: false
  bool requireAlignedWord;          ///< default: true
  bool sourceSyntax;                ///< default: false
  bool targetSyntax;                ///< default: false
  bool targetSyntacticPreferences;  ///< default: false
  bool duplicateRules;              ///< default: true
  bool fractionalCounting;          ///< default: true
  bool pcfgScore;                   ///< default: false
  bool gzOutput;                    ///< default: false
  bool unpairedExtractFormat;       ///< default: false
  bool conditionOnTargetLhs;        ///< default: false
  bool boundaryRules;               ///< default: false
  bool flexScoreFlag;               ///< default: false
  bool phraseOrientation;           ///< default: false

  /// Builds an options record with every field set to its default value.
  RuleExtractionOptions() :
    maxSpan(10),
    minHoleSource(2),
    minHoleTarget(1),
    minWords(1),
    maxSymbolsTarget(999),
    maxSymbolsSource(5),
    maxNonTerm(2),
    maxScope(999),
    onlyDirectFlag(false),
    glueGrammarFlag(false),
    unknownWordLabelFlag(false),
    onlyOutputSpanInfo(false),
    noFileLimit(false),
    properConditioning(false),
    nonTermFirstWord(true),
    nonTermConsecTarget(true),
    nonTermConsecSource(false),
    requireAlignedWord(true),
    sourceSyntax(false),
    targetSyntax(false),
    targetSyntacticPreferences(false),
    duplicateRules(true),
    fractionalCounting(true),
    pcfgScore(false),
    gzOutput(false),
    unpairedExtractFormat(false),
    conditionOnTargetLhs(false),
    boundaryRules(false),
    flexScoreFlag(false),
    phraseOrientation(false)
  {
  }
};
|
|
|
} |
|
|
|
|