本文整理汇总了C++中PhraseTable::normalize方法的典型用法代码示例。如果您正苦于以下问题:C++ PhraseTable::normalize方法的具体用法?C++ PhraseTable::normalize怎么用?C++ PhraseTable::normalize使用的例子?那么, 这里精选的方法代码示例或许可以为您提供帮助。您也可以进一步了解该方法所在类PhraseTable
的用法示例。
在下文中一共展示了PhraseTable::normalize方法的1个代码示例,这些例子默认根据受欢迎程度排序。您可以为喜欢或者感觉有用的代码点赞,您的评价将有助于系统推荐出更棒的C++代码示例。
示例1: extractPhrase
void extractPhrase(JKArgs& args)
{
if(!args.is_set("src")||!args.is_set("tar")||!args.is_set("align"))
usage();
ifstream fsrc(args.value("src").c_str()),ftar(args.value("tar").c_str()),falign(args.value("align").c_str());
ifstream fweight;
ofstream os;
double threshold=0;
if(args.is_set("threshold"))threshold=atof(args.value("threshold").c_str());
if(args.is_set("o"))os.open(args.value("o").c_str());
if(args.is_set("w"))fweight.open(args.value("w").c_str());
Dic<double> s2tLexDic,t2sLexDic;
if(!args.is_set("s2tLex")||!args.is_set("t2sLex"))
{
cerr<<"making lex dic on the fly"<<endl;
makeLexDic(args.value("src"),args.value("tar"),args.value("align"),args.value("w"),s2tLexDic,t2sLexDic);
}
else
{
s2tLexDic.load(args.value("s2tLex"));
t2sLexDic.load(args.value("t2sLex"));
}
bool reverse=false,normalize=false;
bool moore=false;
if(args.is_set("moore"))if(args.value("moore")=="true")moore=true;
if(args.is_set("reverse"))
reverse=true;
if(args.is_set("normalize"))
if(args.value("normalize")=="true")
normalize=true;
int srcLengthLimit=8,tarLengthLimit=12;
if(args.is_set("srcLengthLimit"))
srcLengthLimit=atoi(args.value("srcLengthLimit").c_str());
if(args.is_set("tarLengthLimit"))
tarLengthLimit=atoi(args.value("tarLengthLimit").c_str());
int maxNumOfUnAlignedWords=2;
if(args.is_set("maxNumOfUnAlignedWords"))
maxNumOfUnAlignedWords=atoi(args.value("maxNumOfUnAlignedWords").c_str());
double start=1,stop=1E10;
if(args.is_set("range"))
{
string range=args.value("range");
start=atoi(range.substr(0,range.find("-")).c_str());
stop=atof(range.substr(range.find("-")+1).c_str());
cerr<<"start:"<<start<<",stop:"<<stop<<endl;
}
PhraseTable phraseTable;
int count=0;
while(!falign.eof())
{
string align="",src="",tar="";
double weight=1;
getline(falign,align);
getline(fsrc,src);
getline(ftar,tar);
if(fweight.good())fweight>>weight;
//Alignment alignment(align,maxNumOfUnAlignedWords);
count++;
if(count<start)continue;
if(count>stop)break;
if(weight==0||weight<threshold)continue;
if(moore)weight=1;
vector<PhraseRuleEntry> phrases;
phraseExtractor(src,tar,align,s2tLexDic,t2sLexDic,phrases,srcLengthLimit,tarLengthLimit,maxNumOfUnAlignedWords,weight);
for(size_t i=0;i<phrases.size();i++)
{
PhraseRuleEntry& pre=phrases[i];
if(reverse)
{
string tmp=pre.srcPhrase;
pre.srcPhrase=pre.tarPhrase;
pre.tarPhrase=tmp;
}
if(os.good())phraseTable.add(pre.srcPhrase,pre.tarPhrase,pre);
}
}
if(args.is_set("printTopEntrys"))
{
int topN=atoi(args.value("printTopEntrys").c_str());
phraseTable.printTopEntrys(topN,"topEntrys.txt");
}
if(normalize)
phraseTable.normalize();
bool onlyonefeat=false;
if(args.is_set("onlyonefeat"))
onlyonefeat=true;
if(os.good())phraseTable.print(os,onlyonefeat);
string signal="mftsignal";
if(args.is_set("signal"))signal=args.value("signal");
ofstream o_sg(signal.c_str());
o_sg.close();
}