本文整理汇总了C++中Vocabulary::read_from_dir方法的典型用法代码示例。如果您正苦于以下问题：C++ Vocabulary::read_from_dir方法的具体用法？C++ Vocabulary::read_from_dir怎么用？C++ Vocabulary::read_from_dir使用的例子？那么恭喜您，这里精选的方法代码示例或许可以为您提供帮助。您也可以进一步了解该方法所在类Vocabulary的用法示例。
在下文中一共展示了Vocabulary::read_from_dir方法的1个代码示例,这些例子默认根据受欢迎程度排序。您可以为喜欢或者感觉有用的代码点赞,您的评价将有助于系统推荐出更棒的C++代码示例。
示例1: main
int main(int argc, char * argv[])
{
Options options = ProcessOptions(argc,argv);
auto str_path_in = options.path_in.string();
auto path_out=options.path_out;
if (boost::filesystem::create_directory(path_out))
{
std::cerr << "creating target directory\n";
}
provenance = std::string();
provenance += "vocab collected on " + get_str_time();
provenance += "source corpus : " + str_path_in + "\n";
std::cerr<<"assigning ids\n";
vocab.read_from_dir(str_path_in);
provenance = provenance + "words in corpus : "+ FormatHelper::ConvertToStr(vocab.cnt_words_processed)+"\n";
provenance = provenance + "unique words : "+ FormatHelper::ConvertToStr(vocab.cnt_words)+"\n";
vocab.reduce(options.min_frequency);
provenance=provenance+"filtered with minimal frequency: "+FormatHelper::ConvertToStr(options.min_frequency)+"\n";
provenance = provenance + "unique words : "+ FormatHelper::ConvertToStr(vocab.cnt_words)+"\n";
std::cerr<<"creating list of frequencies\n";
vocab.freq_per_id.resize(vocab.cnt_words);
vocab.lst_id2word.resize(vocab.cnt_words);
std::fill (vocab.freq_per_id.begin(),vocab.freq_per_id.end(),0);
std::cerr<<"populating frequencies\n";
vocab.populate_frequency();
vocab.reassign_ids(vocab.freq_per_id);
vocab.populate_frequency();
vocab.populate_ids();
std::cerr<<"dumping ids and frequencies\n";
vocab.dump_ids((path_out / boost::filesystem::path("ids")).string());
vocab.dump_frequency((path_out / boost::filesystem::path("frequencies")).string());
write_value_to_file((path_out / boost::filesystem::path("cnt_unique_words")).string(),vocab.cnt_words);
write_value_to_file((path_out / boost::filesystem::path("cnt_words")).string(),vocab.cnt_words_processed);
write_vector_to_file((path_out / boost::filesystem::path("freq_per_id")).string(),vocab.freq_per_id);
write_value_to_file((path_out / boost::filesystem::path("provenance.txt")).string(),provenance);
return 0;
}