本文整理汇总了Python中FileIO.countFiles方法的典型用法代码示例。如果您正苦于以下问题：Python FileIO.countFiles方法的具体用法？Python FileIO.countFiles怎么用？Python FileIO.countFiles使用的例子？那么，这里精选的方法代码示例或许可以为您提供帮助。您也可以进一步了解该方法所在模块FileIO的用法示例。
在下文中一共展示了FileIO.countFiles方法的2个代码示例,这些例子默认根据受欢迎程度排序。您可以为喜欢或者感觉有用的代码点赞,您的评价将有助于系统推荐出更棒的Python代码示例。
示例1: buildCorpus
# 需要导入模块: import FileIO [as 别名]
# 或者: from FileIO import countFiles [as 别名]
def buildCorpus(dirPath, corpusName):
    """Append per-token occurrence counts for one directory to a corpus file.

    Every entry of ``dirPath`` is read with ``FileIO.readFile``, passed
    through ``Tokenizer.tokenizer`` and split on newlines; each resulting
    piece is counted once per occurrence across all entries.

    Two kinds of line are appended (mode ``'a'``) via ``FileIO.wrtieToFile``:

    * one tab-separated ``label, file-count`` line to the ``classCount.txt``
      file under ``corpus``;
    * one tab-separated ``token, count, label`` line per distinct token to
      ``corpusName``.

    Args:
        dirPath: Directory whose entries are read; also passed to
            ``fetchLabel`` and ``FileIO.countFiles``.
        corpusName: Destination passed to ``FileIO.wrtieToFile`` for the
            token lines.

    Returns:
        None. Results are only written out and progress is printed.
    """
    print('creating corpus!!')
    # presumably the class label for this directory -- confirm against fetchLabel
    tagClass = fetchLabel(dirPath)
    classCnt = FileIO.countFiles(dirPath)

    # The backslash is escaped explicitly: a bare "\c" is an invalid escape
    # sequence (a warning on current Python, slated to become an error).
    # The resulting path string is exactly the same as before.
    FileIO.wrtieToFile("corpus\\classCount.txt", 'a',
                       tagClass + '\t' + str(classCnt) + '\n')

    # Only one label is handled per call, so a flat token -> count mapping
    # is enough; insertion order (first time a token is seen) is preserved.
    tokenCounts = {}
    for dir_entry in os.listdir(dirPath):
        text = FileIO.readFile(os.path.join(dirPath, dir_entry))
        text = Tokenizer.tokenizer(text)
        for token in text.split('\n'):
            tokenCounts[token] = tokenCounts.get(token, 0) + 1

    for token, count in tokenCounts.items():
        FileIO.wrtieToFile(corpusName, 'a',
                           token + '\t' + str(count) + '\t' + tagClass + '\n')
    print('Corpus creation : Done..')
示例2: buildBinarizedCorpus
# 需要导入模块: import FileIO [as 别名]
# 或者: from FileIO import countFiles [as 别名]
def buildBinarizedCorpus(dirPath, corpusName):
    """Append per-token document counts for one directory to a corpus file.

    Every entry of ``dirPath`` is read with ``FileIO.readFile``, passed
    through ``Tokenizer.tokenizer`` and split on newlines. A token
    contributes at most 1 per entry, no matter how often it repeats inside
    that entry, so the final number is how many entries contained it.

    Two kinds of line are appended (mode ``'a'``) via ``FileIO.wrtieToFile``:

    * one tab-separated ``label, file-count`` line to the ``classCount.txt``
      file under ``corpus``;
    * one tab-separated ``token, count, label`` line per distinct token to
      ``corpusName``.

    Args:
        dirPath: Directory whose entries are read; also passed to
            ``fetchLabel`` and ``FileIO.countFiles``.
        corpusName: Destination passed to ``FileIO.wrtieToFile`` for the
            token lines.

    Returns:
        None. Results are only written out and progress is printed.
    """
    print('creating binarized corpus!!')
    # presumably the class label for this directory -- confirm against fetchLabel
    tagClass = fetchLabel(dirPath)
    classCnt = FileIO.countFiles(dirPath)

    # The backslash is escaped explicitly: a bare "\c" is an invalid escape
    # sequence (a warning on current Python, slated to become an error).
    # The resulting path string is exactly the same as before.
    FileIO.wrtieToFile("corpus\\classCount.txt", 'a',
                       tagClass + '\t' + str(classCnt) + '\n')

    # NOTE(review): the snippet arrived with its indentation stripped; the
    # corpus update is assumed to happen only the first time a token is seen
    # within an entry (otherwise the per-entry "seen" map would be unused).
    # Confirm against the original project.
    docCounts = {}
    for dir_entry in os.listdir(dirPath):
        text = FileIO.readFile(os.path.join(dirPath, dir_entry))
        text = Tokenizer.tokenizer(text)
        # dict.fromkeys drops repeats within this entry while keeping the
        # tokens in first-seen order, so the output order is unchanged.
        for token in dict.fromkeys(text.split('\n')):
            docCounts[token] = docCounts.get(token, 0) + 1

    for token, count in docCounts.items():
        FileIO.wrtieToFile(corpusName, 'a',
                           token + '\t' + str(count) + '\t' + tagClass + '\n')
    print('binarized corpus creation done!!')