用 Python 统计多个文本文件中指定单词的出现次数

来源:互联网 发布:知乎和百度关系 编辑:程序博客网 时间:2024/06/06 12:41
import collections  # Counter
import os
import string

# Directory that holds the diary text files.
DIARY_DIR = "/Users/U/workspace/python learning/show-me-the-code/0006/diary/"
# The word whose occurrences are counted.
TARGET_WORD = 'I'

# Translation table that deletes every ASCII punctuation character.
# Built once here instead of once per word inside the loop.
_STRIP_PUNCTUATION = str.maketrans("", "", string.punctuation)


def count_word(directory, word):
    """Count how often *word* occurs across all files in *directory*.

    Each regular file directly inside *directory* is read as UTF-8 text,
    split on any run of whitespace, and stripped of ASCII punctuation
    before the words are compared. Matching is case-sensitive.

    Args:
        directory: Path of the directory containing the text files.
        word: The exact word to count.

    Returns:
        The total number of occurrences of *word* over all files.

    Raises:
        OSError: If the directory or one of its files cannot be read.
        UnicodeDecodeError: If a file is not valid UTF-8.
    """
    total = 0
    for name in os.listdir(directory):
        file_path = os.path.join(directory, name)
        if not os.path.isfile(file_path):
            # os.listdir also returns sub-directories; open() would fail on them.
            continue
        with open(file_path, encoding="utf-8") as diary:
            # split() with no argument splits on newlines and tabs as well as
            # spaces, so a word at a line boundary is not glued to its neighbour.
            words = diary.read().split()
        cleaned = [w.translate(_STRIP_PUNCTUATION) for w in words]
        # Counter returns 0 for a missing key, so absent words add nothing.
        total += collections.Counter(cleaned)[word]
    return total


if __name__ == "__main__":
    print('%s:%d' % (TARGET_WORD, count_word(DIARY_DIR, TARGET_WORD)))

原创粉丝点击