利用 Python 统计文档中各单词出现的次数并按次数排序

import string
from collections import Counter

# Text file whose words are counted when this file is run as a script.
path = 'waldnn'


def count_words(text):
    """Count how often each word occurs in *text*.

    The text is split on whitespace; each token has leading and trailing
    ASCII punctuation stripped and is lower-cased before counting.

    Args:
        text: The full text to analyse, as a single string.

    Returns:
        A ``collections.Counter`` mapping each normalised word to its
        number of occurrences.
    """
    normalised = (
        raw_word.strip(string.punctuation).lower() for raw_word in text.split()
    )
    # Tokens made only of punctuation (e.g. "--") strip down to '' and are
    # not words, so they are left out of the tally.
    # Counter tallies in a single pass instead of rescanning the whole word
    # list once per distinct word.
    return Counter(word for word in normalised if word)


def main():
    """Print every word of the file at ``path`` with its count, most frequent first."""
    with open(path, 'r') as text:
        counts_dict = count_words(text.read())

    # most_common() sorts by descending count; equal counts keep the order in
    # which the words first appeared, so the output is deterministic.
    for word, count in counts_dict.most_common():
        print('{} -- {} times'.format(word, count))


if __name__ == '__main__':
    main()

 

posted @ 2017-03-10 19:23  Erick-LONG  阅读(1596)  评论(0)  编辑  收藏  举报