casio1374633

导航

 
import jieba
import os
import jieba.analyse


# Demo script: read a text file and print its jieba segmentation in several
# modes, followed by the top keywords.

# Read the whole input text. The encoding is passed explicitly so decoding
# does not depend on the platform's locale default, which can fail on or
# garble Chinese text.
# NOTE(review): assumes src.txt is UTF-8 encoded -- confirm for your input.
with open('src.txt', 'r', encoding='utf-8') as file:
    data = file.read()

# Each segmentation result is assigned to seg_list and joined once for
# printing before being replaced by the next mode's result.
seg_list = jieba.cut(data, cut_all=True)  # full mode
print("Full Mode:", "| ".join(seg_list))
seg_list = jieba.cut(data, cut_all=False)  # default (precise) mode
print("Default Mode:", "| ".join(seg_list))
seg_list = jieba.cut_for_search(data)  # search-engine mode
print("Search Mode:", "| ".join(seg_list))
# Extract the top 20 keywords using the TF-IDF method.
tags = jieba.analyse.extract_tags(data, topK=20)
print("TopK Mode:", "| ".join(tags))

 

posted on 2016-12-27 15:40  casio1374633  阅读(207)  评论(0)  编辑  收藏  举报