In [30]:
import jieba
In [31]:
# Segment the sample sentence in full mode (cut_all=True).
seg_list = jieba.cut(
    '我是一个山东人,我在北京工作,哈哈哈哈',
    cut_all=True,
)
In [32]:
# Show the full-mode tokens separated by '/', directly after the label
# (sep='' keeps the label and the tokens adjacent, with no space between).
print('Full mode:', '/'.join(seg_list), sep='')
In [33]:
# Segment the same sample sentence with full mode switched off
# (cut_all=False).
seg_right = jieba.cut(
    '我是一个山东人,我在北京工作,哈哈哈哈',
    cut_all=False,
)
In [34]:
# Show the cut_all=False tokens separated by '/', directly after the label
# (sep='' keeps the label and the tokens adjacent, with no space between).
print('default mode:', '/'.join(seg_right), sep='')
In [35]:
import jieba.analyse as analyse
# Read the entire contents of jieba.txt as UTF-8 text. The context manager
# closes the file handle as soon as the read completes, instead of leaving an
# open handle around for the rest of the session.
with open('jieba.txt', encoding='utf-8') as corpus_file:
    lines = corpus_file.read()
In [36]:
# Print the top 20 keywords of the text together with their weights.
# With withWeight=True, extract_tags returns (keyword, weight) pairs rather
# than plain strings, so passing the result straight to ' '.join() raises
# TypeError. Each pair is rendered as "keyword:weight" before joining.
print(' '.join(
    f'{word}:{weight:.4f}'
    for word, weight in analyse.extract_tags(lines, topK=20, withWeight=True)
))