In [3]:
import jieba
import jieba.analyse
In [4]:
# Sample Chinese passage (a corporate capital-increase announcement) used as
# input for keyword extraction.
s = "此外,公司拟对全资子公司吉林欧亚置业有限公司增资4.3亿元,增资后,吉林欧亚置业注册资本由7000万元增加到5亿元。吉林欧亚置业主要经营范围为房地产开发及百货零售等业务。目前在建吉林欧亚城市商业综合体项目。2013年,实现营业收入0万元,实现净利润-139.13万元。"

# With withWeight=True each result is a (keyword, weight) pair; print one per line.
sample_tag_weights = jieba.analyse.extract_tags(s, withWeight=True)
for keyword, weight in sample_tag_weights:
    print('%s %s' % (keyword, weight))
In [5]:
import pymongo
# MongoClient() is called without arguments, so the driver's default host/port apply.
mongo_client = pymongo.MongoClient()

# Database and collection holding the crawled logs analysed in this notebook.
db = mongo_client['mfw_crawler']
logs_col = db['logs-10030']
In [13]:
# Zero-based position (in the collection's default order) of the log to sample.
LOG_INDEX = 100

# Cursor limited to the first 100 logs; kept under its original name.
logs = logs_col.find(limit=100)

# The original `logs[100]` indexed past the cursor's limit of 100 (positions 0-99).
# It only worked because PyMongo ignores a previously applied limit when a cursor
# is indexed. Fetch the same document with an explicit skip instead, so the intent
# is visible and a too-small collection produces a clear error.
log_doc = logs_col.find_one(skip=LOG_INDEX)
if log_doc is None:
    raise IndexError(
        'collection has no document at position {}'.format(LOG_INDEX)
    )
log_text = log_doc['text_content']
In [12]:
# Extract weighted keywords from the sampled log text and print one pair per line.
log_tag_weights = jieba.analyse.extract_tags(log_text, withWeight=True)
for keyword, weight in log_tag_weights:
    print('%s %s' % (keyword, weight))
In [14]:
# Extract keywords from the sampled log text with TextRank and print each
# keyword followed by its weight.
textrank_pairs = jieba.analyse.textrank(log_text, withWeight=True)
for keyword, weight in textrank_pairs:
    print('{} {}'.format(keyword, weight))