# 词频统计:使用 jieba 库统计《西游记》中出现次数最多的词语

import jieba

# Read the whole novel into memory and split it into a list of words
# with jieba; `txt` ends up as that list of tokens.
#
# The `with` block guarantees the file handle is closed, even if the read
# raises.
#
# The original passed encoding='ANSI', which is an alias of the 'mbcs'
# codec and exists only on Windows. 'gb18030' is portable.
# NOTE(review): assumes the text file is GBK-family encoded (what "ANSI"
# means on a Simplified-Chinese Windows install) -- confirm against the
# actual file.
with open('西游记.txt', mode='r', encoding='gb18030') as f:
    txt = f.read()
txt = jieba.lcut(txt)


# Tokens that must not appear in the frequency table.
# Stored as a frozenset so each `in` test is O(1) instead of a linear scan
# of a list; the collection is consulted once per token of the text.
# Duplicate entries from the original list ('!' and ';') are dropped, which
# does not change membership results.
buyao = frozenset({
    # punctuation and the newline token
    '。', ',', ':', '“', '”', '?', '、', '《', '》', '!', ';', '\n',
    # single-character words
    '道', '了', '我', '的', '他', '你', '那', '是', '也', '在', '有', '又',
    '去', '与', '来', '这', '就', '却', '不', '见', '着', '把', '等', '将',
    '说', '上', '都', '好', '个', '叫', '得', '到', '看', '只', '还',
    # multi-character words
    '一个', '那里', '怎么', '我们', '不知', '两个', '甚么', '不是', '只见',
})

# Tally how many times each token occurs, keeping only tokens that are
# longer than one character and are not listed in `buyao`.
count = {}
for word in txt:
    # Guard clause: excluded tokens and single-character tokens are ignored.
    if word in buyao or len(word) == 1:
        continue
    count[word] = count.get(word, 0) + 1

# (word, occurrences) pairs ordered from most to least frequent.
items = sorted(count.items(), key=lambda pair: pair[1], reverse=True)

# Print the 20 most frequent words, one "word count" pair per line.
# Iterating over a slice instead of indexing items[0..19] avoids an
# IndexError when fewer than 20 distinct words were counted; in that case
# every available entry is printed.
for rw, gs in items[:20]:
    print("{0:5} {1:5}".format(rw, gs))

 

# posted @ 2021-11-14 10:56  怜雨慕  阅读(70)  评论(0)    收藏  举报