期末综合大作业:词频统计

from collections import Counter

# Input text, output report, and tuning knobs for the script.
SOURCE_PATH = 'l.txt'
OUTPUT_PATH = 'lCount.txt'
SEPARATORS = ",'"  # characters treated as word separators, not word content
TOP_N = 20         # how many of the most frequent words to display


def read_text(path):
    """Return the full contents of the text file at *path*.

    The file is read with the platform default encoding.
    """
    with open(path, 'r') as source_file:
        return source_file.read()


def strip_separators(text, separators=SEPARATORS):
    """Return *text* with every character in *separators* replaced by a space."""
    # str.replace returns a new string; the result must be re-bound, otherwise
    # the punctuation silently stays in the text that is counted later.
    for mark in separators:
        text = text.replace(mark, ' ')
    return text


def split_words(text, separators=SEPARATORS):
    """Split *text* into a list of words.

    Separator characters are blanked out first, then the text is split on any
    run of whitespace (spaces, tabs, newlines), so no empty strings are
    produced and words on adjacent lines are not glued together.
    """
    return strip_separators(text, separators).split()


def count_words(words):
    """Return a dict mapping each distinct word to its number of occurrences."""
    # Counter tallies in a single pass instead of calling list.count per word.
    return dict(Counter(words))


def rank_words(counts):
    """Return ``(word, count)`` pairs sorted by count, highest first.

    The sort is stable, so words with equal counts keep the order in which
    they appear in *counts*.
    """
    return sorted(counts.items(), key=lambda pair: pair[1], reverse=True)


def write_counts(ranked, path):
    """Append one ``"<count> <word>"`` line per entry of *ranked* to *path*."""
    # NOTE(review): append mode is kept from the original script, so running
    # the script repeatedly accumulates duplicate lines -- confirm that 'a'
    # (rather than 'w') is really intended.
    with open(path, mode='a', encoding='utf-8') as count_file:
        count_file.writelines(
            '{} {}\n'.format(count, word) for word, count in ranked
        )


def main():
    """Run the word-frequency exercise step by step, printing each stage."""
    # 1. Load the text and show it.
    raw_text = read_text(SOURCE_PATH)
    print(raw_text)

    # 2. Replace punctuation with spaces and show the cleaned text.
    cleaned_text = strip_separators(raw_text)
    print(cleaned_text)

    # 3. Break the cleaned text into words.
    words = split_words(cleaned_text)
    print(words)

    # 4. Show the distinct words, then count every word.
    print(set(words))
    counts = count_words(words)
    print(counts)
    for word, count in counts.items():
        print(word, count)

    # 5. Sort by frequency, most frequent first.
    print(list(counts.items()))
    ranked = rank_words(counts)
    print(ranked)

    # 6. Show the TOP_N most frequent words; slicing copes with texts that
    #    contain fewer than TOP_N distinct words.
    for entry in ranked[:TOP_N]:
        print(entry)

    # 7. Save the complete ranking.
    write_counts(ranked, OUTPUT_PATH)


if __name__ == '__main__':
    main()

posted on 2018-06-20 21:27  刘婵  阅读(77)  评论(0)    收藏  举报

导航