# -*- coding: utf-8 -*-
"""Word-frequency counter: an exercise in using dictionaries.

Reads one line of text from standard input, lower-cases it, replaces a fixed
set of punctuation characters and all ASCII digits with spaces, splits the
result on whitespace, counts each word and prints the intermediate results
followed by the most frequent word(s).

Created on Mon Nov 22 17:19:33 2021

@author: Administrator

Provenance: recovered from patch 7d67de6ba02b2393378ee7848bbb424341d05226
("ADD file via upload", hnu202111020216, Wed, 5 Jan 2022 15:41:17 +0800),
which created the file 字典的运用:词频统计.py.
"""

from collections import Counter

# Characters that are turned into spaces before splitting.  The backslash is
# written as "\\" on purpose: the previous spelling "\/" relied on an invalid
# escape sequence, which newer interpreters warn about.
SEPARATORS = "\".,~!@#$%^&*()+_\\/0123456789"

# One translation table lets str.translate do every replacement in one pass.
_SEPARATOR_TABLE = str.maketrans(SEPARATORS, " " * len(SEPARATORS))


def normalize_text(text: str) -> str:
    """Return *text* lower-cased with every separator replaced by a space.

    Characters that are not listed in ``SEPARATORS`` (for example ``?`` or
    ``-``) are left untouched and therefore stay part of their word.
    """
    return text.lower().translate(_SEPARATOR_TABLE)


def count_words(words) -> dict:
    """Return a plain dict mapping each word to its number of occurrences.

    Keys appear in first-seen order.  A plain ``dict`` (not a ``Counter``) is
    returned so that printing it shows ``{...}`` exactly as before.
    """
    return dict(Counter(words))


def sort_by_frequency(counts) -> list:
    """Return ``(word, count)`` pairs sorted by count, highest first.

    The sort is stable, so words with equal counts keep the order they have
    in *counts*.
    """
    return sorted(counts.items(), key=lambda pair: pair[1], reverse=True)


def most_frequent(counts) -> list:
    """Return the ``(word, count)`` pairs that share the highest count.

    Returns an empty list when *counts* is empty instead of raising
    ``ValueError`` from ``max()``.
    """
    if not counts:
        return []
    top = max(counts.values())  # computed once, not once per word
    return [(word, count) for word, count in counts.items() if count == top]


def main() -> None:
    """Read one line from stdin and print the word-frequency report."""
    text = normalize_text(input())
    print(text)

    # Split into words.
    words = text.split()
    print(words)

    # Count word frequencies.
    counts = count_words(words)
    print(counts)

    # Sort by frequency; sorted() yields a list of pairs, so it is converted
    # back to a dict afterwards.
    ranked = sort_by_frequency(counts)
    print(ranked)
    ranked_counts = dict(ranked)
    print(ranked_counts)

    # Input without any words has no maximum to report.
    winners = most_frequent(ranked_counts)
    if not winners:
        return
    print(winners[0][1])
    for word, count in winners:
        print(word, count)


if __name__ == "__main__":
    main()