哈姆雷特单词的排名

代码

def getText():
    txt = open("hamlet.txt","r").read()
    txt = txt.lower()
    for ch in '''~!@#$%^&*()_+{}|:"<>?;',./''':
        txt = txt.replace(ch," ")#去噪，为什么是以空格隔开，那个是因为有些单词之间仅仅是靠一个字符来连接
    return txt
hamletTxt = getText()
words = hamletTxt.split()#split返回一个列表
dict = {}
for word in words:
    dict[word]=dict.get(word,0)+1#get方法的后一个参数0代表的是当找不到值的时的默认返回值
list_cnt = list(dict.items())#无序字典转有序列表，才能排序
list_cnt.sort(key = lambda x:x[1],reverse=True)#x[1]代表的是键所对应的值
for i in range(10):
    print("{0:<10}{1:>5}".format(list_cnt[i][0],list_cnt[i][1]))

输出

the        1142
and         964
to          742
of          669
i           628
you         550
a           531
my          513
hamlet      470
in          450

read和没read

代码

txt = open("hamlet.txt","r").read()
print(type(txt))
txt = open("hamlet.txt", "r")
print(type(txt))

输出

<class 'str'>
<class '_io.TextIOWrapper'>

字典方法的返回类型

代码

print(type(dict.keys()))
print(type(dict.values()))
print(type(dict.items()))
print(type(dict))

输出

<class 'dict_keys'>
<class 'dict_values'>
<class 'dict_items'>
<class 'dict'>

资源

哈姆雷特文本
嵩天的书和网课