# Word-frequency script: normalizes the lyrics below, counts how often each
# whole word occurs, drops contraction fragments, and prints the ten most
# frequent words as (word, count) tuples.
from collections import Counter

word = '''
Lately, I've been, I've been losing sleep
Dreaming about the things that we could be
But baby, I've been, I've been praying hard,
Said, no more counting dollars
We'll be counting stars, yeah we'll be counting stars
I see this life like a swinging vine
Swing my heart across the line
And my face is flashing signs
Seek it out and you shall find
Old, but I'm not that old
Young, but I'm not that bold
I don't think the world is sold
I'm just doing what we're told
I feel something so right
Doing the wrong thing
I feel something so wrong
Doing the right thing
I could lie, coudn't I, could lie
Everything that kills me makes me feel alive
Lately, I've been, I've been losing sleep
Dreaming about the things that we could be
But baby, I've been, I've been praying hard,
Said, no more counting dollars
We'll be counting stars
'''
# Punctuation marks that are replaced with a space before splitting.
symbol = [",", ".", "!", "?", "'", ":", "-"]
# Meaningless fragments to discard: once apostrophes become spaces,
# contractions split into pieces such as "don t", "i ve", "we ll", "i m".
words = ['t', 've', 'll', 'm']


def _count_words(text, punctuation, stop_words):
    """Normalize *text* and count whole-word occurrences.

    Args:
        text: Raw text to analyse.
        punctuation: Strings that are each replaced by a single space.
        stop_words: Tokens to leave out of the resulting counts.

    Returns:
        A ``(cleaned, tokens, counts)`` tuple: the lower-cased text with
        punctuation replaced, the list of whitespace-separated tokens, and a
        dict mapping each kept token to its number of occurrences (in order
        of first appearance).
    """
    cleaned = text
    for mark in punctuation:
        cleaned = cleaned.replace(mark, ' ')
    cleaned = cleaned.lower()
    tokens = cleaned.split()
    skipped = set(stop_words)
    # Count tokens rather than calling str.count on the full text: str.count
    # matches substrings, so "i" would also be counted inside "line",
    # "swinging", etc., and "be" inside "been".
    counts = {
        token: total
        for token, total in Counter(tokens).items()
        if token not in skipped
    }
    return cleaned, tokens, counts


new_art, art_list, dic = _count_words(word, symbol, words)
# Most frequent first; ties keep their order of first appearance because
# sorted() is stable.
new_dic = sorted(dic.items(), key=lambda item: item[1], reverse=True)
# Slice instead of indexing 0..9 so a text with fewer than ten distinct
# words does not raise IndexError.
for entry in new_dic[:10]:
    print(entry)