"""Count word frequencies in the novel Journey to the West and draw a word cloud."""
import jieba
import wordcloud


def takeSecond(elem):
    """Return the item at index 1 of ``elem``.

    Used as the sort key for ``(word, count)`` pairs so that sorting is
    done by count.
    """
    return elem[1]


def createWordCloud(text):
    """Build a word cloud from ``text`` and save it as ``西游记词云图.jpg``.

    Args:
        text: The string handed to ``WordCloud.generate``.
    """
    # NOTE(review): "msyh.ttf" is presumably a CJK-capable font that must be
    # resolvable from the working directory -- confirm it is available.
    w = wordcloud.WordCloud(
        font_path="msyh.ttf",
        width=1000,
        height=500,
        background_color="white",
    ).generate(text)
    w.to_file("西游记词云图.jpg")


def main():
    """Print the 20 most frequent words of ``西游记.txt`` and draw a word cloud.

    The text is segmented with ``jieba.lcut``; single-character tokens are
    skipped; aliases of the main characters are merged into one canonical
    name; the comma-separated words listed in ``excludes.txt`` are removed
    from the tally.
    """
    # Alias -> canonical name. Every alias is counted under its canonical name.
    aliases = {
        "大圣": "孙悟空",
        "老孙": "孙悟空",
        "行者": "孙悟空",
        "孙大圣": "孙悟空",
        "孙行者": "孙悟空",
        "猴王": "孙悟空",
        "悟空": "孙悟空",
        "齐天大圣": "孙悟空",
        "猴子": "孙悟空",
        "师父": "唐僧",
        "三藏": "唐僧",
        "圣僧": "唐僧",
        "呆子": "猪八戒",
        "八戒": "猪八戒",
        "老猪": "猪八戒",
        "沙和尚": "沙僧",
        "妖精": "妖怪",
        "妖魔": "妖怪",
        "妖道": "妖怪",
        "佛祖": "如来",
        "三太子": "白马",
    }

    path = "西游记.txt"
    # ``with`` guarantees the file is closed even if reading fails.
    with open(path, "r", encoding="utf-8") as file:
        text = file.read()

    counts = {}
    for word in jieba.lcut(text):
        if len(word) == 1:
            continue
        rword = aliases.get(word, word)
        counts[rword] = counts.get(rword, 0) + 1

    with open("excludes.txt", "r", encoding="utf-8") as file:
        # Strip surrounding whitespace so a trailing newline in the file
        # does not prevent the last entry from matching.
        excludes = [entry.strip() for entry in file.read().split(",")]
    for delWord in excludes:
        # Excluded words that never occurred are simply ignored.
        counts.pop(delWord, None)

    items = list(counts.items())
    items.sort(key=takeSecond, reverse=True)

    # Slicing is safe even when fewer than 20 distinct words remain.
    top = items[0:20]
    for keyWord, count in top:
        print("{0:<10}{1:>5}".format(keyWord, count))

    # NOTE(review): the cloud is generated from the repr of the list, so each
    # word appears once in that text; the counts presumably do not influence
    # the word sizes -- confirm whether frequency weighting was intended.
    createWordCloud(str(top))


# Runs on execution and on import alike; there is no ``__main__`` guard.
main()
时间: 2024-04-06 16:34:57 浏览: 178
在代码中有以下几个错误:
1. 第一行代码应该在同一行,不能出现换行。
2. 第二行代码需要加上空格。
3. 第四行代码需要加上空格。
4. 第18行代码需要加上空格。
5. 第27行代码`file.close`后需要加上括号。
6. 第37行代码`file.close`后需要加上括号。
7. 第51行代码的`range(20)`应该改为`range(len(items))`,否则当词条少于 20 个时,`items[i]` 会引发 IndexError。
8. 第54行代码需要加上括号。
这是修改后的代码:
```
import jieba
import wordcloud
def takeSecond(elem):
    """Return the item at index 1 of ``elem``.

    Used as the sort key for ``(word, count)`` pairs so that sorting is
    done by count.
    """
    return elem[1]
def createWordCloud(text):
    """Build a word cloud from ``text`` and save it as ``西游记词云图.jpg``.

    Args:
        text: The string handed to ``WordCloud.generate``.
    """
    # NOTE(review): "msyh.ttf" is presumably a CJK-capable font that must be
    # resolvable from the working directory -- confirm it is available.
    w = wordcloud.WordCloud(
        font_path="msyh.ttf",
        width=1000,
        height=500,
        background_color="white",
    ).generate(text)
    w.to_file("西游记词云图.jpg")
def main():
    """Print word frequencies of ``西游记.txt`` and draw a word cloud.

    The text is segmented with ``jieba.lcut``; single-character tokens are
    skipped; aliases of the main characters are merged into one canonical
    name; the comma-separated words listed in ``excludes.txt`` are removed
    from the tally. Every remaining word is printed with its count in
    descending order, and the 20 most frequent entries are passed to
    ``createWordCloud``.
    """
    # Alias -> canonical name. Every alias is counted under its canonical name.
    aliases = {
        "大圣": "孙悟空",
        "老孙": "孙悟空",
        "行者": "孙悟空",
        "孙大圣": "孙悟空",
        "孙行者": "孙悟空",
        "猴王": "孙悟空",
        "悟空": "孙悟空",
        "齐天大圣": "孙悟空",
        "猴子": "孙悟空",
        "师父": "唐僧",
        "三藏": "唐僧",
        "圣僧": "唐僧",
        "呆子": "猪八戒",
        "八戒": "猪八戒",
        "老猪": "猪八戒",
        "沙和尚": "沙僧",
        "妖精": "妖怪",
        "妖魔": "妖怪",
        "妖道": "妖怪",
        "佛祖": "如来",
        "三太子": "白马",
    }

    path = "西游记.txt"
    # ``with`` guarantees the file is closed even if reading fails.
    with open(path, "r", encoding="utf-8") as file:
        text = file.read()

    counts = {}
    for word in jieba.lcut(text):
        if len(word) == 1:
            continue
        rword = aliases.get(word, word)
        counts[rword] = counts.get(rword, 0) + 1

    with open("excludes.txt", "r", encoding="utf-8") as file:
        # Strip surrounding whitespace so a trailing newline in the file
        # does not prevent the last entry from matching.
        excludes = [entry.strip() for entry in file.read().split(",")]
    for delWord in excludes:
        # Excluded words that never occurred are simply ignored.
        counts.pop(delWord, None)

    items = list(counts.items())
    items.sort(key=takeSecond, reverse=True)
    for keyWord, count in items:
        print("{0:<10}{1:>5}".format(keyWord, count))

    # NOTE(review): the cloud is generated from the repr of the list, so each
    # word appears once in that text; the counts presumably do not influence
    # the word sizes -- confirm whether frequency weighting was intended.
    createWordCloud(str(items[0:20]))
# Script entry point. There is no ``__main__`` guard, so this call runs both
# when the file is executed and when it is imported.
main()
```
阅读全文