51 lines
1.6 KiB
Python
51 lines
1.6 KiB
Python
from os import path
|
|
from wordcloud import WordCloud
|
|
import jieba
|
|
import re
|
|
#
|
|
# special_character_removal = re.compile(r'[,。、【 】“”:;()《》‘’{}?!⑦%>℃.^-——=&#@¥『』]', re.IGNORECASE)
|
|
#
|
|
# #
|
|
# # text =""
|
|
# fw=open("hlm_seg.txt","w",encoding="utf-8")
|
|
# with open('hlm.txt',encoding="utf-8") as fp:
|
|
# for line in fp:
|
|
# l = special_character_removal.sub('', line.strip())
|
|
# words=jieba.cut(l)
|
|
#
|
|
# t=" ".join(words)
|
|
# fw.write(t)
|
|
# fw.write("\n")
|
|
# fw.close()
|
|
|
|
|
|
# import numpy as np
|
|
# from PIL import Image, ImageDraw, ImageFont
|
|
# background_image = np.array(Image.open("background.png"))
|
|
d = path.dirname(__file__)
|
|
# Read the whole text.
|
|
text = open(path.join(d, 'hlm_seg.txt'),encoding="utf-8").read()
|
|
# Generate a word cloud image
|
|
# font=path.join(d, "simkai.ttf")
|
|
font='C:/Windows/Fonts/simkai.ttf'
|
|
wordcloud = WordCloud(font_path=font,#设置中文字体,不指定就会出现中文不显示
|
|
width=1024,#宽
|
|
height=840,#高
|
|
background_color='white',#设置背景色
|
|
# mask=background_image#背景
|
|
# max_words=100,#最大词汇数
|
|
# max_font_size=100#最大号字体
|
|
).generate(text)
|
|
|
|
# Display the generated image:
|
|
# the matplotlib way:
|
|
import matplotlib.pyplot as plt
|
|
|
|
# lower max_font_size
|
|
# wordcloud = WordCloud(max_font_size=40).generate(text)
|
|
|
|
plt.figure()
|
|
plt.imshow(wordcloud)
|
|
plt.axis("off")
|
|
plt.show()
|