wordcloud_hlm
This commit is contained in:
50
wordcloud_hlm.py
Normal file
50
wordcloud_hlm.py
Normal file
@@ -0,0 +1,50 @@
|
||||
from os import path
|
||||
from wordcloud import WordCloud
|
||||
import jieba
|
||||
import re
|
||||
#
|
||||
# special_character_removal = re.compile(r'[,。、【 】“”:;()《》‘’{}?!⑦%>℃.^-——=&#@¥『』]', re.IGNORECASE)
|
||||
#
|
||||
# #
|
||||
# # text =""
|
||||
# fw=open("hlm_seg.txt","w",encoding="utf-8")
|
||||
# with open('hlm.txt',encoding="utf-8") as fp:
|
||||
# for line in fp:
|
||||
# l = special_character_removal.sub('', line.strip())
|
||||
# words=jieba.cut(l)
|
||||
#
|
||||
# t=" ".join(words)
|
||||
# fw.write(t)
|
||||
# fw.write("\n")
|
||||
# fw.close()
|
||||
|
||||
|
||||
# import numpy as np
|
||||
# from PIL import Image, ImageDraw, ImageFont
|
||||
# background_image = np.array(Image.open("background.png"))
|
||||
d = path.dirname(__file__)
|
||||
# Read the whole text.
|
||||
text = open(path.join(d, 'hlm_seg.txt'),encoding="utf-8").read()
|
||||
# Generate a word cloud image
|
||||
# font=path.join(d, "simkai.ttf")
|
||||
font='C:/Windows/Fonts/simkai.ttf'
|
||||
wordcloud = WordCloud(font_path=font,#设置中文字体,不指定就会出现中文不显示
|
||||
width=1024,#宽
|
||||
height=840,#高
|
||||
background_color='white',#设置背景色
|
||||
# mask=background_image#背景
|
||||
# max_words=100,#最大词汇数
|
||||
# max_font_size=100#最大号字体
|
||||
).generate(text)
|
||||
|
||||
# Display the generated image:
|
||||
# the matplotlib way:
|
||||
import matplotlib.pyplot as plt
|
||||
|
||||
# lower max_font_size
|
||||
# wordcloud = WordCloud(max_font_size=40).generate(text)
|
||||
|
||||
plt.figure()
|
||||
plt.imshow(wordcloud)
|
||||
plt.axis("off")
|
||||
plt.show()
|
||||
Reference in New Issue
Block a user