Python 词云

import requests

import jieba #结巴分词
from wordcloud import WordCloud
import matplotlib.pyplot as plt
from scipy.misc import imread

# Word-cloud script: download a horoscope page, keep only the characters
# that take three or more bytes in UTF-8, segment them with jieba, and render
# the segmented text as a word cloud shaped by a mask image.


def _keep_wide_chars(text):
    """Return *text* lower-cased with all 1- and 2-byte UTF-8 characters removed.

    Every character whose UTF-8 encoding is shorter than three bytes is
    dropped; that covers ASCII letters, digits, punctuation, spaces and
    newlines. Characters encoded in three or more bytes (for example common
    CJK characters) are kept in their original order.
    """
    return ''.join(ch for ch in text.lower() if len(ch.encode()) >= 3)


# A timeout keeps the script from hanging forever on a stalled connection,
# and raise_for_status() stops an HTTP error page from being turned into a
# word cloud.
respon = requests.get('https://www.d1xz.net/yunshi/today/Virgo/', timeout=10)
respon.raise_for_status()
print(type(respon))
print(respon.url)
print(respon.encoding)

# Save the raw page text so the next stage can read it line by line.
with open('D:/xingzuo.txt', 'w', encoding='UTF-8') as wt:
    wt.write(respon.text)

# Filter and segment each line, appending the comma-joined tokens to the
# corpus file. The corpus is opened once, in append mode as in the original
# script, so its content accumulates across runs.
with open('D:/xingzuo.txt', 'r', encoding='UTF-8') as rd, \
        open('D:/cihai.txt', 'a', encoding='UTF-8') as out:
    for line in rd:
        out.write(','.join(jieba.cut(_keep_wide_chars(line))))

# Read the whole corpus back; the context manager closes the file handle.
with open('D:/cihai.txt', 'r', encoding='UTF-8') as src:
    text = src.read()
print(type(text))

# NOTE(review): scipy.misc.imread is absent from recent SciPy releases;
# confirm the installed version still provides it.
b_mask = imread('D:/back.JPG')

# Raw string: the backslashes in the Windows path must not be read as
# escape sequences.
wordcloud = WordCloud(
    font_path=r'C:\Windows\Fonts\SIMLI.ttf',
    mask=b_mask,
    background_color='white',
).generate(text)

# The background image should be transparent; a Windows font is supplied so
# that Chinese characters can be rendered.

plt.imshow(wordcloud)
plt.axis('off')
plt.show()

wordcloud.to_file('test.jpg')

Python 词云

相关推荐