# Python 词云 (word cloud)
import jieba  # "jieba" Chinese word segmentation
import matplotlib.pyplot as plt
import requests
from wordcloud import WordCloud

try:
    from scipy.misc import imread
except ImportError:
    # scipy.misc.imread is gone from current SciPy releases; matplotlib's
    # reader returns the same kind of uint8 array for JPEG input.
    from matplotlib.pyplot import imread
# Script body: download today's Virgo horoscope page, keep only the wide
# (3+ byte UTF-8) characters, segment them with jieba and render the result
# as a word cloud shaped by a mask image.

# Fetch the page. The timeout keeps the script from hanging on a stalled
# connection; raise_for_status() stops an HTTP error page from being treated
# as horoscope text.
respon = requests.get('https://www.d1xz.net/yunshi/today/Virgo/', timeout=10)
respon.raise_for_status()
print(type(respon))
print(respon.url)
print(respon.encoding)

# Keep a copy of the raw HTML on disk.
with open('D:/xingzuo.txt', 'w', encoding='UTF-8') as wt:
    wt.write(respon.text)

# Re-read the saved page line by line and append the segmented words to the
# word-list file. The word list is opened once, in append mode as before, so
# words written by earlier runs are kept.
with open('D:/xingzuo.txt', 'r', encoding='UTF-8') as rd, \
        open('D:/cihai.txt', 'a', encoding='UTF-8') as words_out:
    for line in rd:
        # Drop every character whose UTF-8 encoding is shorter than 3 bytes
        # (ASCII letters, digits, markup punctuation, whitespace, ...).
        lowline = ''.join(c for c in line.lower() if len(c.encode()) >= 3)
        if not lowline:
            continue
        cut = jieba.cut(lowline)
        # End each line's words with a newline so the last word of one line
        # is not fused with the first word of the next.
        words_out.write(','.join(cut) + '\n')

# Load the accumulated word list; the context manager closes the handle.
with open('D:/cihai.txt', 'r', encoding='UTF-8') as words_in:
    f = words_in.read()
print(type(f))

b_mask = imread('D:/back.JPG')
# Original author's note: the background (mask) image should be transparent,
# and a Windows font must be supplied so Chinese characters can be rendered.
# The font path is a raw string because '\W', '\F' and '\S' are not valid
# escape sequences in a normal literal.
wordcloud = WordCloud(
    font_path=r'C:\Windows\Fonts\SIMLI.ttf',
    mask=b_mask,
    background_color='white',
).generate(f)

# Draw the cloud onto the figure before showing it; without this the window
# contains only empty axes.
plt.imshow(wordcloud, interpolation='bilinear')
plt.axis('off')
plt.show()
wordcloud.to_file('test.jpg')