问题描述
# Goal: find the most frequent words in data['document_content'].
# Step 1 - normalise the raw text: lowercase it, then blank out punctuation
# and digits.
# Tokens are re-joined with a single space so that word boundaries survive;
# joining with "" would fuse every document into one giant token and make
# the later per-word steps (stop words, lemmatisation) ineffective.
data['document_content'] = data['document_content'].apply(
    lambda doc: " ".join(token.lower() for token in doc.split())
)
# regex=True is passed explicitly because pandas >= 2.0 treats the pattern as
# a literal string by default. Raw strings avoid invalid-escape warnings.
data['document_content'] = data['document_content'].str.replace(r'[^\w\s]', ' ', regex=True)
data['document_content'] = data['document_content'].str.replace(r'\d', ' ', regex=True)
# Step 2 - drop English stop words.
import nltk
nltk.download('stopwords')
from nltk.corpus import stopwords
sw = stopwords.words('english')
# `sw` stays a list for any later code that uses it, but membership is tested
# against a frozenset so each token lookup is O(1) instead of a linear scan.
_sw_lookup = frozenset(sw)
data['document_content'] = data['document_content'].apply(
    lambda doc: " ".join(token for token in doc.split() if token not in _sw_lookup)
)
# Step 3 - lemmatise every token with TextBlob's Word (downloads the WordNet
# corpus first).
from textblob import Word
nltk.download('wordnet')


def _lemmatize_document(doc):
    """Return *doc* with each whitespace-separated token lemmatised."""
    tokens = doc.split()
    lemmas = (Word(token).lemmatize() for token in tokens)
    return " ".join(lemmas)


data['document_content'] = data['document_content'].apply(_lemmatize_document)
# Step 4 - remove the standalone token "rt".
# NOTE(review): presumably this strips a retweet marker - confirm the intent.
# A plain substring replace would also hit "rt" inside ordinary words
# (e.g. "part" -> "pa "), so only whole-word matches are replaced. regex=True
# is explicit because pandas >= 2.0 defaults to literal matching.
data['document_content'] = data['document_content'].str.replace(r'\brt\b', ' ', regex=True)
data['document_content'].head()
# Step 5 - render a word cloud of the cleaned corpus.
from os import path
from PIL import Image
from wordcloud import WordCloud, STOPWORDS, ImageColorGenerator
import matplotlib.pyplot as plt
# Join the documents with a space so the last word of one document is not
# fused with the first word of the next.
text = " ".join(doc for doc in data.document_content)
# Feed the full corpus to the generator. str(Series) would pass the Series
# repr instead, which is truncated for long data and also contains index
# labels and the "Name: ..., dtype: ..." footer.
wc = WordCloud(background_color="black").generate(text)
plt.imshow(wc, interpolation="bilinear")
plt.axis("off")
plt.tight_layout(pad=1)
# NOTE(review): if the notebook prints a "Canvas(toolbar=Toolbar(...))" repr
# instead of an image, the active matplotlib backend is probably an
# interactive widget backend whose front-end extension is not loaded; running
# `%matplotlib inline` before plotting is the usual remedy - confirm in your
# environment.
plt.show()
但它没有显示图像,而只返回了 "Canvas(toolbar=Toolbar(toolitems=[('Home','Reset original view','home','home'),('Back','Back to previous ..."
解决方法
暂无找到可以解决该程序问题的有效方法,小编努力寻找整理中!
如果你已经找到好的解决方法,欢迎将解决方案带上本链接一起发送给小编。
小编邮箱:dio#foxmail.com (将#修改为@)