CCF | 可视化-词云图
示例代码
import pandas as pd
import numpy as np
from pyecharts import options as opts
from pyecharts.charts import WordCloud
# Path of the CSV file to load; later code reads its ' url' column.
inputfile = "data_m2_t1_s2.csv"
# Path handed to the chart's render() call at the end of the script.
outputfile = "image_m2_t2_s2.html"
# Load the whole CSV into a DataFrame.
df = pd.read_csv(inputfile)
def formatter(url):
    """Return the host part of *url*.

    Surrounding whitespace is stripped, everything up to and including the
    first ``://`` is dropped, and the remainder is cut at the first ``/``.

    A URL without any scheme prefix is handled (no ``IndexError``), and a
    ``https://`` that only appears later in the URL, for example inside a
    query string, is not mistaken for the scheme.

    >>> formatter(" https://example.com/a/b ")
    'example.com'
    >>> formatter("example.com/a")
    'example.com'
    """
    url = url.strip()
    # Partition on the FIRST "://" so an embedded URL cannot win over the
    # real scheme; when there is no scheme at all, keep the whole string.
    _scheme, separator, remainder = url.partition("://")
    if not separator:
        remainder = url
    return remainder.split("/", 1)[0]
# Module-level tally: host string (as produced by formatter) -> occurrence
# count. Filled in by getUrls (creates keys) and setUrl (increments them).
urlcounter = dict()
def getUrls(data):
    """Register the host of one row's URL in ``urlcounter`` with a count of 0.

    ``data`` is indexed with the key ``' url'`` (note the leading space,
    presumably matching the CSV header -- confirm against the input file).
    Hosts that are already present keep their current count. Returns None.
    """
    host = formatter(data[' url'])
    # setdefault only inserts when the host has not been seen before.
    urlcounter.setdefault(host, 0)
def setUrl(data):
    """Add one to the ``urlcounter`` entry for the host of this row's URL.

    ``data`` is indexed with the key ``' url'`` (leading space included).
    The host must already be a key of ``urlcounter``; otherwise the lookup
    raises ``KeyError``. Returns None.
    """
    host = formatter(data[' url'])
    previous = urlcounter[host]
    urlcounter[host] = previous + 1
# Two row-wise passes over the frame: the first registers every host with a
# zero count, the second adds one per row. Both callbacks work purely through
# side effects on urlcounter, so the results of apply() are discarded.
df.apply(getUrls, axis=1)
df.apply(setUrl, axis=1)
# print(urlcounter)  # uncomment to inspect the tallies

# Split the tally into parallel lists, then pair them up as (host, count)
# tuples, which is the data_pair value handed to the word cloud below.
urls = [*urlcounter]
counts = [*urlcounter.values()]
urlTuple = list(zip(urls, counts))
# Build the word cloud step by step on a 1920x1080 canvas.
_canvas = opts.InitOpts(width="1920px", height="1080px")
_cloud = WordCloud(init_opts=_canvas)
_cloud.add(series_name="统计词云图", data_pair=urlTuple)

# Chart title plus a visible visual-map control spanning counts 0..25000.
_cloud.set_global_opts(
    title_opts=opts.TitleOpts(title="统计词云图"),
    visualmap_opts=opts.VisualMapOpts(is_show=True, min_=0, max_=25000),
)

# NOTE(review): chart is bound to whatever render() returns, not to the
# WordCloud object itself (in pyecharts this looks like the output path --
# confirm against the library documentation).
chart = _cloud.render(outputfile)

效果展示

本文是原创文章,采用 CC BY-NC-ND 4.0 协议,完整转载请注明来自 Summer
评论
匿名评论
隐私政策
你无需删除空行,直接评论以获取最佳展示效果