示例代码

import pandas as pd
import numpy as np

from pyecharts import options as opts
from pyecharts.charts import WordCloud

# Source CSV to read and the HTML file the rendered chart is written to.
inputfile = "data_m2_t1_s2.csv"
outputfile = "image_m2_t2_s2.html"

# Load the whole CSV into a DataFrame; later code reads its '  url' column.
df = pd.read_csv(filepath_or_buffer=inputfile)

def formatter(url):
    """Return the host portion of *url*.

    Surrounding whitespace is stripped, a leading ``https://`` or ``http://``
    scheme is removed, and everything from the first ``/`` onwards is dropped.

    Args:
        url: The URL string to reduce to its host.

    Returns:
        The text between the scheme and the first ``/``. A URL without a
        recognised scheme is treated as already scheme-less, so its first
        ``/``-separated segment is returned.
    """
    url = url.strip()
    # Only strip a scheme at the very start: a scheme embedded later in the
    # URL (e.g. inside a query string) must not be mistaken for the real one.
    for scheme in ("https://", "http://"):
        if url.startswith(scheme):
            url = url[len(scheme):]
            break
    return url.split("/", 1)[0]

# Module-level tally mapping each host string to its occurrence count.
urlcounter = {}

def getUrls(data):
    """Register the host of the row's URL in ``urlcounter`` with a zero count.

    Args:
        data: A row-like mapping whose ``'  url'`` entry (the key has two
            leading spaces) holds the URL string.

    A host that is already present keeps its current count.
    """
    host = formatter(data['  url'])
    # setdefault only inserts when the key is missing.
    urlcounter.setdefault(host, 0)

def setUrl(data):
    """Add one to the ``urlcounter`` entry for the host of the row's URL.

    Args:
        data: A row-like mapping whose ``'  url'`` entry (the key has two
            leading spaces) holds the URL string.
    """
    url = formatter(data['  url'])
    # Start from 0 when the host has not been registered yet, so this does
    # not raise KeyError if it runs before (or without) getUrls.
    urlcounter[url] = urlcounter.get(url, 0) + 1

# Tally hosts over every row: getUrls registers each host with a zero count,
# then setUrl adds one per row.
df.apply(getUrls, axis=1)
df.apply(setUrl, axis=1)

urls = list(urlcounter)
counts = list(urlcounter.values())

# (host, count) pairs in the dict's iteration order, used as the chart data.
urlTuple = list(urlcounter.items())

# Build a 1920px x 1080px word cloud from the (host, count) pairs and write it
# to `outputfile`.
_canvas_opts = opts.InitOpts(width="1920px", height="1080px")
_title_opts = opts.TitleOpts(title="统计词云图")
_visualmap_opts = opts.VisualMapOpts(is_show=True, min_=0, max_=25000)

_cloud = WordCloud(init_opts=_canvas_opts)
_cloud = _cloud.add(data_pair=urlTuple, series_name="统计词云图")
_cloud = _cloud.set_global_opts(title_opts=_title_opts,
                                visualmap_opts=_visualmap_opts)

# NOTE: `chart` is bound to whatever render() returns, not to the WordCloud
# object itself.
chart = _cloud.render(outputfile)

效果展示