In [None]:
from pyecharts import options as opts
from pyecharts.charts import Pie
from IPython.display import HTML

def load_dataset(file_name: str, mood_list: list, dataset_name: str) -> "HTML":
    """Count labelled samples per mood and chart each mood's share as a pie.

    Every non-blank line of ``file_name`` must look like ``<mood>:<text>``;
    only the part before the first ``:`` is used. The per-mood counts, the
    total, and the per-mood percentages are printed to stdout.

    Args:
        file_name: Path of the UTF-8 encoded corpus file.
        mood_list: Mood labels to count; also fixes the print and chart order.
        dataset_name: Title shown on the chart.

    Returns:
        An ``IPython.display.HTML`` object wrapping the rendered pie chart.
        Returning it (instead of discarding it) lets a notebook cell whose
        last expression is this call actually display the chart.

    Raises:
        KeyError: If a non-blank line has no ``:`` separator or its label is
            not in ``mood_list``.
    """
    # Only the number of samples per mood is needed, so keep counters
    # rather than storing every text.
    counts = dict.fromkeys(mood_list, 0)
    total = 0

    with open(file_name, encoding='UTF-8') as f:
        for line_no, line in enumerate(f, start=1):
            # Tolerate blank lines (e.g. a trailing empty line at EOF).
            if not line.strip():
                continue
            label, sep, _ = line.partition(':')
            if not sep or label not in counts:
                raise KeyError(
                    '{}:{}: unknown or missing mood label {!r}'.format(
                        file_name, line_no, label))
            counts[label] += 1
            total += 1

    for mood in mood_list:
        print('{}：{}'.format(mood, counts[mood]))

    print('total：{}'.format(total))
    print('#' * 40)

    mood_values = []
    for mood in mood_list:
        # An empty file would otherwise divide by zero.
        share = 100 * (counts[mood] / total) if total else 0.0
        # Chart labels print the raw value ("{c}%"), so round it there;
        # the printed table keeps four decimals.
        mood_values.append(round(share, 2))
        print('{}：{:.4f}%'.format(mood, share))

    pie = (
        Pie(init_opts=opts.InitOpts(width="100%", height="600px", bg_color="#2c343c"))
        .add("", [list(z) for z in zip(mood_list, mood_values)])
        .set_global_opts(
            title_opts=opts.TitleOpts(
                title=dataset_name,
                pos_top="10",
                pos_left="10",
                title_textstyle_opts=opts.TextStyleOpts(color="#fff", font_size=28)),
            legend_opts=opts.LegendOpts(
                pos_top="15%",
                pos_left="10",
                orient="vertical",
                textstyle_opts={"color":"white"}))
        .set_series_opts(label_opts=opts.LabelOpts(formatter="{b}: {c}%"))
    )

    return HTML(pie.render_embed())

### 🤩Weibo Emotion Corpus 七分类多情感分析

2016 年香港理工大学（The Hong Kong Polytechnic University）微博语料，标注了 7 种情感（emotions）：like、disgust、happiness、sadness、anger、surprise、fear。
- 数据条目：39661条
- 论文地址：http://www.lrec-conf.org/proceedings/lrec2016/pdf/515_Paper.pdf
- 数据地址：https://github.com/hehuihui1994/emotion_corpus_weibo/blob/master/emotion_corpus_microblog.txt
- 文件名称：emotion_corpus_microblog.txt
- 文件大小：5.50MB
- 来源：香港理工大学

> happiness: 9959<br>
> disgust: 4876<br>
> like: 4540<br>
> fear: 661<br>
> sadness: 14052<br>
> anger: 4562<br>
> surprise: 1011<br>

In [None]:
# Print per-mood counts for the seven-label corpus and build its pie chart.
load_dataset(
    file_name="emotion_corpus_microblog.txt",
    mood_list=['anger', 'disgust', 'happiness', 'like', 'sadness', 'fear', 'surprise'],
    dataset_name="Weibo Emotion Corpus",
)

### 🧐simplifyweibo_8_moods 八分类多情感分析

八分类情感分类数据集，标注中包含 none 类别。
- 数据条目：26462条数据
- 文件名称：simplifyweibo_8_moods.txt
- 文件大小：2.20MB
- 来源：CSDN

> happiness：1456<br>
> disgust：2008<br>
> like：2446<br>
> fear：230<br>
> sadness：1676<br>
> anger：1436<br>
> surprise：620<br>
> none：16590<br>

In [None]:
# Print per-mood counts for the eight-label corpus (includes 'none') and
# build its pie chart.
load_dataset(
    file_name="simplifyweibo_8_moods.txt",
    mood_list=['anger', 'disgust', 'happiness', 'like', 'sadness', 'fear', 'surprise', 'none'],
    dataset_name="simplifyweibo_8_moods",
)

### 🧐Nlpcc2014Train 八分类多情感分析

NLPCC 2014 八分类情感分类数据集，标注中包含 none 类别，并包含 NLPCC 2013 的数据。
- 数据条目：48875条
- 文件名称：Nlpcc2014Train.txt
- 文件大小：4.12MB
- 来源：Nlpcc

> happiness：3192<br>
> disgust：3433<br>
> like：4921<br>
> fear：332<br>
> sadness：2787<br>
> anger：2138<br>
> surprise：901<br>
> none：31171<br>

In [None]:
# Print per-mood counts for the NLPCC 2014 training set (eight labels,
# includes 'none') and build its pie chart.
load_dataset(
    file_name="Nlpcc2014Train.txt",
    mood_list=['anger', 'disgust', 'happiness', 'like', 'sadness', 'fear', 'surprise', 'none'],
    dataset_name="Nlpcc2014Train",
)