酒店评论情感分析
数据集位于链接:
提取码: 8w6p
import pandas as pd
import jieba
# Load the hotel review file; the steps below rely on its 'label' column.
data = pd.read_csv('../data_test/htl_all.csv')
# Class distribution before balancing (only displayed in an interactive session).
data['label'].value_counts()
# Balance the classes: keep every label-0 row plus an equal number of the
# last remaining rows. Selecting by label rather than by position keeps the
# result balanced even when the label-0 rows are not all stored at the end of
# the file; when they are, this selects exactly the same rows as
# data.tail(2 * n_negative). sort_index() restores the original file order.
is_negative = data['label'] == 0
data = pd.concat(
    [data[~is_negative].tail(is_negative.sum()), data[is_negative]]
).sort_index()
# Class distribution after balancing.
data['label'].value_counts()
1 2443
0 2443
Name: label, dtype: int64
# Load the user-defined dictionary file ./mydict.txt into jieba (path is
# relative to the current working directory).
jieba.load_userdict('./mydict.txt')
def func(item)