# -*- coding: utf-8 -*-
"""
Created on Mon Oct 1 12:13:11 2018

@author: Luove
"""

import os

import jieba
import pandas as pd
from gensim import corpora, models

# Work from the book's demo code directory so the relative '../data' paths
# below resolve. The path is a raw string because its backslashes (\A, \P,
# \B, \c, \d) would otherwise be parsed as invalid escape sequences.
os.chdir(r'D:\Analyze\Python Matlab\Python\BookCodes\Python数据分析与挖掘实战\图书配套数据、代码\chapter15\demo\code')
filepath = '../data/huizong.csv'
data = pd.read_csv(filepath)
data.head()  # no visible effect in a script; kept for interactive inspection

# Keep only the review column ('评论') of the rows whose brand ('品牌') is '美的'.
data_target = data.loc[data['品牌'] == '美的', ['评论']]
# set(data['品牌'])  # uncomment to inspect the distinct brand values
count_1 = len(data_target)  # 55774 in the original author's run
# unique() returns an array after de-duplication, so wrap it in a DataFrame again.
data_target = pd.DataFrame(data_target['评论'].unique())
count_2 = len(data_target)  # 53049 in the original author's run
same_comment_count = count_1 - count_2  # number of duplicated reviews: 2725, about 5%

# Output of the ROSTCM6 software's sentiment-orientation analysis, which labels
# reviews negative / neutral / positive; only negative and positive are studied here.
inputfile1 = '../data/meidi_jd_process_end_负面情感结果.txt'
25 i