# Silence all warnings for the rest of the session so that library
# notices do not clutter the output of the cells below.
import warnings

# Only the 'ignore' filter is installed: filterwarnings() inserts new
# entries at the front of the filter list, so a preceding 'always' filter
# would be shadowed by this one and never take effect.
warnings.filterwarnings('ignore')
import csv
import numpy as np
import pandas as pd
import matplotlib.pyplot as plt
import seaborn as sns
import jieba
import PIL.Image as Image
from jieba import analyse
from wordcloud import WordCloud
from snownlp import SnowNLP
%matplotlib inline
<class 'pandas.core.frame.DataFrame'>
RangeIndex: 23486 entries, 0 to 23485
Data columns (total 11 columns):
Unnamed: 0 23486 non-null int64
Clothing ID 23486 non-null int64
Age 23486 non-null int64
Title 19676 non-null object
Review Text 22641 non-null object
Rating 23486 non-null int64
Recommended IND 23486 non-null int64
Positive Feedback Count 23486 non-null int64
Division Name 23472 non-null object
Department Name 23472 non-null object
Class Name 23472 non-null object
dtypes: int64(6), object(5)
memory usage: 2.0+ MB
time: 14 ms
观察数据是否缺失
# Count the missing (NaN/None) entries in each column of df.
df.isna().sum()
Unnamed: 0 0
Clothing ID 0
Age 0
Title 3810
Review Text 845
Rating 0
Recommended IND 0
Positive Feedback Count 0
Division Name 14
Department Name 14
Class Name 14
dtype: int64
time: 12.5 ms