# Dataset source: https://github.com/ranran4082391/restaurant-comments
import pandas as pd
from dateutil import parser
from snownlp import SnowNLP
import matplotlib.pyplot as plt
import numpy as np
# Load the review data from an Excel workbook; the relative path is resolved
# against the current working directory. Later code reads its `comments` column.
df = pd.read_excel('restaurant-comments.xlsx')
# Disabled step: would replace the `date` column with values parsed by
# dateutil's parser.parse. It is left off, so `date` stays as loaded.
#df["date"] = df.date.apply(parser.parse)
def get_sentiment_cn(text):
    """Return the SnowNLP sentiment score for *text*.

    The text is wrapped in a ``SnowNLP`` object and its ``sentiments``
    attribute is returned unchanged. Per SnowNLP's documentation this is the
    estimated probability (0 to 1) that the text is positive.
    """
    return SnowNLP(text).sentiments
# Kept next to its only use, as in the original script, so this section stays
# self-contained.
from sklearn.cluster import KMeans

# Score every comment and store the result as a new "sentiment" column.
df["sentiment"] = df.comments.apply(get_sentiment_cn)

# Two features per comment: its sentiment score and its row position.
# The row position stands in for time, since the `date` column is not parsed.
# NOTE(review): this presumes rows are in chronological order -- confirm
# against the workbook.
sentiment_point = df["sentiment"].values
times_point = np.arange(len(sentiment_point))
print(sentiment_point.shape)
print(times_point.shape)

# Shape (n_comments, 2): column 0 = sentiment, column 1 = row index.
X = np.vstack((sentiment_point, times_point)).T
print(X.shape)

# K-means uses Euclidean distance, so the row index (0..N-1) would swamp the
# sentiment score (0..1) and the clusters would just split the rows by index.
# Standardize each column to zero mean / unit variance before clustering.
col_std = X.std(axis=0)
col_std[col_std == 0] = 1.0  # constant column: avoid dividing by zero
X_scaled = (X - X.mean(axis=0)) / col_std

# n_init is pinned because scikit-learn's default changed between releases;
# together with random_state this keeps the labels reproducible.
y_pred = KMeans(n_clusters=2, n_init=10, random_state=9).fit_predict(X_scaled)

# Plot in the original (unscaled) units, coloured by cluster label.
plt.scatter(X[:, 0], X[:, 1], c=y_pred)
plt.xlabel("sentiment")
plt.ylabel("comment index")
plt.show()