import pandas as pd
import matplotlib.pyplot as plt
# Load the movie-score table from the local CSV file.
reviews = pd.read_csv("D:\\test\\fandango_scores.csv")

# Score columns that the rest of the script works with.
clos = [
    "Fandango_Ratingvalue",
    "RT_norm",
    "IMDB_norm",
    "RT_norm_round",
    "Metacritic_norm_round",
]
reviews_num = reviews[clos]

# How often each distinct Fandango rating value occurs.  Despite its name,
# `dis_imdb` is built from the "Fandango_Ratingvalue" column; `dis_index`
# is the same table re-ordered by rating value.
dis_imdb = reviews_num["Fandango_Ratingvalue"].value_counts()
dis_index = dis_imdb.sort_index()

# Show the frequency-ordered table first, then the rating-ordered one.
print(dis_imdb, dis_index, sep="\n")
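# Output of print(dis_imdb) -- rating value and count, most frequent first:
# 4.1 16
# 3.9 12
# 4.2 12
# 4.3 11
# 3.4 9
# 4.5 9
# 3.5 9
# 3.7 9
# 3.6 8
# 4.0 7
# 4.4 7
# 3.2 5
# 2.9 5
# 3.8 5
# 3.3 4
# 3.0 4
# 4.6 4
# 3.1 3
# 4.8 3
# 2.8 2
# 2.7 2
# Name: Fandango_Ratingvalue, dtype: int64
#
# Output of print(dis_index) -- the same counts ordered by rating value:
# 2.7 2
# 2.8 2
# 2.9 5
# 3.0 4
# 3.1 3
# 3.2 5
# 3.3 4
# 3.4 9
# 3.5 9
# 3.6 8
# 3.7 9
# 3.8 5
# 3.9 12
# 4.0 7
# 4.1 16
# 4.2 12
# 4.3 11
# 4.4 7
# 4.5 9
# 4.6 4
# 4.8 3
# Name: Fandango_Ratingvalue, dtype: int64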
# Histogram of the Fandango rating values, 20 bins over the interval 4-5.
# NOTE(review): values outside range=(4, 5) are not drawn, so ratings
# below 4 are left out of this plot -- confirm that is intended.
fig, ax = plt.subplots()
ax.hist(
    reviews_num["Fandango_Ratingvalue"],
    bins=20,
    range=(4, 5),
)
plt.show()
# Two stacked histograms drawn with identical binning (20 bins over 0-5)
# and an identical y-axis limit (0-50).
fig = plt.figure(figsize=(5, 20))

# The layout is a 4-row, 1-column grid; only the first two slots are used.
ax1, ax2 = (fig.add_subplot(4, 1, slot) for slot in (1, 2))

for panel, column in ((ax1, "Fandango_Ratingvalue"), (ax2, "RT_norm")):
    panel.hist(reviews_num[column], bins=20, range=(0, 5))
    # NOTE(review): both panels carry the same title, so the figure does
    # not say which column each histogram shows -- confirm this is wanted.
    panel.set_title("Distribution Rating")
    panel.set_ylim(0, 50)

plt.show()
# Box plot of the single "RT_norm" column, y-axis fixed to 0-5.
fig, ax = plt.subplots()
ax.boxplot(reviews_num["RT_norm"])
ax.set_xticklabels(["RT_norm"])
ax.set_ylim(bottom=0, top=5)
plt.show()
# Side-by-side box plots, one per column listed in `clos`, y-axis fixed
# to 0-5.
fig, ax = plt.subplots()

# Pass the selected columns as a plain 2-D array: one box per column.
ax.boxplot(reviews_num[clos].values)

# Label each box with its column name; rotated so the long names fit.
ax.set_xticklabels(clos, rotation=90)
ax.set_ylim(bottom=0, top=5)
plt.show()