Data¶
In [2]:
# Read the score-comparison CSV into `reviews`; the path is relative, so the
# file must sit in the notebook's working directory.
reviews = pd.read_csv("fandango_score_comparison.csv")
In [4]:
# Preview the first rows of the loaded data (bare last expression -> rich display).
reviews.head()
Out[4]:
In [7]:
# Columns to carry forward: the film title plus the four rating columns.
# NOTE(review): 'Metacritic_user_nom' (no "r") is used consistently in this
# notebook, so it presumably matches the CSV header — do not "correct" it.
cols = [
    'FILM',
    'RT_user_norm',
    'Metacritic_user_nom',
    'IMDB_norm',
    'Fandango_Ratingvalue',
]
norm_reviews = reviews.loc[:, cols]
norm_reviews.head()
Out[7]:
Frequency counts¶
In [14]:
# Count how many times each distinct value occurs in the Fandango and IMDB
# columns, then order the counts by value (the index) rather than by count.
fandango_distribution, imdb_distribution = (
    norm_reviews[column].value_counts().sort_index()
    for column in ('Fandango_Ratingvalue', 'IMDB_norm')
)
print(fandango_distribution, imdb_distribution, sep="\n")
Histogram¶
In [18]:
# Histogram of the Fandango rating column over the 0-5 range, using
# matplotlib's default number of bins.
fig, ax = plt.subplots()
ax.hist(norm_reviews['Fandango_Ratingvalue'], range=(0, 5))
# Label the figure so it can be read without the surrounding code.
ax.set_title("Distribution of Fandango Ratings")
ax.set_xlabel("Fandango_Ratingvalue")
ax.set_ylabel("Frequency")
plt.show()
In [19]:
# Same histogram as before, but with 20 bins across the 0-5 range
# (bin width 0.25) for a finer-grained view.
fig, ax = plt.subplots()
ax.hist(norm_reviews['Fandango_Ratingvalue'], range=(0, 5), bins=20)
# Label the figure so it can be read without the surrounding code.
ax.set_title("Distribution of Fandango Ratings (20 bins)")
ax.set_xlabel("Fandango_Ratingvalue")
ax.set_ylabel("Frequency")
plt.show()
In [25]:
# 2x2 grid of histograms, one per rating column. Every panel uses the same
# range, bin count and y-limits so the four distributions can be compared
# directly.
fig = plt.figure(figsize=(15, 8))
# Subplot positions 1..4 fill the grid row by row; the ax1..ax4 names are kept
# so any later cell that refers to them still works.
ax1, ax2, ax3, ax4 = (fig.add_subplot(2, 2, position) for position in range(1, 5))

# (axes, column to plot, panel title) — one entry per panel instead of four
# copy-pasted stanzas.
panels = [
    (ax1, "Fandango_Ratingvalue", "Distribution of Fandango Ratings"),
    (ax2, "RT_user_norm", "Distribution of Rotten Tomatoes Ratings"),
    (ax3, "Metacritic_user_nom", "Distribution of Metacritic Ratings"),
    (ax4, "IMDB_norm", "Distribution of IMDB Ratings"),
]
for panel_ax, column, title in panels:
    panel_ax.hist(norm_reviews[column], range=(0, 5), bins=20)
    panel_ax.set_ylim(0, 50)
    panel_ax.set_title(title)

# Render explicitly so the cell's output is the figure rather than the repr of
# the last set_title() call.
plt.show()
Out[25]:
Boxplot¶
In [26]:
# Box plot of the Rotten Tomatoes user rating column, with the y-axis pinned
# to the 0-5 range.
fig, ax = plt.subplots()
ax.boxplot(norm_reviews["RT_user_norm"])
ax.set_ylim(0, 5)
ax.set_xticklabels(["Rotten Tomatoes"])
# Render explicitly, as the other plotting cells do, so the cell does not echo
# the list returned by set_xticklabels().
plt.show()
Out[26]:
Multiple Boxplots¶
In [29]:
# Side-by-side box plots, one per rating column, on a common 0-5 y-axis.
num_cols = [
    'RT_user_norm',
    'Metacritic_user_nom',
    'IMDB_norm',
    'Fandango_Ratingvalue',
]
fig, ax = plt.subplots(figsize=(10, 8))
# Passing the 2-D array draws one box per column, in num_cols order.
ax.boxplot(norm_reviews[num_cols].values)
ax.set_ylim(0, 5)
# Column names are long, so rotate the tick labels to stop them overlapping.
ax.set_xticklabels(num_cols, rotation=90)
plt.show()
No comments :
Post a Comment