import pandas as pd
# Load both rating datasets from the CSV files in the working directory.
fandango_before, fandango_16_17 = (
    pd.read_csv(csv_name)
    for csv_name in ('fandango_score_comparison.csv', 'movie_ratings_16_17.csv')
)


# Preview the first five rows of the earlier dataset.
print(fandango_before.head(n=5))

                             FILM  RottenTomatoes  RottenTomatoes_User  \
0  Avengers: Age of Ultron (2015)              74                   86   
1               Cinderella (2015)              85                   80   
2                  Ant-Man (2015)              80                   90   
3          Do You Believe? (2015)              18                   84   
4   Hot Tub Time Machine 2 (2015)              14                   28   

   Metacritic  Metacritic_User  IMDB  Fandango_Stars  Fandango_Ratingvalue  \
0          66              7.1   7.8             5.0                   4.5   
1          67              7.5   7.1             5.0                   4.5   
2          64              8.1   7.8             5.0                   4.5   
3          22              4.7   5.4             5.0                   4.5   
4          29              3.4   5.1             3.5                   3.0   

   RT_norm  RT_user_norm         ...           IMDB_norm  RT_norm_round  \
0     3.70           4.3         ...                3.90            3.5   
1     4.25           4.0         ...                3.55            4.5   
2     4.00           4.5         ...                3.90            4.0   
3     0.90           4.2         ...                2.70            1.0   
4     0.70           1.4         ...                2.55            0.5   

   RT_user_norm_round  Metacritic_norm_round  Metacritic_user_norm_round  \
0                 4.5                    3.5                         3.5   
1                 4.0                    3.5                         4.0   
2                 4.5                    3.0                         4.0   
3                 4.0                    1.0                         2.5   
4                 1.5                    1.5                         1.5   

   IMDB_norm_round  Metacritic_user_vote_count  IMDB_user_vote_count  \
0              4.0                        1330                271107   
1              3.5                         249                 65709   
2              4.0                         627                103660   
3              2.5                          31                  3136   
4              2.5                          88                 19560   

   Fandango_votes  Fandango_Difference  
0           14846                  0.5  
1           12640                  0.5  
2           12055                  0.5  
3            1793                  0.5  
4            1021                  0.5  

[5 rows x 22 columns]


# Preview the first five rows of the 2016-2017 dataset.
print(fandango_16_17.head(n=5))

                     movie  year  metascore  imdb  tmeter  audience  fandango  \
0      10 Cloverfield Lane  2016         76   7.2      90        79       3.5   
1                 13 Hours  2016         48   7.3      50        83       4.5   
2      A Cure for Wellness  2016         47   6.6      40        47       3.0   
3          A Dog's Purpose  2017         43   5.2      33        76       4.5   
4  A Hologram for the King  2016         58   6.1      70        57       3.0   

   n_metascore  n_imdb  n_tmeter  n_audience  nr_metascore  nr_imdb  \
0         3.80    3.60      4.50        3.95           4.0      3.5   
1         2.40    3.65      2.50        4.15           2.5      3.5   
2         2.35    3.30      2.00        2.35           2.5      3.5   
3         2.15    2.60      1.65        3.80           2.0      2.5   
4         2.90    3.05      3.50        2.85           3.0      3.0   

   nr_tmeter  nr_audience  
0        4.5          4.0  
1        2.5          4.0  
2        2.0          2.5  
3        1.5          4.0  
4        3.5          3.0


# Keep only the film title and the Fandango-related columns.
fd_rev = fandango_before[[
    'FILM',
    'Fandango_Stars',
    'Fandango_Ratingvalue',
    'Fandango_votes',
    'Fandango_Difference',
]]
fd_rev.head(n=5)


# Keep only the title, release year and Fandango rating columns.
fd_16_17_rev = fandango_16_17[[
    'movie',
    'year',
    'fandango',
]]
fd_16_17_rev.head(n=5)


# Draw ten rows at random; the fixed seed makes the draw reproducible.
fd_16_17_rev.sample(n=10, random_state=1)


# Number of films in fd_rev with fewer than 30 Fandango votes.
len(fd_rev[fd_rev['Fandango_votes'] < 30])

0


# Keep only the films whose title carries the literal "(2015)" release tag.
# A plain '2015' pattern would also match titles that merely contain those
# digits; regex=False treats the parentheses literally, and na=False turns a
# missing title into "no match" instead of an invalid boolean mask.
fd_2015 = fd_rev[fd_rev['FILM'].str.contains('(2015)', regex=False, na=False)]
fd_2015


# Restrict the 2016-2017 sample to rows whose year is 2016, then confirm
# that no other year is left.
fd_2016 = fd_16_17_rev[fd_16_17_rev['year'].eq(2016)]
fd_2016['year'].value_counts()

2016    191
Name: year, dtype: int64


# Display the 2016 subset for a visual check.
fd_2016


import matplotlib.pyplot as plt
import seaborn as sns
import numpy as np
%matplotlib inline
# Kernel density plots of the 2015 and 2016 Fandango star ratings, drawn on
# the same axes so the two distribution shapes can be compared.
plt.style.use('fivethirtyeight')

plt.figure(figsize=(8, 5.5))
fd_2015['Fandango_Stars'].plot.kde(label='2015_Rating', legend=True)
fd_2016['fandango'].plot.kde(label='2016_Rating', legend=True)
# np.arange excludes its stop value, so stop at 5.5 to keep a tick at 5.0,
# the upper end of the x-axis range.
plt.xticks(np.arange(0, 5.5, 0.5))
plt.xlim((0, 5.0))
plt.xlabel('Stars')
plt.title('Comparing Distribution Shapes for 2015 and 2016')

<matplotlib.text.Text at 0x7f7f9bba1780>


# Absolute frequency of each 2015 star rating, ordered by rating. Sorting by
# count is skipped because the index sort decides the final order anyway.
fd_2015['Fandango_Stars'].value_counts(sort=False).sort_index()

3.0    11
3.5    23
4.0    37
4.5    49
5.0     9
Name: Fandango_Stars, dtype: int64


# Absolute frequency of each 2016 star rating, ordered by rating. Sorting by
# count is skipped because the index sort decides the final order anyway.
fd_2016['fandango'].value_counts(sort=False).sort_index()

2.5     6
3.0    14
3.5    46
4.0    77
4.5    47
5.0     1
Name: fandango, dtype: int64


# Share of each 2015 star rating as a percentage, ordered by rating.
fd_2015['Fandango_Stars'].value_counts(normalize=True).mul(100).sort_index()

3.0     8.527132
3.5    17.829457
4.0    28.682171
4.5    37.984496
5.0     6.976744
Name: Fandango_Stars, dtype: float64


# Share of each 2016 star rating as a percentage, ordered by rating.
fd_2016['fandango'].value_counts(normalize=True).mul(100).sort_index()

2.5     3.141361
3.0     7.329843
3.5    24.083770
4.0    40.314136
4.5    24.607330
5.0     0.523560
Name: fandango, dtype: float64


# Mean, median and mode of the star ratings for each year. mode() returns a
# Series because several values can tie; the first entry is the one used.
mean_fd_2015, med_fd_2015, mode_fd_2015 = (
    fd_2015['Fandango_Stars'].mean(),
    fd_2015['Fandango_Stars'].median(),
    fd_2015['Fandango_Stars'].mode().iloc[0],
)

mean_fd_2016, med_fd_2016, mode_fd_2016 = (
    fd_2016['fandango'].mean(),
    fd_2016['fandango'].median(),
    fd_2016['fandango'].mode().iloc[0],
)


# Collect the summary statistics into one table: one row per statistic,
# one column per year.
summary_df = pd.DataFrame(
    {
        '2015': [mean_fd_2015, med_fd_2015, mode_fd_2015],
        '2016': [mean_fd_2016, med_fd_2016, mode_fd_2016],
    },
    index=['mean', 'median', 'mode'],
)

summary_df.head()


# Grouped bar chart comparing the mean, median and mode of the 2015 and 2016
# star ratings stored in summary_df.
plt.style.use('fivethirtyeight')
plt.figure(figsize=(8, 5))

# Draw both years in one grouped call so the bars sit side by side. Plotting
# the two columns separately with equal widths, one align='center' and one
# align='edge', anchors both on the same tick, so the 2016 bars cover half of
# every 2015 bar.
summary_df[['2015', '2016']].plot.bar(
    ax=plt.gca(),
    width=0.6,
    color=['blue', '#cc0000'],
    rot=0,
)
plt.ylim((0.0, 5.0))
plt.yticks(np.arange(0.0, 5.5, 0.5))
plt.title('Comparing summary statistics: 2015 vs 2016', y=1.08, fontdict={'size': '18', 'fontweight': 'normal'})
plt.ylabel('Stars')
plt.xticks(rotation=0)
plt.legend(loc='upper center')

<matplotlib.legend.Legend at 0x7f7f9ba89f60>

	2015	2016
mean	4.085271	3.887435
median	4.000000	4.000000
mode	4.500000	4.000000

Is Fandango Still Inflating Ratings?

Changing the Goal of our Analysis

Isolating the Samples We Need

Comparing Distribution Shapes for 2015 and 2016

Comparing Relative Frequencies

Confirming the direction of difference with summary stats

Conclusion:

	FILM	Fandango_Stars	Fandango_Ratingvalue	Fandango_votes	Fandango_Difference
0	Avengers: Age of Ultron (2015)	5.0	4.5	14846	0.5
1	Cinderella (2015)	5.0	4.5	12640	0.5
2	Ant-Man (2015)	5.0	4.5	12055	0.5
3	Do You Believe? (2015)	5.0	4.5	1793	0.5
4	Hot Tub Time Machine 2 (2015)	3.5	3.0	1021	0.5

	movie	year	fandango
0	10 Cloverfield Lane	2016	3.5
1	13 Hours	2016	4.5
2	A Cure for Wellness	2016	3.0
3	A Dog's Purpose	2017	4.5
4	A Hologram for the King	2016	3.0

	movie	year	fandango
108	Mechanic: Resurrection	2016	4.0
206	Warcraft	2016	4.0
106	Max Steel	2016	3.5
107	Me Before You	2016	4.5
51	Fantastic Beasts and Where to Find Them	2016	4.5
33	Cell	2016	3.0
59	Genius	2016	3.5
152	Sully	2016	4.5
4	A Hologram for the King	2016	3.0
31	Captain America: Civil War	2016	4.5

	FILM	Fandango_Stars	Fandango_Ratingvalue	Fandango_votes	Fandango_Difference
0	Avengers: Age of Ultron (2015)	5.0	4.5	14846	0.5
1	Cinderella (2015)	5.0	4.5	12640	0.5
2	Ant-Man (2015)	5.0	4.5	12055	0.5
3	Do You Believe? (2015)	5.0	4.5	1793	0.5
4	Hot Tub Time Machine 2 (2015)	3.5	3.0	1021	0.5
5	The Water Diviner (2015)	4.5	4.0	397	0.5
6	Irrational Man (2015)	4.0	3.5	252	0.5
8	Shaun the Sheep Movie (2015)	4.5	4.0	896	0.5
9	Love & Mercy (2015)	4.5	4.0	864	0.5
10	Far From The Madding Crowd (2015)	4.5	4.0	804	0.5
11	Black Sea (2015)	4.0	3.5	218	0.5
15	Taken 3 (2015)	4.5	4.1	6757	0.4
16	Ted 2 (2015)	4.5	4.1	6437	0.4
17	Southpaw (2015)	5.0	4.6	5597	0.4
19	Pixels (2015)	4.5	4.1	3886	0.4
20	McFarland, USA (2015)	5.0	4.6	3364	0.4
21	Insidious: Chapter 3 (2015)	4.5	4.1	3276	0.4
22	The Man From U.N.C.L.E. (2015)	4.5	4.1	2686	0.4
23	Run All Night (2015)	4.5	4.1	2066	0.4
24	Trainwreck (2015)	4.5	4.1	8381	0.4
26	Ex Machina (2015)	4.5	4.1	3458	0.4
27	Still Alice (2015)	4.5	4.1	1258	0.4
29	The End of the Tour (2015)	4.5	4.1	121	0.4
30	Red Army (2015)	4.5	4.1	54	0.4
31	When Marnie Was There (2015)	4.5	4.1	46	0.4
32	The Hunting Ground (2015)	4.5	4.1	42	0.4
33	The Boy Next Door (2015)	4.0	3.6	2800	0.4
34	Aloha (2015)	3.5	3.1	2284	0.4
35	The Loft (2015)	4.0	3.6	811	0.4
36	5 Flights Up (2015)	4.0	3.6	79	0.4
...	...	...	...	...	...
115	While We're Young (2015)	3.0	2.9	449	0.1
116	Clouds of Sils Maria (2015)	3.5	3.4	162	0.1
117	Testament of Youth (2015)	4.0	3.9	127	0.1
118	Infinitely Polar Bear (2015)	4.0	3.9	124	0.1
119	Phoenix (2015)	3.5	3.4	70	0.1
120	The Wolfpack (2015)	3.5	3.4	66	0.1
121	The Stanford Prison Experiment (2015)	4.0	3.9	51	0.1
122	Tangerine (2015)	4.0	3.9	36	0.1
123	Magic Mike XXL (2015)	4.5	4.4	9363	0.1