In [2]:
import pandas as pd 
import numpy as np
import matplotlib.pyplot as plt 
import seaborn as sns 
%matplotlib inline 
import plotly.graph_objects as go
import plotly.express as pex
import plotly.offline as py
from plotly.offline import init_notebook_mode, iplot
from plotly.subplots import make_subplots
import calmap
import squarify
from wordcloud import WordCloud, STOPWORDS, ImageColorGenerator
from collections import Counter

In [4]:
disney_plus = pd.read_csv('Resources/disney_plus_shows.csv')

disney_plus.head()

Unnamed: 0,imdb_id,title,plot,type,rated,year,released_at,added_at,runtime,genre,director,writer,actors,language,country,awards,metascore,imdb_rating,imdb_votes
0,tt0147800,10 Things I Hate About You,"A pretty, popular teenager can't go out on a d...",movie,PG-13,1999,31 Mar 1999,"November 12, 2019",97 min,"Comedy, Drama, Romance",Gil Junger,"Karen McCullah, Kirsten Smith","Heath Ledger, Julia Stiles, Joseph Gordon-Levi...","English, French",USA,2 wins & 13 nominations.,70.0,7.3,281399
1,tt7019028,101 Dalmatian Street,This series follows the lives of Delilah and D...,series,,2018–,25 Mar 2019,"February 28, 2020",,"Animation, Comedy, Family",,,"Josh Brener, Michaela Dietz, Bert Davis, Abiga...",English,"UK, USA, Canada",,,6.2,124
2,tt0115433,101 Dalmatians,An evil high-fashion designer plots to steal D...,movie,G,1996,27 Nov 1996,"November 12, 2019",103 min,"Adventure, Comedy, Crime, Family",Stephen Herek,"Dodie Smith (novel), John Hughes (screenplay)","Glenn Close, Jeff Daniels, Joely Richardson, J...","English, Spanish","USA, UK",Nominated for 1 Golden Globe. Another 3 wins &...,49.0,5.7,96739
3,tt0324941,101 Dalmatians 2: Patch's London Adventure,"Being one of 101 takes its toll on Patch, who ...",movie,G,2002,21 Jan 2003,"November 12, 2019",74 min,"Animation, Adventure, Comedy, Family, Musical","Jim Kammerud, Brian Smith","Jim Kammerud (story), Dan Root (story), Garret...","Barry Bostwick, Jason Alexander, Martin Short,...",English,USA,5 wins & 10 nominations.,,5.8,7299
4,tt0211181,102 Dalmatians,Cruella DeVil gets out of prison and goes afte...,movie,G,2000,22 Nov 2000,"November 12, 2019",100 min,"Adventure, Comedy, Family",Kevin Lima,"Dodie Smith (novel), Kristen Buckley (story), ...","Glenn Close, Gérard Depardieu, Ioan Gruffudd, ...",English,"USA, UK",Nominated for 1 Oscar. Another 1 win & 7 nomin...,35.0,4.9,33164


In [5]:
disney_plus.shape

(954, 19)

In [8]:
disney_df = disney_plus[['title','type','rated','added_at', 'genre','director','actors','country']]

disney_df.head()

Unnamed: 0,title,type,rated,added_at,genre,director,actors,country
0,10 Things I Hate About You,movie,PG-13,"November 12, 2019","Comedy, Drama, Romance",Gil Junger,"Heath Ledger, Julia Stiles, Joseph Gordon-Levi...",USA
1,101 Dalmatian Street,series,,"February 28, 2020","Animation, Comedy, Family",,"Josh Brener, Michaela Dietz, Bert Davis, Abiga...","UK, USA, Canada"
2,101 Dalmatians,movie,G,"November 12, 2019","Adventure, Comedy, Crime, Family",Stephen Herek,"Glenn Close, Jeff Daniels, Joely Richardson, J...","USA, UK"
3,101 Dalmatians 2: Patch's London Adventure,movie,G,"November 12, 2019","Animation, Adventure, Comedy, Family, Musical","Jim Kammerud, Brian Smith","Barry Bostwick, Jason Alexander, Martin Short,...",USA
4,102 Dalmatians,movie,G,"November 12, 2019","Adventure, Comedy, Family",Kevin Lima,"Glenn Close, Gérard Depardieu, Ioan Gruffudd, ...","USA, UK"


In [10]:
disney_df['added_at'] = pd.to_datetime(disney_df['added_at'])

disney_df.head()



A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: http://pandas.pydata.org/pandas-docs/stable/indexing.html#indexing-view-versus-copy



Unnamed: 0,title,type,rated,added_at,genre,director,actors,country
0,10 Things I Hate About You,movie,PG-13,2019-11-12,"Comedy, Drama, Romance",Gil Junger,"Heath Ledger, Julia Stiles, Joseph Gordon-Levi...",USA
1,101 Dalmatian Street,series,,2020-02-28,"Animation, Comedy, Family",,"Josh Brener, Michaela Dietz, Bert Davis, Abiga...","UK, USA, Canada"
2,101 Dalmatians,movie,G,2019-11-12,"Adventure, Comedy, Crime, Family",Stephen Herek,"Glenn Close, Jeff Daniels, Joely Richardson, J...","USA, UK"
3,101 Dalmatians 2: Patch's London Adventure,movie,G,2019-11-12,"Animation, Adventure, Comedy, Family, Musical","Jim Kammerud, Brian Smith","Barry Bostwick, Jason Alexander, Martin Short,...",USA
4,102 Dalmatians,movie,G,2019-11-12,"Adventure, Comedy, Family",Kevin Lima,"Glenn Close, Gérard Depardieu, Ioan Gruffudd, ...","USA, UK"


In [11]:
disney_df.isnull().sum()

title        84
type         84
rated       235
added_at      0
genre        94
director    286
actors      109
country     108
dtype: int64

In [12]:
disney_df.shape

(954, 8)

In [16]:
disney_df = disney_df.dropna(subset=['director', 'actors','country'], how='any')
disney_df.shape

(643, 8)

In [17]:
disney_df.isnull().sum()

title        0
type         0
rated       65
added_at     0
genre        2
director     0
actors       0
country      0
dtype: int64

In [18]:
disney_df.dtypes

title               object
type                object
rated               object
added_at    datetime64[ns]
genre               object
director            object
actors              object
country             object
dtype: object

In [20]:
disney_df = disney_df.rename(columns={'type':'show_type',
                                     'rated': 'film_rating',
                                     'actors':'cast'})

disney_df

Unnamed: 0,title,show_type,film_rating,added_at,genre,director,cast,country
0,10 Things I Hate About You,movie,PG-13,2019-11-12,"Comedy, Drama, Romance",Gil Junger,"Heath Ledger, Julia Stiles, Joseph Gordon-Levi...",USA
2,101 Dalmatians,movie,G,2019-11-12,"Adventure, Comedy, Crime, Family",Stephen Herek,"Glenn Close, Jeff Daniels, Joely Richardson, J...","USA, UK"
3,101 Dalmatians 2: Patch's London Adventure,movie,G,2019-11-12,"Animation, Adventure, Comedy, Family, Musical","Jim Kammerud, Brian Smith","Barry Bostwick, Jason Alexander, Martin Short,...",USA
4,102 Dalmatians,movie,G,2019-11-12,"Adventure, Comedy, Family",Kevin Lima,"Glenn Close, Gérard Depardieu, Ioan Gruffudd, ...","USA, UK"
5,12 Dates of Christmas,movie,PG,2019-11-12,"Comedy, Fantasy, Romance",James Hayman,"Laura Miyata, Vijay Mehta, Amy Smart, Audrey D...",USA
6,"20,000 Leagues Under the Sea",movie,G,2019-11-12,"Adventure, Drama, Family, Fantasy, Sci-Fi",Richard Fleischer,"Kirk Douglas, James Mason, Paul Lukas, Peter L...",USA
7,A Bug's Life,movie,G,2019-11-12,"Animation, Adventure, Comedy, Family","John Lasseter, Andrew Stanton(co-director)","Dave Foley, Kevin Spacey, Julia Louis-Dreyfus,...",USA
9,A Goofy Movie,movie,G,2019-11-12,"Animation, Adventure, Comedy, Family, Musical,...",Kevin Lima,"Bill Farmer, Jason Marsden, Jim Cummings, Kell...","USA, Australia, France, Canada"
10,A Kid in King Arthur's Court,movie,PG,2019-11-12,"Adventure, Comedy, Family, Fantasy, Romance",Michael Gottlieb,"Thomas Ian Nicholas, Joss Ackland, Art Malik, ...","USA, Hungary, UK"
11,A Knight for a Day,movie,APPROVED,2019-11-12,"Animation, Short, Comedy",Jack Hannah,Pinto Colvig,USA


In [21]:
disney_df['month_added'] = pd.DatetimeIndex(disney_df['added_at']).month
disney_df['day_added'] = pd.DatetimeIndex(disney_df['added_at']).day
disney_df['year_added'] = pd.DatetimeIndex(disney_df['added_at']).year

disney_df.head()

Unnamed: 0,title,show_type,film_rating,added_at,genre,director,cast,country,month_added,day_added,year_added
0,10 Things I Hate About You,movie,PG-13,2019-11-12,"Comedy, Drama, Romance",Gil Junger,"Heath Ledger, Julia Stiles, Joseph Gordon-Levi...",USA,11,12,2019
2,101 Dalmatians,movie,G,2019-11-12,"Adventure, Comedy, Crime, Family",Stephen Herek,"Glenn Close, Jeff Daniels, Joely Richardson, J...","USA, UK",11,12,2019
3,101 Dalmatians 2: Patch's London Adventure,movie,G,2019-11-12,"Animation, Adventure, Comedy, Family, Musical","Jim Kammerud, Brian Smith","Barry Bostwick, Jason Alexander, Martin Short,...",USA,11,12,2019
4,102 Dalmatians,movie,G,2019-11-12,"Adventure, Comedy, Family",Kevin Lima,"Glenn Close, Gérard Depardieu, Ioan Gruffudd, ...","USA, UK",11,12,2019
5,12 Dates of Christmas,movie,PG,2019-11-12,"Comedy, Fantasy, Romance",James Hayman,"Laura Miyata, Vijay Mehta, Amy Smart, Audrey D...",USA,11,12,2019


In [31]:
disney_df_copy = disney_df.copy()

disney_df_copy.dtypes

title                  object
show_type              object
film_rating            object
added_at       datetime64[ns]
genre                  object
director               object
cast                   object
country                object
month_added             int64
day_added               int64
year_added              int64
dtype: object

In [27]:
dy_show_type = disney_df_copy['show_type'].value_counts().reset_index()

dy_show_type = dy_show_type.rename(columns={'index':'show_type',
                                           'show_type': 'Count'})
dy_show_type

pie_chart = go.Pie(labels=dy_show_type['show_type'], values=dy_show_type['Count'],
                   pull=[0.05,0],
                   marker = dict(colors=["#6ad49b", "#1f77b4"]))

fig_layout = go.Layout(title=" Distribution of Show Types on Disney +", height = 400, legend=dict(x=0.1, y=1.1))
fig = go.Figure(data= pie_chart, layout=fig_layout)
iplot(fig)


In [32]:
#Created a dict to change the numerics months to strings so easier to read on graph 
months = {'1': 'January', '2':'February', '3':'March','4':'April','10':'October', '11':'November','12':'December'}

#Change the date time month_released_on_nf column to string 
disney_df_copy['month_added'] = disney_df_copy['month_added'].astype(str)
disney_df_copy = disney_df_copy.replace({'month_added': months})

disney_df_copy.head()

Unnamed: 0,title,show_type,film_rating,added_at,genre,director,cast,country,month_added,day_added,year_added
0,10 Things I Hate About You,movie,PG-13,2019-11-12,"Comedy, Drama, Romance",Gil Junger,"Heath Ledger, Julia Stiles, Joseph Gordon-Levi...",USA,November,12,2019
2,101 Dalmatians,movie,G,2019-11-12,"Adventure, Comedy, Crime, Family",Stephen Herek,"Glenn Close, Jeff Daniels, Joely Richardson, J...","USA, UK",November,12,2019
3,101 Dalmatians 2: Patch's London Adventure,movie,G,2019-11-12,"Animation, Adventure, Comedy, Family, Musical","Jim Kammerud, Brian Smith","Barry Bostwick, Jason Alexander, Martin Short,...",USA,November,12,2019
4,102 Dalmatians,movie,G,2019-11-12,"Adventure, Comedy, Family",Kevin Lima,"Glenn Close, Gérard Depardieu, Ioan Gruffudd, ...","USA, UK",November,12,2019
5,12 Dates of Christmas,movie,PG,2019-11-12,"Comedy, Fantasy, Romance",James Hayman,"Laura Miyata, Vijay Mehta, Amy Smart, Audrey D...",USA,November,12,2019


In [39]:
month_releases = disney_df_copy['month_added'].value_counts().reset_index()
month_releases = month_releases.rename(columns = {'index':'Month','month_added':'Count'})

# month_releases
bar_graph = go.Bar(x=month_releases['Month'],y=month_releases['Count'], name="Number of Content Added", marker=dict(color="#6ad49b"))
data = [bar_graph]
layout = go.Layout(title="Number of content released by month", legend =dict(x=0.1, y=1.1))
fig =go.Figure(data,layout=layout)
fig.show()

Disney + officially launched in the United States on November 12, 2019. This explains the intial surge in content added. 