In [737]:
import pandas as pd
import numpy as np
import matplotlib.pyplot as plt

In [738]:
df = pd.read_csv("netflix.csv")

In [739]:
df.head()

Unnamed: 0,show_id,type,title,director,cast,country,date_added,release_year,rating,duration,listed_in,description
0,s1,Movie,Dick Johnson Is Dead,Kirsten Johnson,,United States,"September 25, 2021",2020,PG-13,90 min,Documentaries,"As her father nears the end of his life, filmm..."
1,s2,TV Show,Blood & Water,,"Ama Qamata, Khosi Ngema, Gail Mabalane, Thaban...",South Africa,"September 24, 2021",2021,TV-MA,2 Seasons,"International TV Shows, TV Dramas, TV Mysteries","After crossing paths at a party, a Cape Town t..."
2,s3,TV Show,Ganglands,Julien Leclercq,"Sami Bouajila, Tracy Gotoas, Samuel Jouy, Nabi...",,"September 24, 2021",2021,TV-MA,1 Season,"Crime TV Shows, International TV Shows, TV Act...",To protect his family from a powerful drug lor...
3,s4,TV Show,Jailbirds New Orleans,,,,"September 24, 2021",2021,TV-MA,1 Season,"Docuseries, Reality TV","Feuds, flirtations and toilet talk go down amo..."
4,s5,TV Show,Kota Factory,,"Mayur More, Jitendra Kumar, Ranjan Raj, Alam K...",India,"September 24, 2021",2021,TV-MA,2 Seasons,"International TV Shows, Romantic TV Shows, TV ...",In a city of coaching centers known to train I...


In [740]:
df.shape

(8807, 12)

In [741]:
# exploding comma seperated values into rows and filling up null values for director column
df_director = df.loc[:,("show_id","director")]
df_director.fillna("Not Avaliable", inplace = True)
df_director["director"] = df_director["director"].str.split(",")
df_director = df_director.explode("director")
df_director.head()

Unnamed: 0,show_id,director
0,s1,Kirsten Johnson
1,s2,Not Avaliable
2,s3,Julien Leclercq
3,s4,Not Avaliable
4,s5,Not Avaliable


In [742]:
# exploding comma seperated values into rows and filling up null values for cast column
df_cast = df.loc[:,("show_id","cast")]
df_cast.fillna("Not Avaliable", inplace = True)
df_cast["cast"] = df_cast["cast"].str.split(",")
df_cast = df_cast.explode("cast")
df_cast.head()

Unnamed: 0,show_id,cast
0,s1,Not Avaliable
1,s2,Ama Qamata
1,s2,Khosi Ngema
1,s2,Gail Mabalane
1,s2,Thabang Molaba


In [743]:
# exploding comma seperated values into rows and filling up null values for country column
df_country = df.loc[:,("show_id","country")]
df_country.fillna("Not Avaliable", inplace = True)
df_country["country"] = df_country["country"].str.split(",")
df_country = df_country.explode("country")
df_country.head()

Unnamed: 0,show_id,country
0,s1,United States
1,s2,South Africa
2,s3,Not Avaliable
3,s4,Not Avaliable
4,s5,India


In [744]:
# exploding comma seperated values into rows and filling up null values for listed_in column
df_listed_in = df.loc[:, ("show_id", "listed_in")]
df_listed_in["listed_in"] = df_listed_in["listed_in"].str.split(",")
df_listed_in = df_listed_in.explode("listed_in")
df_listed_in.head()

Unnamed: 0,show_id,listed_in
0,s1,Documentaries
1,s2,International TV Shows
1,s2,TV Dramas
1,s2,TV Mysteries
2,s3,Crime TV Shows


In [745]:
# merging 4 newly created dataframes in one using left join
df1 = pd.merge(df_director, df_cast, on = "show_id", how = "inner").merge(df_country, on = "show_id", how = "inner").merge(df_listed_in, on = "show_id", how = "inner")
df1.head()

Unnamed: 0,show_id,director,cast,country,listed_in
0,s1,Kirsten Johnson,Not Avaliable,United States,Documentaries
1,s2,Not Avaliable,Ama Qamata,South Africa,International TV Shows
2,s2,Not Avaliable,Ama Qamata,South Africa,TV Dramas
3,s2,Not Avaliable,Ama Qamata,South Africa,TV Mysteries
4,s2,Not Avaliable,Khosi Ngema,South Africa,International TV Shows


In [746]:
# removing columns from dataframes since they are explode[d]()
df2 = df.drop(columns = ["director", "cast", "country", "listed_in"])
df2.head()

Unnamed: 0,show_id,type,title,date_added,release_year,rating,duration,description
0,s1,Movie,Dick Johnson Is Dead,"September 25, 2021",2020,PG-13,90 min,"As her father nears the end of his life, filmm..."
1,s2,TV Show,Blood & Water,"September 24, 2021",2021,TV-MA,2 Seasons,"After crossing paths at a party, a Cape Town t..."
2,s3,TV Show,Ganglands,"September 24, 2021",2021,TV-MA,1 Season,To protect his family from a powerful drug lor...
3,s4,TV Show,Jailbirds New Orleans,"September 24, 2021",2021,TV-MA,1 Season,"Feuds, flirtations and toilet talk go down amo..."
4,s5,TV Show,Kota Factory,"September 24, 2021",2021,TV-MA,2 Seasons,In a city of coaching centers known to train I...


In [747]:
# merging all the columns
netflix = df2.merge(df1, on = "show_id", how = "inner")
netflix.head()

Unnamed: 0,show_id,type,title,date_added,release_year,rating,duration,description,director,cast,country,listed_in
0,s1,Movie,Dick Johnson Is Dead,"September 25, 2021",2020,PG-13,90 min,"As her father nears the end of his life, filmm...",Kirsten Johnson,Not Avaliable,United States,Documentaries
1,s2,TV Show,Blood & Water,"September 24, 2021",2021,TV-MA,2 Seasons,"After crossing paths at a party, a Cape Town t...",Not Avaliable,Ama Qamata,South Africa,International TV Shows
2,s2,TV Show,Blood & Water,"September 24, 2021",2021,TV-MA,2 Seasons,"After crossing paths at a party, a Cape Town t...",Not Avaliable,Ama Qamata,South Africa,TV Dramas
3,s2,TV Show,Blood & Water,"September 24, 2021",2021,TV-MA,2 Seasons,"After crossing paths at a party, a Cape Town t...",Not Avaliable,Ama Qamata,South Africa,TV Mysteries
4,s2,TV Show,Blood & Water,"September 24, 2021",2021,TV-MA,2 Seasons,"After crossing paths at a party, a Cape Town t...",Not Avaliable,Khosi Ngema,South Africa,International TV Shows


In [748]:
netflix.shape

(202065, 12)

In [749]:
netflix["date_added"] = pd.to_datetime(netflix["date_added"].str.strip(), format = "%B %d, %Y")
netflix.head()

Unnamed: 0,show_id,type,title,date_added,release_year,rating,duration,description,director,cast,country,listed_in
0,s1,Movie,Dick Johnson Is Dead,2021-09-25,2020,PG-13,90 min,"As her father nears the end of his life, filmm...",Kirsten Johnson,Not Avaliable,United States,Documentaries
1,s2,TV Show,Blood & Water,2021-09-24,2021,TV-MA,2 Seasons,"After crossing paths at a party, a Cape Town t...",Not Avaliable,Ama Qamata,South Africa,International TV Shows
2,s2,TV Show,Blood & Water,2021-09-24,2021,TV-MA,2 Seasons,"After crossing paths at a party, a Cape Town t...",Not Avaliable,Ama Qamata,South Africa,TV Dramas
3,s2,TV Show,Blood & Water,2021-09-24,2021,TV-MA,2 Seasons,"After crossing paths at a party, a Cape Town t...",Not Avaliable,Ama Qamata,South Africa,TV Mysteries
4,s2,TV Show,Blood & Water,2021-09-24,2021,TV-MA,2 Seasons,"After crossing paths at a party, a Cape Town t...",Not Avaliable,Khosi Ngema,South Africa,International TV Shows


In [750]:
netflix["date_added"] = pd.to_datetime(netflix["release_year"], format = "%Y")
netflix.head()

Unnamed: 0,show_id,type,title,date_added,release_year,rating,duration,description,director,cast,country,listed_in
0,s1,Movie,Dick Johnson Is Dead,2020-01-01,2020,PG-13,90 min,"As her father nears the end of his life, filmm...",Kirsten Johnson,Not Avaliable,United States,Documentaries
1,s2,TV Show,Blood & Water,2021-01-01,2021,TV-MA,2 Seasons,"After crossing paths at a party, a Cape Town t...",Not Avaliable,Ama Qamata,South Africa,International TV Shows
2,s2,TV Show,Blood & Water,2021-01-01,2021,TV-MA,2 Seasons,"After crossing paths at a party, a Cape Town t...",Not Avaliable,Ama Qamata,South Africa,TV Dramas
3,s2,TV Show,Blood & Water,2021-01-01,2021,TV-MA,2 Seasons,"After crossing paths at a party, a Cape Town t...",Not Avaliable,Ama Qamata,South Africa,TV Mysteries
4,s2,TV Show,Blood & Water,2021-01-01,2021,TV-MA,2 Seasons,"After crossing paths at a party, a Cape Town t...",Not Avaliable,Khosi Ngema,South Africa,International TV Shows


In [751]:
netflix.isna().sum()

show_id          0
type             0
title            0
date_added       0
release_year     0
rating          67
duration         3
description      0
director         0
cast             0
country          0
listed_in        0
dtype: int64

In [752]:
# there are some null values in rating we can fill these values by mode of ratings of movies produced by certain director or cast
netflix[netflix["rating"].isna()]

Unnamed: 0,show_id,type,title,date_added,release_year,rating,duration,description,director,cast,country,listed_in
135172,s5990,Movie,13TH: A Conversation with Oprah Winfrey & Ava ...,2017-01-01,2017,,37 min,Oprah Winfrey sits down with director Ava DuVe...,Not Avaliable,Oprah Winfrey,Not Avaliable,Movies
135173,s5990,Movie,13TH: A Conversation with Oprah Winfrey & Ava ...,2017-01-01,2017,,37 min,Oprah Winfrey sits down with director Ava DuVe...,Not Avaliable,Ava DuVernay,Not Avaliable,Movies
154424,s6828,TV Show,Gargantia on the Verdurous Planet,2013-01-01,2013,,1 Season,"After falling through a wormhole, a space-dwel...",Not Avaliable,Kaito Ishikawa,Japan,Anime Series
154425,s6828,TV Show,Gargantia on the Verdurous Planet,2013-01-01,2013,,1 Season,"After falling through a wormhole, a space-dwel...",Not Avaliable,Kaito Ishikawa,Japan,International TV Shows
154426,s6828,TV Show,Gargantia on the Verdurous Planet,2013-01-01,2013,,1 Season,"After falling through a wormhole, a space-dwel...",Not Avaliable,Hisako Kanemoto,Japan,Anime Series
...,...,...,...,...,...,...,...,...,...,...,...,...
172016,s7538,Movie,My Honor Was Loyalty,2015-01-01,2015,,115 min,"Amid the chaos and horror of World War II, a c...",Alessandro Pepe,Francesco Migliore,Italy,Dramas
172017,s7538,Movie,My Honor Was Loyalty,2015-01-01,2015,,115 min,"Amid the chaos and horror of World War II, a c...",Alessandro Pepe,Albrecht Weimer,Italy,Dramas
172018,s7538,Movie,My Honor Was Loyalty,2015-01-01,2015,,115 min,"Amid the chaos and horror of World War II, a c...",Alessandro Pepe,Giulia Dichiaro,Italy,Dramas
172019,s7538,Movie,My Honor Was Loyalty,2015-01-01,2015,,115 min,"Amid the chaos and horror of World War II, a c...",Alessandro Pepe,Alessandra Oriti Niosi,Italy,Dramas


In [753]:
# replacing null values of rating of movies directed by Alessandro Pepe
netflix["director"][netflix["rating"].isna()].value_counts()

director
Not Avaliable      60
Alessandro Pepe     7
Name: count, dtype: int64

In [754]:
netflix[netflix["director"] == "Alessandro Pepe"]

Unnamed: 0,show_id,type,title,date_added,release_year,rating,duration,description,director,cast,country,listed_in
172014,s7538,Movie,My Honor Was Loyalty,2015-01-01,2015,,115 min,"Amid the chaos and horror of World War II, a c...",Alessandro Pepe,Leone Frisa,Italy,Dramas
172015,s7538,Movie,My Honor Was Loyalty,2015-01-01,2015,,115 min,"Amid the chaos and horror of World War II, a c...",Alessandro Pepe,Paolo Vaccarino,Italy,Dramas
172016,s7538,Movie,My Honor Was Loyalty,2015-01-01,2015,,115 min,"Amid the chaos and horror of World War II, a c...",Alessandro Pepe,Francesco Migliore,Italy,Dramas
172017,s7538,Movie,My Honor Was Loyalty,2015-01-01,2015,,115 min,"Amid the chaos and horror of World War II, a c...",Alessandro Pepe,Albrecht Weimer,Italy,Dramas
172018,s7538,Movie,My Honor Was Loyalty,2015-01-01,2015,,115 min,"Amid the chaos and horror of World War II, a c...",Alessandro Pepe,Giulia Dichiaro,Italy,Dramas
172019,s7538,Movie,My Honor Was Loyalty,2015-01-01,2015,,115 min,"Amid the chaos and horror of World War II, a c...",Alessandro Pepe,Alessandra Oriti Niosi,Italy,Dramas
172020,s7538,Movie,My Honor Was Loyalty,2015-01-01,2015,,115 min,"Amid the chaos and horror of World War II, a c...",Alessandro Pepe,Andreas Segeritz,Italy,Dramas


Since movie produced by Alessandro Pepe is listed_in Dramas catergory find out the mode of ratings for this "Drama" category


In [755]:
netflix["rating"][netflix["listed_in"] == "Dramas"].value_counts()

rating
TV-MA    7465
TV-14    4208
R        3988
PG-13    2097
TV-PG    1048
PG        410
NR        265
TV-G       98
NC-17      39
UR         22
TV-Y7      10
Name: count, dtype: int64

Mode of Drama Category is TV-MA or TV - 14. Reading at at the movie description TV - MA is more suitable rating.

In [756]:
netflix.loc[netflix['director'] == 'Alessandro Pepe'] = netflix.loc[netflix['director'] == 'Alessandro Pepe'] .fillna("TV-MA")

In [757]:
netflix.loc[netflix['director'] == 'Alessandro Pepe']

Unnamed: 0,show_id,type,title,date_added,release_year,rating,duration,description,director,cast,country,listed_in
172014,s7538,Movie,My Honor Was Loyalty,2015-01-01,2015,TV-MA,115 min,"Amid the chaos and horror of World War II, a c...",Alessandro Pepe,Leone Frisa,Italy,Dramas
172015,s7538,Movie,My Honor Was Loyalty,2015-01-01,2015,TV-MA,115 min,"Amid the chaos and horror of World War II, a c...",Alessandro Pepe,Paolo Vaccarino,Italy,Dramas
172016,s7538,Movie,My Honor Was Loyalty,2015-01-01,2015,TV-MA,115 min,"Amid the chaos and horror of World War II, a c...",Alessandro Pepe,Francesco Migliore,Italy,Dramas
172017,s7538,Movie,My Honor Was Loyalty,2015-01-01,2015,TV-MA,115 min,"Amid the chaos and horror of World War II, a c...",Alessandro Pepe,Albrecht Weimer,Italy,Dramas
172018,s7538,Movie,My Honor Was Loyalty,2015-01-01,2015,TV-MA,115 min,"Amid the chaos and horror of World War II, a c...",Alessandro Pepe,Giulia Dichiaro,Italy,Dramas
172019,s7538,Movie,My Honor Was Loyalty,2015-01-01,2015,TV-MA,115 min,"Amid the chaos and horror of World War II, a c...",Alessandro Pepe,Alessandra Oriti Niosi,Italy,Dramas
172020,s7538,Movie,My Honor Was Loyalty,2015-01-01,2015,TV-MA,115 min,"Amid the chaos and horror of World War II, a c...",Alessandro Pepe,Andreas Segeritz,Italy,Dramas


In [758]:
netflix["rating"][netflix["listed_in"] == "Anime Series"].value_counts()

rating
TV-MA    899
TV-14    871
TV-Y7    298
TV-PG    210
TV-Y      13
Name: count, dtype: int64

In [759]:
netflix[netflix["rating"].isna()]
netflix.loc[netflix['show_id'] == 's6828'] = netflix.loc[netflix['show_id'] == 's6828'].fillna("TV-MA")

In [760]:
netflix["rating"][netflix["listed_in"] == "Kids' TV"].value_counts()


rating
TV-Y7       2005
TV-Y        1081
TV-PG        378
TV-G         330
TV-Y7-FV       8
Name: count, dtype: int64

In [761]:
netflix.loc[netflix['show_id'] == 's7313'] = netflix.loc[netflix['show_id'] == 's7313'].fillna("TV-Y7")

In [762]:
netflix[netflix["cast"] == "Oprah Winfrey"]

Unnamed: 0,show_id,type,title,date_added,release_year,rating,duration,description,director,cast,country,listed_in
89508,s3757,Movie,Oprah Presents When They See Us Now,2019-01-01,2019,TV-PG,61 min,Oprah Winfrey talks with the exonerated men on...,Mark Ritchie,Oprah Winfrey,United States,Documentaries
135172,s5990,Movie,13TH: A Conversation with Oprah Winfrey & Ava ...,2017-01-01,2017,,37 min,Oprah Winfrey sits down with director Ava DuVe...,Not Avaliable,Oprah Winfrey,Not Avaliable,Movies


In [763]:
netflix.loc[netflix['show_id'] == 's5990'] = netflix.loc[netflix['show_id'] == 's5990'].fillna("TV-PG")

In [764]:
netflix.isna().sum()

show_id         0
type            0
title           0
date_added      0
release_year    0
rating          0
duration        3
description     0
director        0
cast            0
country         0
listed_in       0
dtype: int64

In [765]:
netflix[netflix["duration"].isna()]

Unnamed: 0,show_id,type,title,date_added,release_year,rating,duration,description,director,cast,country,listed_in
126582,s5542,Movie,Louis C.K. 2017,2017-01-01,2017,74 min,,"Louis C.K. muses on religion, eternal love, gi...",Louis C.K.,Louis C.K.,United States,Movies
131648,s5795,Movie,Louis C.K.: Hilarious,2010-01-01,2010,84 min,,Emmy-winning comedy writer Louis C.K. brings h...,Louis C.K.,Louis C.K.,United States,Movies
131782,s5814,Movie,Louis C.K.: Live at the Comedy Store,2015-01-01,2015,66 min,,The comic puts his trademark hilarious/thought...,Louis C.K.,Louis C.K.,United States,Movies


In [766]:
netflix.loc[netflix["director"] ==  "Louis C.K."]

Unnamed: 0,show_id,type,title,date_added,release_year,rating,duration,description,director,cast,country,listed_in
126582,s5542,Movie,Louis C.K. 2017,2017-01-01,2017,74 min,,"Louis C.K. muses on religion, eternal love, gi...",Louis C.K.,Louis C.K.,United States,Movies
131648,s5795,Movie,Louis C.K.: Hilarious,2010-01-01,2010,84 min,,Emmy-winning comedy writer Louis C.K. brings h...,Louis C.K.,Louis C.K.,United States,Movies
131782,s5814,Movie,Louis C.K.: Live at the Comedy Store,2015-01-01,2015,66 min,,The comic puts his trademark hilarious/thought...,Louis C.K.,Louis C.K.,United States,Movies


Rating column should be in duration and rating should be null or fillna("TV-MA") (since most of content is TV-MA)

In [767]:
netflix.loc[netflix["director"] ==  "Louis C.K.", "duration"] = netflix.loc[netflix["director"] ==  "Louis C.K.", "rating"]
netflix.loc[netflix["director"] ==  "Louis C.K.", "rating"] = "TV-MA"

In [768]:
netflix.loc[netflix["director"] ==  "Louis C.K."]

Unnamed: 0,show_id,type,title,date_added,release_year,rating,duration,description,director,cast,country,listed_in
126582,s5542,Movie,Louis C.K. 2017,2017-01-01,2017,TV-MA,74 min,"Louis C.K. muses on religion, eternal love, gi...",Louis C.K.,Louis C.K.,United States,Movies
131648,s5795,Movie,Louis C.K.: Hilarious,2010-01-01,2010,TV-MA,84 min,Emmy-winning comedy writer Louis C.K. brings h...,Louis C.K.,Louis C.K.,United States,Movies
131782,s5814,Movie,Louis C.K.: Live at the Comedy Store,2015-01-01,2015,TV-MA,66 min,The comic puts his trademark hilarious/thought...,Louis C.K.,Louis C.K.,United States,Movies


In [769]:
netflix.isna().sum()

show_id         0
type            0
title           0
date_added      0
release_year    0
rating          0
duration        0
description     0
director        0
cast            0
country         0
listed_in       0
dtype: int64

In [770]:
netflix.head()

Unnamed: 0,show_id,type,title,date_added,release_year,rating,duration,description,director,cast,country,listed_in
0,s1,Movie,Dick Johnson Is Dead,2020-01-01,2020,PG-13,90 min,"As her father nears the end of his life, filmm...",Kirsten Johnson,Not Avaliable,United States,Documentaries
1,s2,TV Show,Blood & Water,2021-01-01,2021,TV-MA,2 Seasons,"After crossing paths at a party, a Cape Town t...",Not Avaliable,Ama Qamata,South Africa,International TV Shows
2,s2,TV Show,Blood & Water,2021-01-01,2021,TV-MA,2 Seasons,"After crossing paths at a party, a Cape Town t...",Not Avaliable,Ama Qamata,South Africa,TV Dramas
3,s2,TV Show,Blood & Water,2021-01-01,2021,TV-MA,2 Seasons,"After crossing paths at a party, a Cape Town t...",Not Avaliable,Ama Qamata,South Africa,TV Mysteries
4,s2,TV Show,Blood & Water,2021-01-01,2021,TV-MA,2 Seasons,"After crossing paths at a party, a Cape Town t...",Not Avaliable,Khosi Ngema,South Africa,International TV Shows


In [771]:
# Stripping the Extra spaces in data
netflix.loc[:, "director"] = netflix.loc[:, "director"].str.strip()
netflix.loc[:, "cast"] = netflix.loc[:, "cast"].str.strip()
netflix.loc[:, "country"] = netflix.loc[:, "country"].str.strip()
netflix.loc[:, "listed_in"] = netflix.loc[:, "listed_in"].str.strip()
netflix.loc[:, "title"] = netflix.loc[:, "title"].str.strip()

In [772]:
netflix.head()

Unnamed: 0,show_id,type,title,date_added,release_year,rating,duration,description,director,cast,country,listed_in
0,s1,Movie,Dick Johnson Is Dead,2020-01-01,2020,PG-13,90 min,"As her father nears the end of his life, filmm...",Kirsten Johnson,Not Avaliable,United States,Documentaries
1,s2,TV Show,Blood & Water,2021-01-01,2021,TV-MA,2 Seasons,"After crossing paths at a party, a Cape Town t...",Not Avaliable,Ama Qamata,South Africa,International TV Shows
2,s2,TV Show,Blood & Water,2021-01-01,2021,TV-MA,2 Seasons,"After crossing paths at a party, a Cape Town t...",Not Avaliable,Ama Qamata,South Africa,TV Dramas
3,s2,TV Show,Blood & Water,2021-01-01,2021,TV-MA,2 Seasons,"After crossing paths at a party, a Cape Town t...",Not Avaliable,Ama Qamata,South Africa,TV Mysteries
4,s2,TV Show,Blood & Water,2021-01-01,2021,TV-MA,2 Seasons,"After crossing paths at a party, a Cape Town t...",Not Avaliable,Khosi Ngema,South Africa,International TV Shows


In [773]:
# Splitting the dataframe into 2 type 1st Movies, 2nd TV Show
df_movies = netflix.loc[netflix["type"] == "Movie"].reset_index()
df_shows = netflix.loc[netflix["type"] == "TV Show"].reset_index()
netflix = pd.concat([df_movies, df_shows], axis=0).reset_index()

In [774]:
# fixing duration column in df_movie
df_movies["duration"] = df_movies["duration"].str.split(" ")
df_movies["duration"] = int(df_movies["duration"][0][0])


In [775]:
df_movies.head()

Unnamed: 0,index,show_id,type,title,date_added,release_year,rating,duration,description,director,cast,country,listed_in
0,0,s1,Movie,Dick Johnson Is Dead,2020-01-01,2020,PG-13,90,"As her father nears the end of his life, filmm...",Kirsten Johnson,Not Avaliable,United States,Documentaries
1,159,s7,Movie,My Little Pony: A New Generation,2021-01-01,2021,PG,90,Equestria's divided. But a bright-eyed hero be...,Robert Cullen,Vanessa Hudgens,Not Avaliable,Children & Family Movies
2,160,s7,Movie,My Little Pony: A New Generation,2021-01-01,2021,PG,90,Equestria's divided. But a bright-eyed hero be...,Robert Cullen,Kimiko Glenn,Not Avaliable,Children & Family Movies
3,161,s7,Movie,My Little Pony: A New Generation,2021-01-01,2021,PG,90,Equestria's divided. But a bright-eyed hero be...,Robert Cullen,James Marsden,Not Avaliable,Children & Family Movies
4,162,s7,Movie,My Little Pony: A New Generation,2021-01-01,2021,PG,90,Equestria's divided. But a bright-eyed hero be...,Robert Cullen,Sofia Carson,Not Avaliable,Children & Family Movies


In [776]:
# fixing duration column in df_shows
df_shows["duration"] = df_shows["duration"].str.split(" ")
df_shows["duration"] = int(df_shows["duration"][0][0])

In [777]:
df_shows.head()

Unnamed: 0,index,show_id,type,title,date_added,release_year,rating,duration,description,director,cast,country,listed_in
0,1,s2,TV Show,Blood & Water,2021-01-01,2021,TV-MA,2,"After crossing paths at a party, a Cape Town t...",Not Avaliable,Ama Qamata,South Africa,International TV Shows
1,2,s2,TV Show,Blood & Water,2021-01-01,2021,TV-MA,2,"After crossing paths at a party, a Cape Town t...",Not Avaliable,Ama Qamata,South Africa,TV Dramas
2,3,s2,TV Show,Blood & Water,2021-01-01,2021,TV-MA,2,"After crossing paths at a party, a Cape Town t...",Not Avaliable,Ama Qamata,South Africa,TV Mysteries
3,4,s2,TV Show,Blood & Water,2021-01-01,2021,TV-MA,2,"After crossing paths at a party, a Cape Town t...",Not Avaliable,Khosi Ngema,South Africa,International TV Shows
4,5,s2,TV Show,Blood & Water,2021-01-01,2021,TV-MA,2,"After crossing paths at a party, a Cape Town t...",Not Avaliable,Khosi Ngema,South Africa,TV Dramas


Data Cleaning and Exploration:
How many missing values exist in each column and how will they be handled?
Are there any duplicate records in the dataset? If yes, how many?
What are the data types of each column? Are there any columns with incorrect data types that need to be converted for further analysis?

Top Shows/Movies Analysis:
Which are the top 10 rated shows/movies in the dataset?
What are the most common genres of shows/movies available on Netflix? How are they distributed?
How do ratings vary across different genres?

Time Analysis:
What is the trend in the number of shows/movies released over the years?
How has the frequency of shows/movies being added to Netflix changed over time?
Is there a particular time of the year when more shows/movies are added?

Recommendations and Insights:
Based on genres, which types of shows/movies should Netflix consider adding more of?
Are there seasonal trends in the popularity of certain genres of shows/movies?

Additional Analysis:
What is the typical duration of shows/movies on Netflix? How does this vary by genre?
Which countries produce the most content for Netflix? How does content popularity vary by country?
Presentation and Communication:
Which type of visualization would best represent each of the insights gathered from the data?
How can data storytelling be applied to present the case study effectively to a non-technical audience?

In [782]:
netflix.drop(columns = ["level_0", "index"], inplace = True)

In [783]:
netflix.head()

Unnamed: 0,show_id,type,title,date_added,release_year,rating,duration,description,director,cast,country,listed_in
0,s1,Movie,Dick Johnson Is Dead,2020-01-01,2020,PG-13,90 min,"As her father nears the end of his life, filmm...",Kirsten Johnson,Not Avaliable,United States,Documentaries
1,s7,Movie,My Little Pony: A New Generation,2021-01-01,2021,PG,91 min,Equestria's divided. But a bright-eyed hero be...,Robert Cullen,Vanessa Hudgens,Not Avaliable,Children & Family Movies
2,s7,Movie,My Little Pony: A New Generation,2021-01-01,2021,PG,91 min,Equestria's divided. But a bright-eyed hero be...,Robert Cullen,Kimiko Glenn,Not Avaliable,Children & Family Movies
3,s7,Movie,My Little Pony: A New Generation,2021-01-01,2021,PG,91 min,Equestria's divided. But a bright-eyed hero be...,Robert Cullen,James Marsden,Not Avaliable,Children & Family Movies
4,s7,Movie,My Little Pony: A New Generation,2021-01-01,2021,PG,91 min,Equestria's divided. But a bright-eyed hero be...,Robert Cullen,Sofia Carson,Not Avaliable,Children & Family Movies
