# Import pandas and extract data from CSV file

In [1]:
import pandas as pd
import numpy as np
from sqlalchemy import create_engine

In [2]:
#import Disney+ CSV file and create dataframe
csv_file = "Resources/disney_plus_titles.csv"
disney_df = pd.read_csv(csv_file)
disney_df.head()

Unnamed: 0,show_id,type,title,director,cast,country,date_added,release_year,rating,duration,listed_in,description
0,s1,Movie,A Spark Story,"Jason Sterman, Leanne Dare","Apthon Corbin, Louis Gonzales",,"September 24, 2021",2021,TV-PG,88 min,Documentary,Two Pixar filmmakers strive to bring their uni...
1,s2,Movie,Spooky Buddies,Robert Vince,"Tucker Albrizzi, Diedrich Bader, Ameko Eks Mas...","United States, Canada","September 24, 2021",2011,G,93 min,"Comedy, Fantasy, Kids",The puppies go on a spooky adventure through a...
2,s3,Movie,The Fault in Our Stars,Josh Boone,"Shailene Woodley, Ansel Elgort, Laura Dern, Sa...",United States,"September 24, 2021",2014,PG-13,127 min,"Coming of Age, Drama, Romance",Hazel and Gus share a love that sweeps them on...
3,s4,TV Show,Dog: Impossible,,Matt Beisner,United States,"September 22, 2021",2019,TV-PG,2 Seasons,"Animals & Nature, Docuseries, Family",Matt Beisner uses unique approaches to modifyi...
4,s5,TV Show,Spidey And His Amazing Friends,,"Benjamin Valic, Lily Sanfelippo, Jakari Fraser...",United States,"September 22, 2021",2021,TV-Y,1 Season,"Action-Adventure, Animation, Kids",Spidey teams up with pals to become The Spidey...


In [3]:
#import Netflix CSV file and create dataframe
csv_file = "Resources/netflix_titles.csv"
netflix_df = pd.read_csv(csv_file)
netflix_df.head()

Unnamed: 0,show_id,type,title,director,cast,country,date_added,release_year,rating,duration,listed_in,description
0,s1,Movie,Dick Johnson Is Dead,Kirsten Johnson,,United States,"September 25, 2021",2020,PG-13,90 min,Documentaries,"As her father nears the end of his life, filmm..."
1,s2,TV Show,Blood & Water,,"Ama Qamata, Khosi Ngema, Gail Mabalane, Thaban...",South Africa,"September 24, 2021",2021,TV-MA,2 Seasons,"International TV Shows, TV Dramas, TV Mysteries","After crossing paths at a party, a Cape Town t..."
2,s3,TV Show,Ganglands,Julien Leclercq,"Sami Bouajila, Tracy Gotoas, Samuel Jouy, Nabi...",,"September 24, 2021",2021,TV-MA,1 Season,"Crime TV Shows, International TV Shows, TV Act...",To protect his family from a powerful drug lor...
3,s4,TV Show,Jailbirds New Orleans,,,,"September 24, 2021",2021,TV-MA,1 Season,"Docuseries, Reality TV","Feuds, flirtations and toilet talk go down amo..."
4,s5,TV Show,Kota Factory,,"Mayur More, Jitendra Kumar, Ranjan Raj, Alam K...",India,"September 24, 2021",2021,TV-MA,2 Seasons,"International TV Shows, Romantic TV Shows, TV ...",In a city of coaching centers known to train I...


# Filter out anything that is not a movie

In [4]:
#Remove TV show type leaving Disney+ movies, create new dataframe
disney_movies_df = disney_df.loc[disney_df['type'] == 'Movie']
disney_movies_df.count()

show_id         991
type            991
title           991
director        928
cast            881
country         914
date_added      991
release_year    991
rating          990
duration        991
listed_in       991
description     991
dtype: int64

In [5]:
#Remove TV show type leaving Disney+ movies, create new dataframe
netflix_movies_df = netflix_df.loc[netflix_df['type'] == 'Movie']
netflix_movies_df.count()

show_id         6131
type            6131
title           6131
director        5943
cast            5656
country         5691
date_added      6131
release_year    6131
rating          6129
duration        6128
listed_in       6131
description     6131
dtype: int64

# Combining datatables and removing duplicates

In [6]:
# combined dataframe with all movies
movies_df = pd.concat([disney_movies_df, netflix_movies_df], axis=0)
movies_df.count()

show_id         7122
type            7122
title           7122
director        6871
cast            6537
country         6605
date_added      7122
release_year    7122
rating          7119
duration        7119
listed_in       7122
description     7122
dtype: int64

In [7]:
movies_list_df=movies_df.drop_duplicates(subset=['title'])
movies_list_df

Unnamed: 0,show_id,type,title,director,cast,country,date_added,release_year,rating,duration,listed_in,description
0,s1,Movie,A Spark Story,"Jason Sterman, Leanne Dare","Apthon Corbin, Louis Gonzales",,"September 24, 2021",2021,TV-PG,88 min,Documentary,Two Pixar filmmakers strive to bring their uni...
1,s2,Movie,Spooky Buddies,Robert Vince,"Tucker Albrizzi, Diedrich Bader, Ameko Eks Mas...","United States, Canada","September 24, 2021",2011,G,93 min,"Comedy, Fantasy, Kids",The puppies go on a spooky adventure through a...
2,s3,Movie,The Fault in Our Stars,Josh Boone,"Shailene Woodley, Ansel Elgort, Laura Dern, Sa...",United States,"September 24, 2021",2014,PG-13,127 min,"Coming of Age, Drama, Romance",Hazel and Gus share a love that sweeps them on...
6,s7,Movie,Confessions of a Shopaholic,P.J. Hogan,"Isla Fisher, Hugh Dancy, Joan Cusack, John Goo...",United States,"September 17, 2021",2009,PG,106 min,"Comedy, Romance, Romantic Comedy",Becky writes a personal finance column en rout...
7,s8,Movie,Descendants: Royal Wedding,Salvador Simó,"Dove Cameron, Sofia Carson, Booboo Stewart, Mi...",,"September 17, 2021",2021,TV-G,22 min,"Animation, Fantasy, Musical",Mal and Ben’s wedding is finally here!
...,...,...,...,...,...,...,...,...,...,...,...,...
8801,s8802,Movie,Zinzana,Majid Al Ansari,"Ali Suliman, Saleh Bakri, Yasa, Ali Al-Jabri, ...","United Arab Emirates, Jordan","March 9, 2016",2015,TV-MA,96 min,"Dramas, International Movies, Thrillers",Recovering alcoholic Talal wakes up inside a s...
8802,s8803,Movie,Zodiac,David Fincher,"Mark Ruffalo, Jake Gyllenhaal, Robert Downey J...",United States,"November 20, 2019",2007,R,158 min,"Cult Movies, Dramas, Thrillers","A political cartoonist, a crime reporter and a..."
8804,s8805,Movie,Zombieland,Ruben Fleischer,"Jesse Eisenberg, Woody Harrelson, Emma Stone, ...",United States,"November 1, 2019",2009,R,88 min,"Comedies, Horror Movies",Looking to survive in a world taken over by zo...
8805,s8806,Movie,Zoom,Peter Hewitt,"Tim Allen, Courteney Cox, Chevy Chase, Kate Ma...",United States,"January 11, 2020",2006,PG,88 min,"Children & Family Movies, Comedies","Dragged from civilian life, a former superhero..."


# Adding index and cleaning dataframe

In [8]:
movies_list_df = movies_list_df.assign(movie_id=movies_list_df.reset_index().index + 1)
movies_list_df

Unnamed: 0,show_id,type,title,director,cast,country,date_added,release_year,rating,duration,listed_in,description,movie_id
0,s1,Movie,A Spark Story,"Jason Sterman, Leanne Dare","Apthon Corbin, Louis Gonzales",,"September 24, 2021",2021,TV-PG,88 min,Documentary,Two Pixar filmmakers strive to bring their uni...,1
1,s2,Movie,Spooky Buddies,Robert Vince,"Tucker Albrizzi, Diedrich Bader, Ameko Eks Mas...","United States, Canada","September 24, 2021",2011,G,93 min,"Comedy, Fantasy, Kids",The puppies go on a spooky adventure through a...,2
2,s3,Movie,The Fault in Our Stars,Josh Boone,"Shailene Woodley, Ansel Elgort, Laura Dern, Sa...",United States,"September 24, 2021",2014,PG-13,127 min,"Coming of Age, Drama, Romance",Hazel and Gus share a love that sweeps them on...,3
6,s7,Movie,Confessions of a Shopaholic,P.J. Hogan,"Isla Fisher, Hugh Dancy, Joan Cusack, John Goo...",United States,"September 17, 2021",2009,PG,106 min,"Comedy, Romance, Romantic Comedy",Becky writes a personal finance column en rout...,4
7,s8,Movie,Descendants: Royal Wedding,Salvador Simó,"Dove Cameron, Sofia Carson, Booboo Stewart, Mi...",,"September 17, 2021",2021,TV-G,22 min,"Animation, Fantasy, Musical",Mal and Ben’s wedding is finally here!,5
...,...,...,...,...,...,...,...,...,...,...,...,...,...
8801,s8802,Movie,Zinzana,Majid Al Ansari,"Ali Suliman, Saleh Bakri, Yasa, Ali Al-Jabri, ...","United Arab Emirates, Jordan","March 9, 2016",2015,TV-MA,96 min,"Dramas, International Movies, Thrillers",Recovering alcoholic Talal wakes up inside a s...,7088
8802,s8803,Movie,Zodiac,David Fincher,"Mark Ruffalo, Jake Gyllenhaal, Robert Downey J...",United States,"November 20, 2019",2007,R,158 min,"Cult Movies, Dramas, Thrillers","A political cartoonist, a crime reporter and a...",7089
8804,s8805,Movie,Zombieland,Ruben Fleischer,"Jesse Eisenberg, Woody Harrelson, Emma Stone, ...",United States,"November 1, 2019",2009,R,88 min,"Comedies, Horror Movies",Looking to survive in a world taken over by zo...,7090
8805,s8806,Movie,Zoom,Peter Hewitt,"Tim Allen, Courteney Cox, Chevy Chase, Kate Ma...",United States,"January 11, 2020",2006,PG,88 min,"Children & Family Movies, Comedies","Dragged from civilian life, a former superhero...",7091


In [9]:
#dropped Show ID 
movies_list_df= movies_list_df.drop(['show_id', 'type'], axis = 1)
movies_list_df

Unnamed: 0,title,director,cast,country,date_added,release_year,rating,duration,listed_in,description,movie_id
0,A Spark Story,"Jason Sterman, Leanne Dare","Apthon Corbin, Louis Gonzales",,"September 24, 2021",2021,TV-PG,88 min,Documentary,Two Pixar filmmakers strive to bring their uni...,1
1,Spooky Buddies,Robert Vince,"Tucker Albrizzi, Diedrich Bader, Ameko Eks Mas...","United States, Canada","September 24, 2021",2011,G,93 min,"Comedy, Fantasy, Kids",The puppies go on a spooky adventure through a...,2
2,The Fault in Our Stars,Josh Boone,"Shailene Woodley, Ansel Elgort, Laura Dern, Sa...",United States,"September 24, 2021",2014,PG-13,127 min,"Coming of Age, Drama, Romance",Hazel and Gus share a love that sweeps them on...,3
6,Confessions of a Shopaholic,P.J. Hogan,"Isla Fisher, Hugh Dancy, Joan Cusack, John Goo...",United States,"September 17, 2021",2009,PG,106 min,"Comedy, Romance, Romantic Comedy",Becky writes a personal finance column en rout...,4
7,Descendants: Royal Wedding,Salvador Simó,"Dove Cameron, Sofia Carson, Booboo Stewart, Mi...",,"September 17, 2021",2021,TV-G,22 min,"Animation, Fantasy, Musical",Mal and Ben’s wedding is finally here!,5
...,...,...,...,...,...,...,...,...,...,...,...
8801,Zinzana,Majid Al Ansari,"Ali Suliman, Saleh Bakri, Yasa, Ali Al-Jabri, ...","United Arab Emirates, Jordan","March 9, 2016",2015,TV-MA,96 min,"Dramas, International Movies, Thrillers",Recovering alcoholic Talal wakes up inside a s...,7088
8802,Zodiac,David Fincher,"Mark Ruffalo, Jake Gyllenhaal, Robert Downey J...",United States,"November 20, 2019",2007,R,158 min,"Cult Movies, Dramas, Thrillers","A political cartoonist, a crime reporter and a...",7089
8804,Zombieland,Ruben Fleischer,"Jesse Eisenberg, Woody Harrelson, Emma Stone, ...",United States,"November 1, 2019",2009,R,88 min,"Comedies, Horror Movies",Looking to survive in a world taken over by zo...,7090
8805,Zoom,Peter Hewitt,"Tim Allen, Courteney Cox, Chevy Chase, Kate Ma...",United States,"January 11, 2020",2006,PG,88 min,"Children & Family Movies, Comedies","Dragged from civilian life, a former superhero...",7091


In [10]:
movies_list_df.rename(columns={"cast": "cast_name"}, inplace=True)
movies_list_df

Unnamed: 0,title,director,cast_name,country,date_added,release_year,rating,duration,listed_in,description,movie_id
0,A Spark Story,"Jason Sterman, Leanne Dare","Apthon Corbin, Louis Gonzales",,"September 24, 2021",2021,TV-PG,88 min,Documentary,Two Pixar filmmakers strive to bring their uni...,1
1,Spooky Buddies,Robert Vince,"Tucker Albrizzi, Diedrich Bader, Ameko Eks Mas...","United States, Canada","September 24, 2021",2011,G,93 min,"Comedy, Fantasy, Kids",The puppies go on a spooky adventure through a...,2
2,The Fault in Our Stars,Josh Boone,"Shailene Woodley, Ansel Elgort, Laura Dern, Sa...",United States,"September 24, 2021",2014,PG-13,127 min,"Coming of Age, Drama, Romance",Hazel and Gus share a love that sweeps them on...,3
6,Confessions of a Shopaholic,P.J. Hogan,"Isla Fisher, Hugh Dancy, Joan Cusack, John Goo...",United States,"September 17, 2021",2009,PG,106 min,"Comedy, Romance, Romantic Comedy",Becky writes a personal finance column en rout...,4
7,Descendants: Royal Wedding,Salvador Simó,"Dove Cameron, Sofia Carson, Booboo Stewart, Mi...",,"September 17, 2021",2021,TV-G,22 min,"Animation, Fantasy, Musical",Mal and Ben’s wedding is finally here!,5
...,...,...,...,...,...,...,...,...,...,...,...
8801,Zinzana,Majid Al Ansari,"Ali Suliman, Saleh Bakri, Yasa, Ali Al-Jabri, ...","United Arab Emirates, Jordan","March 9, 2016",2015,TV-MA,96 min,"Dramas, International Movies, Thrillers",Recovering alcoholic Talal wakes up inside a s...,7088
8802,Zodiac,David Fincher,"Mark Ruffalo, Jake Gyllenhaal, Robert Downey J...",United States,"November 20, 2019",2007,R,158 min,"Cult Movies, Dramas, Thrillers","A political cartoonist, a crime reporter and a...",7089
8804,Zombieland,Ruben Fleischer,"Jesse Eisenberg, Woody Harrelson, Emma Stone, ...",United States,"November 1, 2019",2009,R,88 min,"Comedies, Horror Movies",Looking to survive in a world taken over by zo...,7090
8805,Zoom,Peter Hewitt,"Tim Allen, Courteney Cox, Chevy Chase, Kate Ma...",United States,"January 11, 2020",2006,PG,88 min,"Children & Family Movies, Comedies","Dragged from civilian life, a former superhero...",7091


In [11]:
combined_movies_df = movies_list_df[["movie_id", 
                                     "title", 
                                     "director", 
                                     "cast_name", 
                                     "country", 
                                     "date_added", 
                                     "release_year", 
                                     "rating", 
                                     "duration", 
                                     "listed_in", 
                                     "description"]]
combined_movies_df

Unnamed: 0,movie_id,title,director,cast_name,country,date_added,release_year,rating,duration,listed_in,description
0,1,A Spark Story,"Jason Sterman, Leanne Dare","Apthon Corbin, Louis Gonzales",,"September 24, 2021",2021,TV-PG,88 min,Documentary,Two Pixar filmmakers strive to bring their uni...
1,2,Spooky Buddies,Robert Vince,"Tucker Albrizzi, Diedrich Bader, Ameko Eks Mas...","United States, Canada","September 24, 2021",2011,G,93 min,"Comedy, Fantasy, Kids",The puppies go on a spooky adventure through a...
2,3,The Fault in Our Stars,Josh Boone,"Shailene Woodley, Ansel Elgort, Laura Dern, Sa...",United States,"September 24, 2021",2014,PG-13,127 min,"Coming of Age, Drama, Romance",Hazel and Gus share a love that sweeps them on...
6,4,Confessions of a Shopaholic,P.J. Hogan,"Isla Fisher, Hugh Dancy, Joan Cusack, John Goo...",United States,"September 17, 2021",2009,PG,106 min,"Comedy, Romance, Romantic Comedy",Becky writes a personal finance column en rout...
7,5,Descendants: Royal Wedding,Salvador Simó,"Dove Cameron, Sofia Carson, Booboo Stewart, Mi...",,"September 17, 2021",2021,TV-G,22 min,"Animation, Fantasy, Musical",Mal and Ben’s wedding is finally here!
...,...,...,...,...,...,...,...,...,...,...,...
8801,7088,Zinzana,Majid Al Ansari,"Ali Suliman, Saleh Bakri, Yasa, Ali Al-Jabri, ...","United Arab Emirates, Jordan","March 9, 2016",2015,TV-MA,96 min,"Dramas, International Movies, Thrillers",Recovering alcoholic Talal wakes up inside a s...
8802,7089,Zodiac,David Fincher,"Mark Ruffalo, Jake Gyllenhaal, Robert Downey J...",United States,"November 20, 2019",2007,R,158 min,"Cult Movies, Dramas, Thrillers","A political cartoonist, a crime reporter and a..."
8804,7090,Zombieland,Ruben Fleischer,"Jesse Eisenberg, Woody Harrelson, Emma Stone, ...",United States,"November 1, 2019",2009,R,88 min,"Comedies, Horror Movies",Looking to survive in a world taken over by zo...
8805,7091,Zoom,Peter Hewitt,"Tim Allen, Courteney Cox, Chevy Chase, Kate Ma...",United States,"January 11, 2020",2006,PG,88 min,"Children & Family Movies, Comedies","Dragged from civilian life, a former superhero..."


# Creating streaming datatable and adding to streaming service dataframe

In [12]:
streaming_data = [[1, 'Netflix'], [2, 'Disney Plus']]
streaming_df = pd.DataFrame(streaming_data, columns = ['streaming_id', 'streaming_service_name'])
streaming_df

Unnamed: 0,streaming_id,streaming_service_name
0,1,Netflix
1,2,Disney Plus


In [None]:
#loop though the netflix df, compare the table with the title in the combined_movie_df

joined = []
for i, netflix_row in netflix_movies_df.interrows():
    title = disney_row['title']
    for j, movie_row in combined_movies_df.interrows():
        if title == movie_row['title']:
            id = movie_row['movie_id']
            join = [id,1]
            joined.append(join)
            break
            
print(joined)

In [None]:
joined
movie_streaming_df = pd.DataFrame(joined, columns = ['movie_id', 'streaming_id'])
movie_streaming_df

In [27]:
joined = []
for i, disney_row in disney_movies_df.interrows():
    title = disney_row['title']
    for j, movie_row in combined_movies_df.interrows():
        if title == movie_row['title']:
            id = movie_row['movie_id']
            join = [id,2]
            joined.append(join)
            break
            
print(joined)

AttributeError: 'DataFrame' object has no attribute 'interrows'