In [1]:
import pandas as pd 
import numpy as np 
import matplotlib.pyplot as plt 
%matplotlib inline 
import seaborn as sns 
# Raise pandas' display limits to 500 rows / 500 columns so frames are not truncated.
pd.options.display.max_rows = 500
pd.options.display.max_columns = 500

In [2]:
# Load the titles CSV; the path is relative to the notebook's working directory.
movies = pd.read_csv(filepath_or_buffer='netflix_titles-2.csv')
# Preview the first five rows.
movies.head(n=5)

Unnamed: 0,show_id,type,title,director,cast,country,date_added,release_year,rating,duration,listed_in,description
0,s1,TV Show,3%,,"João Miguel, Bianca Comparato, Michel Gomes, R...",Brazil,"August 14, 2020",2020,TV-MA,4 Seasons,"International TV Shows, TV Dramas, TV Sci-Fi &...",In a future where the elite inhabit an island ...
1,s2,Movie,7:19,Jorge Michel Grau,"Demián Bichir, Héctor Bonilla, Oscar Serrano, ...",Mexico,"December 23, 2016",2016,TV-MA,93 min,"Dramas, International Movies",After a devastating earthquake hits Mexico Cit...
2,s3,Movie,23:59,Gilbert Chan,"Tedd Chan, Stella Chung, Henley Hii, Lawrence ...",Singapore,"December 20, 2018",2011,R,78 min,"Horror Movies, International Movies","When an army recruit is found dead, his fellow..."
3,s4,Movie,9,Shane Acker,"Elijah Wood, John C. Reilly, Jennifer Connelly...",United States,"November 16, 2017",2009,PG-13,80 min,"Action & Adventure, Independent Movies, Sci-Fi...","In a postapocalyptic world, rag-doll robots hi..."
4,s5,Movie,21,Robert Luketic,"Jim Sturgess, Kevin Spacey, Kate Bosworth, Aar...",United States,"January 1, 2020",2008,PG-13,123 min,Dramas,A brilliant group of students become card-coun...


In [3]:
# Number of rows in the loaded frame.
movies.shape[0]

7787

In [4]:
# Drop fully duplicated rows; rebinding (instead of inplace=True) keeps the cell re-runnable.
movies = movies.drop_duplicates()

In [5]:
# Same row count as before de-duplication means there are no duplicate rows. Great!
movies.shape[0]

7787

### Total missing values from every column

In [6]:
# Per-column count of missing values.
movies.isna().sum()

show_id            0
type               0
title              0
director        2389
cast             718
country          507
date_added        10
release_year       0
rating             7
duration           0
listed_in          0
description        0
dtype: int64

#### What kind of data is really missing?

- US & UK titles have the most rows with a missing director.
- Missing director data appears in both TV shows and movies, but more TV shows than movies lack a listed director.
        - However, the dataset could simply contain more TV shows than movies, so the raw counts should be compared as a percentage of each type's total.
        - After looking at all the data, TV shows really do have more missing director data than movies: 2,226 of 2,410 TV shows (about 92%) versus 163 of 5,377 movies (about 3%).

In [7]:
# Count titles with no director listed, grouped by the raw `country` string.
df = pd.pivot_table(
    data=movies[movies['director'].isna()],
    index='country',
    values='show_id',
    aggfunc='count',
)

In [8]:
# Largest counts first.
df.sort_values("show_id", ascending=False)

Unnamed: 0_level_0,show_id
country,Unnamed: 1_level_1
United States,717
United Kingdom,196
Japan,148
South Korea,139
India,75
Taiwan,63
Canada,62
Australia,45
France,42
Spain,37


In [9]:
# Same count of director-less titles, now split into one column per `type`.
df = pd.pivot_table(
    data=movies[movies['director'].isna()],
    index='country',
    columns='type',
    values='show_id',
    aggfunc='count',
)

In [10]:
# Display the country x type pivot; NaN marks combinations with no matching rows.
df

type,Movie,TV Show
country,Unnamed: 1_level_1,Unnamed: 2_level_1
Argentina,,14.0
"Argentina, Spain",1.0,1.0
"Argentina, United States, Mexico",,1.0
Australia,,45.0
"Australia, Canada",,1.0
"Australia, New Zealand",,1.0
"Australia, New Zealand, United States",,1.0
"Australia, United States",,3.0
"Austria, Germany",,1.0
Belarus,,1.0


In [11]:
# Countries with the most director-less TV shows first.
df.sort_values("TV Show", ascending=False)

type,Movie,TV Show
country,Unnamed: 1_level_1,Unnamed: 2_level_1
United States,54.0,663.0
United Kingdom,13.0,183.0
Japan,1.0,147.0
South Korea,2.0,137.0
India,12.0,63.0
Taiwan,1.0,62.0
Canada,6.0,56.0
Australia,,45.0
France,,42.0
Spain,2.0,35.0


In [12]:
# Reflects only rows whose director is missing: title count per type.
pd.pivot_table(
    data=movies[movies['director'].isna()],
    columns='type',
    values='show_id',
    aggfunc='count',
)

type,Movie,TV Show
show_id,163,2226


In [13]:
# Reflects only rows that DO have a director: title count per type.
pd.pivot_table(
    data=movies[movies['director'].notna()],
    columns='type',
    values='show_id',
    aggfunc='count',
)

type,Movie,TV Show
show_id,5214,184


In [14]:
# Count titles with no cast listed, grouped by the raw `country` string.
df = pd.pivot_table(
    data=movies[movies['cast'].isna()],
    index='country',
    values='show_id',
    aggfunc='count',
)

In [15]:
# Largest counts first.
df.sort_values("show_id", ascending=False)

Unnamed: 0_level_0,show_id
country,Unnamed: 1_level_1
United States,304
United Kingdom,65
India,29
Canada,18
Spain,17
France,16
Australia,9
Brazil,9
Mexico,8
Germany,6


In [16]:
# Release years from oldest to newest (ascending is the default sort order).
movies['release_year'].sort_values()

4867    1925
6117    1942
4960    1942
7679    1943
7342    1943
7616    1943
7268    1944
6699    1944
6657    1944
5371    1945
3425    1945
4436    1945
3608    1946
4866    1946
7072    1947
7595    1954
6141    1954
6868    1955
5425    1955
5122    1955
1620    1956
2233    1956
1241    1958
2410    1958
1169    1958
7302    1959
3187    1960
4563    1960
5624    1960
1152    1960
4300    1962
3707    1962
4981    1962
5351    1963
6953    1963
5376    1964
6221    1965
1793    1965
480     1966
7538    1967
6082    1967
1041    1967
1497    1967
7609    1967
1344    1968
5285    1968
6793    1968
4635    1968
5785    1968
4970    1969
7242    1969
6255    1970
6544    1970
1970    1971
7628    1971
165     1971
3525    1971
2152    1971
770     1972
5907    1972
4216    1972
3442    1972
4008    1973
7737    1973
6850    1973
1283    1973
1414    1973
1016    1973
3176    1973
3131    1973
2013    1973
3358    1973
6613    1974
4217    1974
392     1974
2953    1974
3915    1974

### What does release year look like?

- Release years in the data range from 1925 to 2021.

In [17]:
# Earliest release year in the data.
movies.loc[:, 'release_year'].min()

1925

In [18]:
# Latest release year in the data.
movies.loc[:, 'release_year'].max()

2021

In [19]:
# Print column names, non-null counts and dtypes for the frame.
movies.info()

<class 'pandas.core.frame.DataFrame'>
Int64Index: 7787 entries, 0 to 7786
Data columns (total 12 columns):
show_id         7787 non-null object
type            7787 non-null object
title           7787 non-null object
director        5398 non-null object
cast            7069 non-null object
country         7280 non-null object
date_added      7777 non-null object
release_year    7787 non-null int64
rating          7780 non-null object
duration        7787 non-null object
listed_in       7787 non-null object
description     7787 non-null object
dtypes: int64(1), object(11)
memory usage: 790.9+ KB


### What numerical data do we have in this dataset?

In [20]:
# Summary statistics for the numeric columns -- just release year.
movies.describe(include=[np.number])

Unnamed: 0,release_year
count,7787.0
mean,2013.93258
std,8.757395
min,1925.0
25%,2013.0
50%,2017.0
75%,2018.0
max,2021.0


In [21]:
# First three rows.
movies.iloc[:3]

Unnamed: 0,show_id,type,title,director,cast,country,date_added,release_year,rating,duration,listed_in,description
0,s1,TV Show,3%,,"João Miguel, Bianca Comparato, Michel Gomes, R...",Brazil,"August 14, 2020",2020,TV-MA,4 Seasons,"International TV Shows, TV Dramas, TV Sci-Fi &...",In a future where the elite inhabit an island ...
1,s2,Movie,7:19,Jorge Michel Grau,"Demián Bichir, Héctor Bonilla, Oscar Serrano, ...",Mexico,"December 23, 2016",2016,TV-MA,93 min,"Dramas, International Movies",After a devastating earthquake hits Mexico Cit...
2,s3,Movie,23:59,Gilbert Chan,"Tedd Chan, Stella Chung, Henley Hii, Lawrence ...",Singapore,"December 20, 2018",2011,R,78 min,"Horror Movies, International Movies","When an army recruit is found dead, his fellow..."


### It looks like some movies are more popular than others, so let's break down the "listed_in" category

In [30]:
# Inspect every field of the row at position 7784.
movies.iloc[7784, :]

show_id                                                     s7785
type                                                        Movie
title                                           Zulu Man in Japan
director                                                      NaN
cast                                                      Nasty C
country                                                       NaN
date_added                                     September 25, 2020
release_year                                                 2019
rating                                                      TV-MA
duration                                                   44 min
listed_in       Documentaries, International Movies, Music & M...
description     In this documentary, South African rapper Nast...
Name: 7784, dtype: object

In [33]:
# Allow up to 500 characters per cell so the `listed_in` text is not cut off.
pd.options.display.max_colwidth = 500
movies.loc[:, ["show_id", "release_year", "listed_in"]]

Unnamed: 0,show_id,release_year,listed_in
0,s1,2020,"International TV Shows, TV Dramas, TV Sci-Fi & Fantasy"
1,s2,2016,"Dramas, International Movies"
2,s3,2011,"Horror Movies, International Movies"
3,s4,2009,"Action & Adventure, Independent Movies, Sci-Fi & Fantasy"
4,s5,2008,Dramas
5,s6,2016,"International TV Shows, TV Dramas, TV Mysteries"
6,s7,2019,"Horror Movies, International Movies"
7,s8,1997,Dramas
8,s9,2019,"Horror Movies, International Movies"
9,s10,2008,"Horror Movies, International Movies, Thrillers"


In [34]:
# Split the comma-separated `listed_in` text into up to three genre columns.
# Splitting on "," alone leaves a leading space on every genre after the first
# (" TV Dramas" vs "TV Dramas"), so each piece is stripped to keep the same
# genre spelled identically in Cat1, Cat2 and Cat3.
# The vectorized .str accessor also avoids building one pd.Series per row.
# Titles with fewer than three genres get missing values in the remaining columns.
movies[["Cat1", "Cat2", "Cat3"]] = (
    movies["listed_in"]
    .str.split(",", expand=True)
    .apply(lambda genre_col: genre_col.str.strip())
)

In [62]:
# Non-null entries per genre column (column-wise counting is the default axis).
movies[["Cat1", "Cat2", "Cat3"]].count()

Cat1    7787
Cat2    5986
Cat3    3298
dtype: int64

In [38]:
# Last ten rows, including the new Cat1-Cat3 columns.
movies.iloc[-10:]

Unnamed: 0,show_id,type,title,director,cast,country,date_added,release_year,rating,duration,listed_in,description,Cat1,Cat2,Cat3
7777,s7778,TV Show,Zombie Dumb,,,,"July 1, 2019",2018,TV-Y7,2 Seasons,"Kids' TV, Korean TV Shows, TV Comedies","While living alone in a spooky town, a young girl befriends a motley crew of zombie children with diverse personalities.",Kids' TV,Korean TV Shows,TV Comedies
7778,s7779,Movie,Zombieland,Ruben Fleischer,"Jesse Eisenberg, Woody Harrelson, Emma Stone, Abigail Breslin, Amber Heard, Bill Murray, Derek Graf",United States,"November 1, 2019",2009,R,88 min,"Comedies, Horror Movies","Looking to survive in a world taken over by zombies, a dorky college student teams with an urban roughneck and a pair of grifter sisters.",Comedies,Horror Movies,
7779,s7780,TV Show,Zona Rosa,,"Manu NNa, Ana Julia Yeyé, Ray Contreras, Pablo Morán",Mexico,"November 26, 2019",2019,TV-MA,1 Season,"International TV Shows, Spanish-Language TV Shows, Stand-Up Comedy & Talk Shows",An assortment of talent takes the stage for a night of honest stand-up featuring four of Mexico's funniest LGBTQ comedians.,International TV Shows,Spanish-Language TV Shows,Stand-Up Comedy & Talk Shows
7780,s7781,Movie,Zoo,Shlok Sharma,"Shashank Arora, Shweta Tripathi, Rahul Kumar, Gopal K. Singh, Yogesh Kurme, Prince Daniel",India,"July 1, 2018",2018,TV-MA,94 min,"Dramas, Independent Movies, International Movies","A drug dealer starts having doubts about his trade as his brother, his client, and two rappers from the slums each battle their own secret addictions.",Dramas,Independent Movies,International Movies
7781,s7782,Movie,Zoom,Peter Hewitt,"Tim Allen, Courteney Cox, Chevy Chase, Kate Mara, Ryan Newman, Michael Cassidy, Spencer Breslin, Rip Torn, Kevin Zegers",United States,"January 11, 2020",2006,PG,88 min,"Children & Family Movies, Comedies","Dragged from civilian life, a former superhero must train a new crop of youthful saviors when the military preps for an attack by a familiar villain.",Children & Family Movies,Comedies,
7782,s7783,Movie,Zozo,Josef Fares,"Imad Creidi, Antoinette Turk, Elias Gergi, Carmen Lebbos, Viktor Axelsson, Charbel Iskandar, Yasmine Awad","Sweden, Czech Republic, United Kingdom, Denmark, Netherlands","October 19, 2020",2005,TV-MA,99 min,"Dramas, International Movies","When Lebanon's Civil War deprives Zozo of his family, he's left with grief and little means as he escapes to Sweden in search of his grandparents.",Dramas,International Movies,
7783,s7784,Movie,Zubaan,Mozez Singh,"Vicky Kaushal, Sarah-Jane Dias, Raaghav Chanana, Manish Chaudhary, Meghna Malik, Malkeet Rauni, Anita Shabdish, Chittaranjan Tripathy",India,"March 2, 2019",2015,TV-14,111 min,"Dramas, International Movies, Music & Musicals","A scrappy but poor boy worms his way into a tycoon's dysfunctional family, while facing his fear of music and the truth about his past.",Dramas,International Movies,Music & Musicals
7784,s7785,Movie,Zulu Man in Japan,,Nasty C,,"September 25, 2020",2019,TV-MA,44 min,"Documentaries, International Movies, Music & Musicals","In this documentary, South African rapper Nasty C hits the stage and streets of Tokyo, introducing himself to the city's sights, sounds and culture.",Documentaries,International Movies,Music & Musicals
7785,s7786,TV Show,Zumbo's Just Desserts,,"Adriano Zumbo, Rachel Khoo",Australia,"October 31, 2020",2019,TV-PG,1 Season,"International TV Shows, Reality TV","Dessert wizard Adriano Zumbo looks for the next “Willy Wonka” in this tense competition that finds skilled amateurs competing for a $100,000 prize.",International TV Shows,Reality TV,
7786,s7787,Movie,ZZ TOP: THAT LITTLE OL' BAND FROM TEXAS,Sam Dunn,,"United Kingdom, Canada, United States","March 1, 2020",2019,TV-MA,90 min,"Documentaries, Music & Musicals",This documentary delves into the mystique behind the blues-rock trio and explores how the enigmatic band created their iconic look and sound.,Documentaries,Music & Musicals,


In [37]:
# Distinct titles, in order of first appearance.
pd.unique(movies["title"])

array(['3%', '7:19', '23:59', ..., 'Zulu Man in Japan',
       "Zumbo's Just Desserts", "ZZ TOP: THAT LITTLE OL' BAND FROM TEXAS"], dtype=object)

In [39]:
# Distinct rating labels (NaN included), in order of first appearance.
pd.unique(movies["rating"])

array(['TV-MA', 'R', 'PG-13', 'TV-14', 'TV-PG', 'NR', 'TV-G', 'TV-Y', nan,
       'TV-Y7', 'PG', 'G', 'NC-17', 'TV-Y7-FV', 'UR'], dtype=object)

### Do all TV shows have seasons?

- Separating out TV show seasons from Movie length

In [40]:
# Distinct duration strings: a mix of "<n> min" and "<n> Season(s)".
pd.unique(movies["duration"])

array(['4 Seasons', '93 min', '78 min', '80 min', '123 min', '1 Season',
       '95 min', '119 min', '118 min', '143 min', '103 min', '89 min',
       '91 min', '149 min', '144 min', '124 min', '87 min', '110 min',
       '128 min', '117 min', '100 min', '2 Seasons', '84 min', '99 min',
       '90 min', '102 min', '104 min', '105 min', '56 min', '125 min',
       '81 min', '97 min', '106 min', '107 min', '109 min', '44 min',
       '75 min', '101 min', '3 Seasons', '37 min', '113 min', '114 min',
       '130 min', '94 min', '140 min', '135 min', '82 min', '70 min',
       '121 min', '92 min', '164 min', '53 min', '83 min', '116 min',
       '86 min', '120 min', '96 min', '126 min', '129 min', '77 min',
       '137 min', '148 min', '28 min', '122 min', '176 min', '85 min',
       '22 min', '68 min', '111 min', '29 min', '142 min', '168 min',
       '21 min', '59 min', '20 min', '98 min', '108 min', '76 min',
       '26 min', '156 min', '30 min', '57 min', '150 min', '133 min',
       '1

In [44]:
# Duration values for TV shows only (single .loc lookup instead of chained indexing).
movies.loc[movies["type"] == "TV Show", "duration"]

0        4 Seasons
5         1 Season
11        1 Season
12        1 Season
16        1 Season
24       2 Seasons
26        1 Season
29        1 Season
38        1 Season
45        1 Season
51        1 Season
53        1 Season
58        1 Season
61        1 Season
63       4 Seasons
64       3 Seasons
80        1 Season
85        1 Season
86        1 Season
87        1 Season
95        1 Season
108      2 Seasons
111      2 Seasons
112       1 Season
130       1 Season
132       1 Season
134       1 Season
137       1 Season
138       1 Season
139       1 Season
140       1 Season
141      2 Seasons
142       1 Season
152       1 Season
180       1 Season
188       1 Season
191       1 Season
195       1 Season
197       1 Season
198       1 Season
199       1 Season
202       1 Season
213       1 Season
218       1 Season
225      3 Seasons
235       1 Season
239       1 Season
241       1 Season
248      2 Seasons
256       1 Season
258      2 Seasons
259       1 Season
260       1 

In [53]:
# All columns for the TV-show rows.
movies.loc[movies["type"] == "TV Show"]

Unnamed: 0,show_id,type,title,director,cast,country,date_added,release_year,rating,duration,listed_in,description,Cat1,Cat2,Cat3,Seasons,Movie length
0,s1,TV Show,3%,,"João Miguel, Bianca Comparato, Michel Gomes, Rodolfo Valente, Vaneza Oliveira, Rafael Lozano, Viviane Porto, Mel Fronckowiak, Sergio Mamberti, Zezé Motta, Celso Frateschi",Brazil,"August 14, 2020",2020,TV-MA,4 Seasons,"International TV Shows, TV Dramas, TV Sci-Fi & Fantasy","In a future where the elite inhabit an island paradise far from the crowded slums, you get one chance to join the 3% saved from squalor.",International TV Shows,TV Dramas,TV Sci-Fi & Fantasy,4,
5,s6,TV Show,46,Serdar Akar,"Erdal Beşikçioğlu, Yasemin Allen, Melis Birkan, Saygın Soysal, Berkan Şal, Metin Belgin, Ayça Eren, Selin Uludoğan, Özay Fecht, Suna Yıldızoğlu",Turkey,"July 1, 2017",2016,TV-MA,1 Season,"International TV Shows, TV Dramas, TV Mysteries","A genetics professor experiments with a treatment for his comatose sister that blends medical and shamanic cures, but unlocks a shocking side effect.",International TV Shows,TV Dramas,TV Mysteries,1,
11,s12,TV Show,1983,,"Robert Więckiewicz, Maciej Musiał, Michalina Olszańska, Andrzej Chyra, Clive Russell, Zofia Wichłacz, Edyta Olszówka, Mateusz Kościukiewicz, Ewa Błaszczyk, Vu Le Hong, Tomasz Włosok, Krzysztof Wach","Poland, United States","November 30, 2018",2018,TV-MA,1 Season,"Crime TV Shows, International TV Shows, TV Dramas","In this dark alt-history thriller, a naïve law student and a world-weary detective uncover a conspiracy that has tyrannized Poland for decades.",Crime TV Shows,International TV Shows,TV Dramas,1,
12,s13,TV Show,1994,Diego Enrique Osorno,,Mexico,"May 17, 2019",2019,TV-MA,1 Season,"Crime TV Shows, Docuseries, International TV Shows","Archival video and new interviews examine Mexican politics in 1994, a year marked by the rise of the EZLN and the assassination of Luis Donaldo Colosio.",Crime TV Shows,Docuseries,International TV Shows,1,
16,s17,TV Show,Feb-09,,"Shahd El Yaseen, Shaila Sabt, Hala, Hanadi Al-Kandari, Salma Salem, Ibrahim Al-Harbi, Mahmoud Boushahri, Yousef Al Balushi, Ghorour, Abdullah Al-bloshi",,"March 20, 2019",2018,TV-14,1 Season,"International TV Shows, TV Dramas","As a psychology professor faces Alzheimer's, his daughter and her three close female friends experience romance, marriage, heartbreak and tragedy.",International TV Shows,TV Dramas,,1,
24,s25,TV Show,​SAINT SEIYA: Knights of the Zodiac,,"Bryson Baugus, Emily Neves, Blake Shepard, Patrick Poole, Luci Christian, Adam Gibbs, Masakazu Morita, Fumiko Orikasa, Takahiro Sakurai, Hiroaki Miura, Satomi Sato, Katsuyuki Konishi",Japan,"January 23, 2020",2020,TV-14,2 Seasons,"Anime Series, International TV Shows","Seiya and the Knights of the Zodiac rise again to protect the reincarnation of the goddess Athena, but a dark prophecy hangs over them all.",Anime Series,International TV Shows,,2,
26,s27,TV Show,(Un)Well,,,United States,"August 12, 2020",2020,TV-MA,1 Season,Reality TV,"This docuseries takes a deep dive into the lucrative wellness industry, which touts health and healing. But do the products live up to the promises?",Reality TV,,,1,
29,s30,TV Show,#blackAF,,"Kenya Barris, Rashida Jones, Iman Benson, Genneya Walton, Scarlet Spencer, Justin Claiborne, Ravi Cabot-Conyers",United States,"April 17, 2020",2020,TV-MA,1 Season,TV Comedies,"Kenya Barris and his family navigate relationships, race and culture while grappling with their newfound success in this comedy series.",TV Comedies,,,1,
38,s39,TV Show,แผนร้ายนายเจ้าเล่ห์,,"Chutavuth Pattarakampol, Sheranut Yusananda, Nichaphat Chatchaipholrat, Thassapak Hsu",,"March 30, 2019",2016,TV-14,1 Season,"International TV Shows, Romantic TV Shows, TV Comedies","When two brothers fall for two sisters, they quickly realize the age differences between them are too big to ignore.",International TV Shows,Romantic TV Shows,TV Comedies,1,
45,s46,TV Show,Şubat,,"Alican Yücesoy, Melisa Sözen, Musa Uzunlar, Serkan Ercan, Özkan Uğur, Ülkü Duru, Tansu Biçer, Nadir Sarıbacak, Sermet Yeşil, Ayhan Kavas",Turkey,"January 17, 2017",2013,TV-MA,1 Season,"Crime TV Shows, International TV Shows, TV Dramas","An orphan subjected to tests that gave him superpowers is rescued and raised on Istanbul's streets, where he falls for a reporter linked to his past.",Crime TV Shows,International TV Shows,TV Dramas,1,


In [58]:
# Remove any previously derived "Seasons" column before it is rebuilt.
# errors="ignore" makes this a no-op when the column does not exist yet
# (e.g. on a fresh kernel run top to bottom) instead of raising KeyError,
# so the cell can be re-run any number of times.
movies = movies.drop(columns=["Seasons"], errors="ignore")

In [60]:
# Splitting just the number from the seasons.
# Keep the leading token of `duration` ("4 Seasons" -> "4") for TV-show rows only;
# index alignment on assignment leaves NaN in "Seasons" for every other row.
# The vectorized .str accessor replaces building one pd.Series per row in apply().
# Values remain strings; use pd.to_numeric(...) where a numeric column is needed.
movies["Seasons"] = (
    movies.loc[movies["type"] == "TV Show", "duration"]
    .str.split(" ")
    .str[0]
)

In [50]:
# Keep the leading token of `duration` ("93 min" -> "93") for movie rows only;
# index alignment on assignment leaves NaN in "Movie length" for every other row.
# The vectorized .str accessor replaces building one pd.Series per row in apply().
# Values remain strings; use pd.to_numeric(...) where a numeric column is needed.
movies["Movie length"] = (
    movies.loc[movies["type"] == "Movie", "duration"]
    .str.split(" ")
    .str[0]
)

In [61]:
# Preview the first five rows with the derived columns.
movies.head(n=5)

Unnamed: 0,show_id,type,title,director,cast,country,date_added,release_year,rating,duration,listed_in,description,Cat1,Cat2,Cat3,Movie length,Seasons
0,s1,TV Show,3%,,"João Miguel, Bianca Comparato, Michel Gomes, Rodolfo Valente, Vaneza Oliveira, Rafael Lozano, Viviane Porto, Mel Fronckowiak, Sergio Mamberti, Zezé Motta, Celso Frateschi",Brazil,"August 14, 2020",2020,TV-MA,4 Seasons,"International TV Shows, TV Dramas, TV Sci-Fi & Fantasy","In a future where the elite inhabit an island paradise far from the crowded slums, you get one chance to join the 3% saved from squalor.",International TV Shows,TV Dramas,TV Sci-Fi & Fantasy,,4.0
1,s2,Movie,7:19,Jorge Michel Grau,"Demián Bichir, Héctor Bonilla, Oscar Serrano, Azalia Ortiz, Octavio Michel, Carmen Beato",Mexico,"December 23, 2016",2016,TV-MA,93 min,"Dramas, International Movies","After a devastating earthquake hits Mexico City, trapped survivors from all walks of life wait to be rescued while trying desperately to stay alive.",Dramas,International Movies,,93.0,
2,s3,Movie,23:59,Gilbert Chan,"Tedd Chan, Stella Chung, Henley Hii, Lawrence Koh, Tommy Kuan, Josh Lai, Mark Lee, Susan Leong, Benjamin Lim",Singapore,"December 20, 2018",2011,R,78 min,"Horror Movies, International Movies","When an army recruit is found dead, his fellow soldiers are forced to confront a terrifying secret that's haunting their jungle island training camp.",Horror Movies,International Movies,,78.0,
3,s4,Movie,9,Shane Acker,"Elijah Wood, John C. Reilly, Jennifer Connelly, Christopher Plummer, Crispin Glover, Martin Landau, Fred Tatasciore, Alan Oppenheimer, Tom Kane",United States,"November 16, 2017",2009,PG-13,80 min,"Action & Adventure, Independent Movies, Sci-Fi & Fantasy","In a postapocalyptic world, rag-doll robots hide in fear from dangerous machines out to exterminate them, until a brave newcomer joins the group.",Action & Adventure,Independent Movies,Sci-Fi & Fantasy,80.0,
4,s5,Movie,21,Robert Luketic,"Jim Sturgess, Kevin Spacey, Kate Bosworth, Aaron Yoo, Liza Lapira, Jacob Pitts, Laurence Fishburne, Jack McGee, Josh Gad, Sam Golzari, Helen Carey, Jack Gilpin",United States,"January 1, 2020",2008,PG-13,123 min,Dramas,A brilliant group of students become card-counting experts with the intent of swindling millions out of Las Vegas casinos by playing blackjack.,Dramas,,,123.0,


In [23]:
# Distinct description texts, in order of first appearance.
pd.unique(movies['description'])

array([ 'In a future where the elite inhabit an island paradise far from the crowded slums, you get one chance to join the 3% saved from squalor.',
       'After a devastating earthquake hits Mexico City, trapped survivors from all walks of life wait to be rescued while trying desperately to stay alive.',
       "When an army recruit is found dead, his fellow soldiers are forced to confront a terrifying secret that's haunting their jungle island training camp.",
       ...,
       "In this documentary, South African rapper Nasty C hits the stage and streets of Tokyo, introducing himself to the city's sights, sounds and culture.",
       'Dessert wizard Adriano Zumbo looks for the next “Willy Wonka” in this tense competition that finds skilled amateurs competing for a $100,000 prize.',
       'This documentary delves into the mystique behind the blues-rock trio and explores how the enigmatic band created their iconic look and sound.'], dtype=object)

In [24]:
# Distinct duration strings: a mix of "<n> min" and "<n> Season(s)".
pd.unique(movies['duration'])

array(['4 Seasons', '93 min', '78 min', '80 min', '123 min', '1 Season',
       '95 min', '119 min', '118 min', '143 min', '103 min', '89 min',
       '91 min', '149 min', '144 min', '124 min', '87 min', '110 min',
       '128 min', '117 min', '100 min', '2 Seasons', '84 min', '99 min',
       '90 min', '102 min', '104 min', '105 min', '56 min', '125 min',
       '81 min', '97 min', '106 min', '107 min', '109 min', '44 min',
       '75 min', '101 min', '3 Seasons', '37 min', '113 min', '114 min',
       '130 min', '94 min', '140 min', '135 min', '82 min', '70 min',
       '121 min', '92 min', '164 min', '53 min', '83 min', '116 min',
       '86 min', '120 min', '96 min', '126 min', '129 min', '77 min',
       '137 min', '148 min', '28 min', '122 min', '176 min', '85 min',
       '22 min', '68 min', '111 min', '29 min', '142 min', '168 min',
       '21 min', '59 min', '20 min', '98 min', '108 min', '76 min',
       '26 min', '156 min', '30 min', '57 min', '150 min', '133 min',
       '1