In [16]:
#A partir del fichero netflix_titles.csv
#Calcula el número de filas en el fichero, el de series y el de películas.

import pandas as pd
import numpy as np


datos = pd.read_csv("./data/netflix_titles.csv", sep=",")

n_movies = (datos.type == "Movie").sum()
n_shows = (datos.type == "TV Show").sum()

print(f"Movies: {n_movies}, Shows: {n_shows}")


#Calcula el porcentaje de series y películas sobre el total de títulos.


n_titles = len(datos.title.unique())

porcentaje_movies = (n_movies / n_titles) * 100
porcentaje_shows = (n_shows / n_titles) * 100

print(f"Porcentaje movies: {porcentaje_movies}, Porcentaje shows: {porcentaje_shows}")


#Cuenta el número de directores diferentes que aparecen en el fichero.

n_directores = len(datos.director.unique())
print(f"Número de directores diferentes: {n_directores}")

#Añade una nueva columna, "peliLarga", con valor 1 para las películas de más de 120 minutos y 0 en otro caso.
peliLarga = [1 if x > 120 else 0 for x in datos[datos.type == "Movie"].duration.map(lambda d: float(str(d).split(" ")[0]))]

datos["peliLarga"] = pd.Series(peliLarga)

#Crea un nuevo fichero csv, solo con películas, ordenadas por año de aparición, la más reciente primero.(
#pandas.DataFrame.to_csv y https://pandas.pydata.org/pandas-docs/stable/reference/api/pandas.DataFrame.sort_values.html)

datos_order_by_relase = datos.sort_values(by=['release_year'])

datos_order_by_relase.head(100)

#Crea un nuevo dataframe solo con las películas listadas como documentales lanzadas ("release_year") en 2020.

datos_relase_2020 = datos[datos["release_year"] == 2020]

datos_relase_2020.head()


#Elimina de este dataframe la columna la columna "cast". https://pandas.pydata.org/pandas-docs/stable/reference/api/pandas.DataFrame.drop.html

datos_without_cast = datos.drop(columns=["cast"])

datos_without_cast.head()


#Cambia los nombres de todas las columnas a una versión en español. https://pandas.pydata.org/pandas-docs/stable/reference/api/pandas.DataFrame.rename.html


datos.rename(columns={"show_id":"Id_show","type":"tipo","title":"titulo","country":"pais","date_added":"fecha_añadida","release_year":"ano_lanzado"})




#datos.head()


Movies: 6131, Shows: 2676
Porcentaje movies: 69.61507891449983, Porcentaje shows: 30.38492108550017
Número de directores diferentes: 4529


Unnamed: 0,Id_show,tipo,titulo,director,cast,pais,fecha_añadida,ano_lanzado,rating,duration,listed_in,description,peliLarga
0,s1,Movie,Dick Johnson Is Dead,Kirsten Johnson,,United States,"September 25, 2021",2020,PG-13,90 min,Documentaries,"As her father nears the end of his life, filmm...",0.0
1,s2,TV Show,Blood & Water,,"Ama Qamata, Khosi Ngema, Gail Mabalane, Thaban...",South Africa,"September 24, 2021",2021,TV-MA,2 Seasons,"International TV Shows, TV Dramas, TV Mysteries","After crossing paths at a party, a Cape Town t...",0.0
2,s3,TV Show,Ganglands,Julien Leclercq,"Sami Bouajila, Tracy Gotoas, Samuel Jouy, Nabi...",,"September 24, 2021",2021,TV-MA,1 Season,"Crime TV Shows, International TV Shows, TV Act...",To protect his family from a powerful drug lor...,1.0
3,s4,TV Show,Jailbirds New Orleans,,,,"September 24, 2021",2021,TV-MA,1 Season,"Docuseries, Reality TV","Feuds, flirtations and toilet talk go down amo...",0.0
4,s5,TV Show,Kota Factory,,"Mayur More, Jitendra Kumar, Ranjan Raj, Alam K...",India,"September 24, 2021",2021,TV-MA,2 Seasons,"International TV Shows, Romantic TV Shows, TV ...",In a city of coaching centers known to train I...,1.0
...,...,...,...,...,...,...,...,...,...,...,...,...,...
8802,s8803,Movie,Zodiac,David Fincher,"Mark Ruffalo, Jake Gyllenhaal, Robert Downey J...",United States,"November 20, 2019",2007,R,158 min,"Cult Movies, Dramas, Thrillers","A political cartoonist, a crime reporter and a...",
8803,s8804,TV Show,Zombie Dumb,,,,"July 1, 2019",2018,TV-Y7,2 Seasons,"Kids' TV, Korean TV Shows, TV Comedies","While living alone in a spooky town, a young g...",
8804,s8805,Movie,Zombieland,Ruben Fleischer,"Jesse Eisenberg, Woody Harrelson, Emma Stone, ...",United States,"November 1, 2019",2009,R,88 min,"Comedies, Horror Movies",Looking to survive in a world taken over by zo...,
8805,s8806,Movie,Zoom,Peter Hewitt,"Tim Allen, Courteney Cox, Chevy Chase, Kate Ma...",United States,"January 11, 2020",2006,PG,88 min,"Children & Family Movies, Comedies","Dragged from civilian life, a former superhero...",
