### Import Required Libraries and Set Up Environment Variables

In [44]:
# Dependencies
import requests
import time
from dotenv import load_dotenv
import os
import pandas as pd
import json

In [45]:
# Set environment variables from the .env in the local environment
load_dotenv()

nyt_api_key = os.getenv("NYT_API_KEYS")
tmdb_api_key = os.getenv("TMDB_API_KEYS")

Python-dotenv could not parse statement starting at line 9


### Access the New York Times API

In [46]:
# Set the base URL
url = "https://api.nytimes.com/svc/search/v2/articlesearch.json?"

# Filter for movie reviews with "love" in the headline
# section_name should be "Movies"
# type_of_material should be "Review"
filter_query = 'section_name:"Movies" AND type_of_material:"Review" AND headline:"love"'

# Use a sort filter, sort by newest
sort = "newest"

# Select the following fields to return:
# headline, web_url, snippet, source, keywords, pub_date, byline, word_count
field_list = "headline,web_url,snippet,source,keywords,pub_date,byline,word_count"

# Search for reviews published between a begin and end date
begin_date = "20130101"
end_date = "20230531"

# Build URL
movie_query = (f"{url}api-key={nyt_api_key}&begin_date={begin_date}&end_date={end_date}"
    + f'&fq={filter_query}&sort={sort}&fl={field_list}')
movie_query



'https://api.nytimes.com/svc/search/v2/articlesearch.json?api-key=cVZLtBsbtxvlgIjekA34XK0ukImrhDYI&begin_date=20130101&end_date=20230531&fq=section_name:"Movies" AND type_of_material:"Review" AND headline:"love"&sort=newest&fl=headline,web_url,snippet,source,keywords,pub_date,byline,word_count'

In [47]:
# Create an empty list to store the reviews
nyt_movie_list = []

# loop through pages 0-19

for page in range(20):

    # create query with a page number
    # API results show 10 articles at a time
    nyt_movie_page = movie_query + "&page=" + str(page)
    
    # Make a "GET" request and retrieve the JSON
    nyt_results = requests.get(nyt_movie_page).json()

    # Add a twelve second interval between queries to stay within API query limits
    time.sleep(12)

    # Try and save the reviews to the reviews_list
    try:
        nyt_reviews = requests.get(nyt_movie_page).json()

        # loop through the reviews["response"]["docs"] and append each review to the list
        for movie in nyt_reviews["response"]["docs"]:
            nyt_movie_list.append(movie)

        # Print the page that was just retrieved
        print("page " + str(page))

    except Exception as e:       

        # Print the page number that had no results then break from the loop
         print("page " + str(page) + " Not Found")
         break


page 0
page 1
page 2
page 3 Not Found


In [48]:
# Preview the first 5 results in JSON format
# Use json.dumps with argument indent=4 to format data

print(json.dumps(nyt_movie_list[:5], indent=4))

[
    {
        "web_url": "https://www.nytimes.com/2023/05/25/movies/the-attachment-diaries-review.html",
        "snippet": "A gynecologist and her patient form a horrifyingly twisted connection in this batty, bloody Argentine melodrama.",
        "source": "The New York Times",
        "headline": {
            "main": "\u2018The Attachment Diaries\u2019 Review: Love, Sick",
            "kicker": null,
            "content_kicker": null,
            "print_headline": "The Attachment Diaries",
            "name": null,
            "seo": null,
            "sub": null
        },
        "keywords": [
            {
                "name": "subject",
                "value": "Movies",
                "rank": 1,
                "major": "N"
            },
            {
                "name": "creative_works",
                "value": "The Attachment Diaries (Movie)",
                "rank": 2,
                "major": "N"
            },
            {
                "name": "persons",
 

In [49]:
# Convert reviews_list to a Pandas DataFrame using json_normalize()
nyt_movie_list_df = pd.json_normalize(nyt_movie_list)
nyt_movie_list_df

Unnamed: 0,web_url,snippet,source,keywords,pub_date,word_count,headline.main,headline.kicker,headline.content_kicker,headline.print_headline,headline.name,headline.seo,headline.sub,byline.original,byline.person,byline.organization
0,https://www.nytimes.com/2023/05/25/movies/the-...,A gynecologist and her patient form a horrifyi...,The New York Times,"[{'name': 'subject', 'value': 'Movies', 'rank'...",2023-05-25T11:00:03+0000,295,"‘The Attachment Diaries’ Review: Love, Sick",,,The Attachment Diaries,,,,By Jeannette Catsoulis,"[{'firstname': 'Jeannette', 'middlename': None...",
1,https://www.nytimes.com/2023/05/04/movies/what...,Two childhood friends navigate cultural differ...,The New York Times,"[{'name': 'subject', 'value': 'Movies', 'rank'...",2023-05-04T17:16:45+0000,287,Review: ‘What’s Love Got to Do With It?’ Proba...,,,What’s Love Got to Do With It?,,,,By Jeannette Catsoulis,"[{'firstname': 'Jeannette', 'middlename': None...",
2,https://www.nytimes.com/2023/05/04/movies/you-...,Religion comes between two girls falling in lo...,The New York Times,"[{'name': 'subject', 'value': 'Movies', 'rank'...",2023-05-04T11:00:08+0000,294,‘You Can Live Forever’ Review: Do You Love Me ...,,,You Can Live Forever,,,,By Elisabeth Vincentelli,"[{'firstname': 'Elisabeth', 'middlename': None...",
3,https://www.nytimes.com/2023/04/21/movies/a-to...,Rachael Leigh Cook stars in this bland rom-com...,The New York Times,"[{'name': 'subject', 'value': 'Movies', 'rank'...",2023-04-21T07:03:25+0000,276,‘A Tourist’s Guide to Love’ Review: A Wearying...,,,A Tourist’s Guide to Love,,,,By Elisabeth Vincentelli,"[{'firstname': 'Elisabeth', 'middlename': None...",
4,https://www.nytimes.com/2023/04/20/movies/othe...,A radiant Virginie Efira stars as a Parisian t...,The New York Times,"[{'name': 'subject', 'value': 'Movies', 'rank'...",2023-04-20T15:35:13+0000,801,‘Other People’s Children’ Review: True Romance,Critic’s pick,,Intoxicating Love With a Sobering Turn,,,,By Manohla Dargis,"[{'firstname': 'Manohla', 'middlename': None, ...",
5,https://www.nytimes.com/2023/04/13/movies/one-...,A film adaptation of Taylor Jenkins Reid’s nov...,The New York Times,"[{'name': 'subject', 'value': 'Movies', 'rank'...",2023-04-13T11:00:06+0000,320,‘One True Loves’ Review: A Romance Lost at Sea,,,One True Loves,,,,By Brandon Yu,"[{'firstname': 'Brandon', 'middlename': None, ...",
6,https://www.nytimes.com/2023/04/13/movies/the-...,There’s not much Lennon music heard in this do...,The New York Times,"[{'name': 'subject', 'value': 'Documentary Fil...",2023-04-13T11:00:03+0000,327,‘The Lost Weekend: A Love Story’ Review: When ...,,,The Lost Weekend: A Love Story,,,,By Glenn Kenny,"[{'firstname': 'Glenn', 'middlename': None, 'l...",
7,https://www.nytimes.com/2023/03/30/movies/a-th...,A mesmerizing Teyana Taylor stars in A.V. Rock...,The New York Times,"[{'name': 'subject', 'value': 'Movies', 'rank'...",2023-03-30T18:53:42+0000,971,‘A Thousand and One’ Review: A New York Love S...,Critic’s Pick,,An Unbending Will Meets a Shifting City,,,,By Manohla Dargis,"[{'firstname': 'Manohla', 'middlename': None, ...",
8,https://www.nytimes.com/2023/02/09/movies/your...,This humdrum Netflix romantic comedy features ...,The New York Times,"[{'name': 'subject', 'value': 'Movies', 'rank'...",2023-02-10T00:00:05+0000,569,‘Your Place or Mine’ Review: Try Neither,,,They Have a Humdrum Kind of Love,,,,By Amy Nicholson,"[{'firstname': 'Amy', 'middlename': None, 'las...",
9,https://www.nytimes.com/2023/02/02/movies/love...,"To combat the overdose crisis, a group that in...",The New York Times,"[{'name': 'subject', 'value': 'Documentary Fil...",2023-02-02T12:00:11+0000,306,‘Love in the Time of Fentanyl’ Review: Heartbr...,,,Love in the Time Of Fentanyl,,,,By Concepción de León,"[{'firstname': 'Concepción', 'middlename': Non...",


In [50]:
# Extract the title from the "headline.main" column and
# save it to a new column "title"
# Title is between unicode characters \u2018 and \u2019. 
# End string should include " Review" to avoid cutting title early

movie_title_df = nyt_movie_list_df.copy()

movie_title_df['title'] = movie_title_df['headline.main'].apply(lambda x: x[x.find('\u2018') + 1 : x.find('\u2019 Review')] if x.find('\u2018') != -1 and x.find('\u2019 Review') != -1 else None)

movie_title_df



Unnamed: 0,web_url,snippet,source,keywords,pub_date,word_count,headline.main,headline.kicker,headline.content_kicker,headline.print_headline,headline.name,headline.seo,headline.sub,byline.original,byline.person,byline.organization,title
0,https://www.nytimes.com/2023/05/25/movies/the-...,A gynecologist and her patient form a horrifyi...,The New York Times,"[{'name': 'subject', 'value': 'Movies', 'rank'...",2023-05-25T11:00:03+0000,295,"‘The Attachment Diaries’ Review: Love, Sick",,,The Attachment Diaries,,,,By Jeannette Catsoulis,"[{'firstname': 'Jeannette', 'middlename': None...",,The Attachment Diaries
1,https://www.nytimes.com/2023/05/04/movies/what...,Two childhood friends navigate cultural differ...,The New York Times,"[{'name': 'subject', 'value': 'Movies', 'rank'...",2023-05-04T17:16:45+0000,287,Review: ‘What’s Love Got to Do With It?’ Proba...,,,What’s Love Got to Do With It?,,,,By Jeannette Catsoulis,"[{'firstname': 'Jeannette', 'middlename': None...",,
2,https://www.nytimes.com/2023/05/04/movies/you-...,Religion comes between two girls falling in lo...,The New York Times,"[{'name': 'subject', 'value': 'Movies', 'rank'...",2023-05-04T11:00:08+0000,294,‘You Can Live Forever’ Review: Do You Love Me ...,,,You Can Live Forever,,,,By Elisabeth Vincentelli,"[{'firstname': 'Elisabeth', 'middlename': None...",,You Can Live Forever
3,https://www.nytimes.com/2023/04/21/movies/a-to...,Rachael Leigh Cook stars in this bland rom-com...,The New York Times,"[{'name': 'subject', 'value': 'Movies', 'rank'...",2023-04-21T07:03:25+0000,276,‘A Tourist’s Guide to Love’ Review: A Wearying...,,,A Tourist’s Guide to Love,,,,By Elisabeth Vincentelli,"[{'firstname': 'Elisabeth', 'middlename': None...",,A Tourist’s Guide to Love
4,https://www.nytimes.com/2023/04/20/movies/othe...,A radiant Virginie Efira stars as a Parisian t...,The New York Times,"[{'name': 'subject', 'value': 'Movies', 'rank'...",2023-04-20T15:35:13+0000,801,‘Other People’s Children’ Review: True Romance,Critic’s pick,,Intoxicating Love With a Sobering Turn,,,,By Manohla Dargis,"[{'firstname': 'Manohla', 'middlename': None, ...",,Other People’s Children
5,https://www.nytimes.com/2023/04/13/movies/one-...,A film adaptation of Taylor Jenkins Reid’s nov...,The New York Times,"[{'name': 'subject', 'value': 'Movies', 'rank'...",2023-04-13T11:00:06+0000,320,‘One True Loves’ Review: A Romance Lost at Sea,,,One True Loves,,,,By Brandon Yu,"[{'firstname': 'Brandon', 'middlename': None, ...",,One True Loves
6,https://www.nytimes.com/2023/04/13/movies/the-...,There’s not much Lennon music heard in this do...,The New York Times,"[{'name': 'subject', 'value': 'Documentary Fil...",2023-04-13T11:00:03+0000,327,‘The Lost Weekend: A Love Story’ Review: When ...,,,The Lost Weekend: A Love Story,,,,By Glenn Kenny,"[{'firstname': 'Glenn', 'middlename': None, 'l...",,The Lost Weekend: A Love Story
7,https://www.nytimes.com/2023/03/30/movies/a-th...,A mesmerizing Teyana Taylor stars in A.V. Rock...,The New York Times,"[{'name': 'subject', 'value': 'Movies', 'rank'...",2023-03-30T18:53:42+0000,971,‘A Thousand and One’ Review: A New York Love S...,Critic’s Pick,,An Unbending Will Meets a Shifting City,,,,By Manohla Dargis,"[{'firstname': 'Manohla', 'middlename': None, ...",,A Thousand and One
8,https://www.nytimes.com/2023/02/09/movies/your...,This humdrum Netflix romantic comedy features ...,The New York Times,"[{'name': 'subject', 'value': 'Movies', 'rank'...",2023-02-10T00:00:05+0000,569,‘Your Place or Mine’ Review: Try Neither,,,They Have a Humdrum Kind of Love,,,,By Amy Nicholson,"[{'firstname': 'Amy', 'middlename': None, 'las...",,Your Place or Mine
9,https://www.nytimes.com/2023/02/02/movies/love...,"To combat the overdose crisis, a group that in...",The New York Times,"[{'name': 'subject', 'value': 'Documentary Fil...",2023-02-02T12:00:11+0000,306,‘Love in the Time of Fentanyl’ Review: Heartbr...,,,Love in the Time Of Fentanyl,,,,By Concepción de León,"[{'firstname': 'Concepción', 'middlename': Non...",,Love in the Time of Fentanyl


In [51]:
# Extract 'name' and 'value' from items in "keywords" column
def extract_keywords(keyword_list):
    extracted_keywords = ""
    for item in keyword_list:
        # Extract 'name' and 'value'
        keyword = f"{item['name']}: {item['value']};" 
        # Append the keyword item to the extracted_keywords list
        extracted_keywords += keyword
    return extracted_keywords

# Fix the "keywords" column by converting cells from a list to a string
keyword_df = movie_title_df.copy()

keyword_df['keywords'] = keyword_df['keywords'].apply(lambda x: extract_keywords(x))

keyword_df


Unnamed: 0,web_url,snippet,source,keywords,pub_date,word_count,headline.main,headline.kicker,headline.content_kicker,headline.print_headline,headline.name,headline.seo,headline.sub,byline.original,byline.person,byline.organization,title
0,https://www.nytimes.com/2023/05/25/movies/the-...,A gynecologist and her patient form a horrifyi...,The New York Times,subject: Movies;creative_works: The Attachment...,2023-05-25T11:00:03+0000,295,"‘The Attachment Diaries’ Review: Love, Sick",,,The Attachment Diaries,,,,By Jeannette Catsoulis,"[{'firstname': 'Jeannette', 'middlename': None...",,The Attachment Diaries
1,https://www.nytimes.com/2023/05/04/movies/what...,Two childhood friends navigate cultural differ...,The New York Times,"subject: Movies;persons: Kapur, Shekhar;person...",2023-05-04T17:16:45+0000,287,Review: ‘What’s Love Got to Do With It?’ Proba...,,,What’s Love Got to Do With It?,,,,By Jeannette Catsoulis,"[{'firstname': 'Jeannette', 'middlename': None...",,
2,https://www.nytimes.com/2023/05/04/movies/you-...,Religion comes between two girls falling in lo...,The New York Times,subject: Movies;creative_works: You Can Live F...,2023-05-04T11:00:08+0000,294,‘You Can Live Forever’ Review: Do You Love Me ...,,,You Can Live Forever,,,,By Elisabeth Vincentelli,"[{'firstname': 'Elisabeth', 'middlename': None...",,You Can Live Forever
3,https://www.nytimes.com/2023/04/21/movies/a-to...,Rachael Leigh Cook stars in this bland rom-com...,The New York Times,subject: Movies;creative_works: A Tourist's Gu...,2023-04-21T07:03:25+0000,276,‘A Tourist’s Guide to Love’ Review: A Wearying...,,,A Tourist’s Guide to Love,,,,By Elisabeth Vincentelli,"[{'firstname': 'Elisabeth', 'middlename': None...",,A Tourist’s Guide to Love
4,https://www.nytimes.com/2023/04/20/movies/othe...,A radiant Virginie Efira stars as a Parisian t...,The New York Times,"subject: Movies;persons: Zlotowski, Rebecca;cr...",2023-04-20T15:35:13+0000,801,‘Other People’s Children’ Review: True Romance,Critic’s pick,,Intoxicating Love With a Sobering Turn,,,,By Manohla Dargis,"[{'firstname': 'Manohla', 'middlename': None, ...",,Other People’s Children
5,https://www.nytimes.com/2023/04/13/movies/one-...,A film adaptation of Taylor Jenkins Reid’s nov...,The New York Times,"subject: Movies;persons: Bracey, Luke (1989- )...",2023-04-13T11:00:06+0000,320,‘One True Loves’ Review: A Romance Lost at Sea,,,One True Loves,,,,By Brandon Yu,"[{'firstname': 'Brandon', 'middlename': None, ...",,One True Loves
6,https://www.nytimes.com/2023/04/13/movies/the-...,There’s not much Lennon music heard in this do...,The New York Times,subject: Documentary Films and Programs;creati...,2023-04-13T11:00:03+0000,327,‘The Lost Weekend: A Love Story’ Review: When ...,,,The Lost Weekend: A Love Story,,,,By Glenn Kenny,"[{'firstname': 'Glenn', 'middlename': None, 'l...",,The Lost Weekend: A Love Story
7,https://www.nytimes.com/2023/03/30/movies/a-th...,A mesmerizing Teyana Taylor stars in A.V. Rock...,The New York Times,subject: Movies;creative_works: A Thousand and...,2023-03-30T18:53:42+0000,971,‘A Thousand and One’ Review: A New York Love S...,Critic’s Pick,,An Unbending Will Meets a Shifting City,,,,By Manohla Dargis,"[{'firstname': 'Manohla', 'middlename': None, ...",,A Thousand and One
8,https://www.nytimes.com/2023/02/09/movies/your...,This humdrum Netflix romantic comedy features ...,The New York Times,subject: Movies;creative_works: Your Place or ...,2023-02-10T00:00:05+0000,569,‘Your Place or Mine’ Review: Try Neither,,,They Have a Humdrum Kind of Love,,,,By Amy Nicholson,"[{'firstname': 'Amy', 'middlename': None, 'las...",,Your Place or Mine
9,https://www.nytimes.com/2023/02/02/movies/love...,"To combat the overdose crisis, a group that in...",The New York Times,subject: Documentary Films and Programs;subjec...,2023-02-02T12:00:11+0000,306,‘Love in the Time of Fentanyl’ Review: Heartbr...,,,Love in the Time Of Fentanyl,,,,By Concepción de León,"[{'firstname': 'Concepción', 'middlename': Non...",,Love in the Time of Fentanyl


In [52]:
# Create a list from the "title" column using to_list()
# These titles will be used in the query for The Movie Database

title_list = keyword_df['title'].to_list()
title_list

['The Attachment Diaries',
 None,
 'You Can Live Forever',
 'A Tourist’s Guide to Love',
 'Other People’s Children',
 'One True Loves',
 'The Lost Weekend: A Love Story',
 'A Thousand and One',
 'Your Place or Mine',
 'Love in the Time of Fentanyl',
 'Pamela, a Love Story',
 'In From the Side',
 'After Love',
 'Alcarràs',
 'Nelly & Nadine',
 'Lady Chatterley’s Lover',
 'The Sound of Christmas',
 'The Inspection',
 'Bones and All',
 'My Policeman',
 'About Fate',
 'Waiting for Bojangles',
 'I Love My Dad',
 'A Love Song',
 'Alone Together',
 'Art of Love',
 'The Wheel',
 'Thor: Love and Thunder',
 'Both Sides of the Blade',
 'Fire of Love']

### Access The Movie Database API

In [53]:
# Prepare The Movie Database query
url = "https://api.themoviedb.org/3/search/movie?query="
tmdb_key_string = "&api_key=" + tmdb_api_key

In [54]:
# Create an empty list to store the results

tmdb_movie_list = []

# Create a request counter to sleep the requests after a multiple
# of 50 requests

movie_counter = 1

# Loop through the titles
for tmdb_title in title_list:

    # Check if we need to sleep before making a request
    if movie_counter/50 == int(movie_counter/50):
        time.sleep(12)

    # Add 1 to the request counter
    movie_counter += 1
    
    # Perform a "GET" request for The Movie Database
    
    # Include a try clause to search for the full movie details.
    # Use the except clause to print out a statement if a movie
    # is not found.

    try:

        tmdb_results = requests.get(url + str(tmdb_title) + tmdb_key_string).json()
        
        # Get movie id

        tmdb_movie_id = tmdb_results['results'][0]['id']

        # Make a request for a the full movie details

        movie_detail_url = 'https://api.themoviedb.org/3/movie/' + str(tmdb_movie_id) + '?api_key=' + tmdb_api_key
        # Execute "GET" request with url

        movie_detail_result = requests.get(movie_detail_url).json()
  
        # Extract the genre names into a list

        genre_list = [genre['name'] for genre in movie_detail_result['genres']]

        # Extract the spoken_languages' English name into a list

        spoken_languages_list = [spoken_languages['english_name'] for spoken_languages in movie_detail_result['spoken_languages']]

        # Extract the production_countries' name into a list

        production_countries_list = [production_countries['name'] for production_countries in movie_detail_result['production_countries']]

        # Add the relevant data to a dictionary and
        # append it to the tmdb_movies_list list

        tmdb_movie_data = {}

        tmdb_movie_data.update({'title': movie_detail_result['title']})
        tmdb_movie_data.update({'original_title': movie_detail_result['original_title']})
        tmdb_movie_data.update({'budget': movie_detail_result['budget']})
        tmdb_movie_data.update({'genre': genre_list})
        tmdb_movie_data.update({'language': movie_detail_result['original_language']})
        tmdb_movie_data.update({'spoken_languages': spoken_languages_list})
        tmdb_movie_data.update({'homepage': movie_detail_result['homepage']})
        tmdb_movie_data.update({'popularity': movie_detail_result['popularity']})
        tmdb_movie_data.update({'runtime': movie_detail_result['runtime']})
        tmdb_movie_data.update({'revenue': movie_detail_result['revenue']})
        tmdb_movie_data.update({'release_date': movie_detail_result['release_date']})
        tmdb_movie_data.update({'vote_average': movie_detail_result['vote_average']})
        tmdb_movie_data.update({'vote_count': movie_detail_result['vote_count']})
        tmdb_movie_data.update({'production_countries': production_countries_list})
        tmdb_movie_data.update({'production_companies': movie_detail_result['production_companies']})

        tmdb_movie_list.append(tmdb_movie_data)

        # Print out the title that was found
        print(movie_detail_result['title'])
    
    except Exception as e:
        print(str(tmdb_title) + ' not found')
        



The Attachment Diaries
Red Light Green Light
You Can Live Forever
A Tourist's Guide to Love
Other People's Children
One True Loves
The Lost Weekend: A Love Story
A Thousand and One
Your Place or Mine
Love in the Time of Fentanyl
Pamela, A Love Story
In from the Side
After Love
Alcarràs
Nelly and Monsieur Arnaud
Lady Chatterley's Lover
The Sound of Christmas
The Inspection
Bones and All
My Policeman
About Fate
Waiting for Bojangles
I Love My Dad
A Love Song
Alone Together
Art of Love
2099: The Soldier Protocol
Thor: Love and Thunder
Both Sides of the Blade
Fire of Love


In [55]:
# Preview the first 5 results in JSON format
# Use json.dumps with argument indent=4 to format data
print(json.dumps(tmdb_movie_list[:5], indent=4))


[
    {
        "title": "The Attachment Diaries",
        "original_title": "El apego",
        "budget": 0,
        "genre": [
            "Drama",
            "Mystery",
            "Thriller",
            "Horror"
        ],
        "language": "es",
        "spoken_languages": [
            "Spanish"
        ],
        "homepage": "",
        "popularity": 1.287,
        "runtime": 102,
        "revenue": 0,
        "release_date": "2021-10-07",
        "vote_average": 3.0,
        "vote_count": 4,
        "production_countries": [
            "Argentina"
        ],
        "production_companies": []
    },
    {
        "title": "Red Light Green Light",
        "original_title": "None",
        "budget": 0,
        "genre": [
            "Science Fiction",
            "Horror"
        ],
        "language": "en",
        "spoken_languages": [
            "English"
        ],
        "homepage": "",
        "popularity": 0.352,
        "runtime": 75,
        "revenue": 0,
        

In [56]:
# Convert the results to a DataFrame

tmdb_movie_list_df = pd.json_normalize(tmdb_movie_list)
tmdb_movie_list_df




Unnamed: 0,title,original_title,budget,genre,language,spoken_languages,homepage,popularity,runtime,revenue,release_date,vote_average,vote_count,production_countries,production_companies
0,The Attachment Diaries,El apego,0,"[Drama, Mystery, Thriller, Horror]",es,[Spanish],,1.287,102,0,2021-10-07,3.0,4,[Argentina],[]
1,Red Light Green Light,,0,"[Science Fiction, Horror]",en,[English],,0.352,75,0,,0.0,0,[United States of America],"[{'id': 21788, 'logo_path': None, 'name': 'Gre..."
2,You Can Live Forever,You Can Live Forever,0,"[Drama, Romance]",en,"[English, French]",https://gooddeedentertainment.com/you-can-live...,28.402,96,15055,2023-03-24,6.6,37,"[Canada, United States of America]","[{'id': 63971, 'logo_path': '/9U4LhiybfyhDPpzi..."
3,A Tourist's Guide to Love,A Tourist's Guide to Love,0,"[Romance, Comedy]",en,"[English, Vietnamese]",https://www.netflix.com/title/81424906,17.769,96,0,2023-04-21,6.287,162,[United States of America],"[{'id': 48782, 'logo_path': None, 'name': 'Hea..."
4,Other People's Children,Les Enfants des autres,0,"[Drama, Comedy]",fr,"[French, English]",https://www.wildbunch.biz/movie/other-peoples-...,11.05,104,84178,2022-09-21,6.818,190,[France],"[{'id': 7117, 'logo_path': '/mVAjfnm0GI1V6ZHiG..."
5,One True Loves,One True Loves,0,"[Romance, Comedy, Drama]",en,"[English, Spanish]",,10.023,100,37820,2023-04-07,6.5,75,"[Czech Republic, United States of America]","[{'id': 168294, 'logo_path': '/hO9hMQIAUvSEVJH..."
6,The Lost Weekend: A Love Story,The Lost Weekend: A Love Story,0,[Documentary],en,[English],https://thelostweekendmovie.com/,4.287,95,77145,2023-04-13,6.0,2,[United States of America],[]
7,A Thousand and One,A Thousand and One,0,"[Drama, Crime]",en,"[English, Spanish, Portuguese]",https://www.focusfeatures.com/a-thousand-and-one/,15.331,116,3395595,2023-03-31,6.871,89,[United States of America],"[{'id': 99963, 'logo_path': '/wi5JP4jpVBeb9qK9..."
8,Your Place or Mine,Your Place or Mine,0,"[Romance, Comedy]",en,[English],https://www.netflix.com/title/81045831,19.936,109,0,2023-02-10,6.28,710,[United States of America],"[{'id': 105382, 'logo_path': '/b94sYzp4YUqi3Dq..."
9,Love in the Time of Fentanyl,Love in the Time of Fentanyl,0,[Documentary],en,[English],,0.64,85,0,2023-02-03,0.0,0,"[Canada, United States of America]","[{'id': 10943, 'logo_path': '/9jd9RFYraPpPCz7r..."


### Merge and Clean the Data for Export

In [57]:
# Merge the New York Times reviews and TMDB DataFrames on title

nyt_tmdb_df = pd.merge(tmdb_movie_list_df, movie_title_df, on='title', how='inner')
nyt_tmdb_df




Unnamed: 0,title,original_title,budget,genre,language,spoken_languages,homepage,popularity,runtime,revenue,...,headline.main,headline.kicker,headline.content_kicker,headline.print_headline,headline.name,headline.seo,headline.sub,byline.original,byline.person,byline.organization
0,The Attachment Diaries,El apego,0,"[Drama, Mystery, Thriller, Horror]",es,[Spanish],,1.287,102,0,...,"‘The Attachment Diaries’ Review: Love, Sick",,,The Attachment Diaries,,,,By Jeannette Catsoulis,"[{'firstname': 'Jeannette', 'middlename': None...",
1,You Can Live Forever,You Can Live Forever,0,"[Drama, Romance]",en,"[English, French]",https://gooddeedentertainment.com/you-can-live...,28.402,96,15055,...,‘You Can Live Forever’ Review: Do You Love Me ...,,,You Can Live Forever,,,,By Elisabeth Vincentelli,"[{'firstname': 'Elisabeth', 'middlename': None...",
2,One True Loves,One True Loves,0,"[Romance, Comedy, Drama]",en,"[English, Spanish]",,10.023,100,37820,...,‘One True Loves’ Review: A Romance Lost at Sea,,,One True Loves,,,,By Brandon Yu,"[{'firstname': 'Brandon', 'middlename': None, ...",
3,The Lost Weekend: A Love Story,The Lost Weekend: A Love Story,0,[Documentary],en,[English],https://thelostweekendmovie.com/,4.287,95,77145,...,‘The Lost Weekend: A Love Story’ Review: When ...,,,The Lost Weekend: A Love Story,,,,By Glenn Kenny,"[{'firstname': 'Glenn', 'middlename': None, 'l...",
4,A Thousand and One,A Thousand and One,0,"[Drama, Crime]",en,"[English, Spanish, Portuguese]",https://www.focusfeatures.com/a-thousand-and-one/,15.331,116,3395595,...,‘A Thousand and One’ Review: A New York Love S...,Critic’s Pick,,An Unbending Will Meets a Shifting City,,,,By Manohla Dargis,"[{'firstname': 'Manohla', 'middlename': None, ...",
5,Your Place or Mine,Your Place or Mine,0,"[Romance, Comedy]",en,[English],https://www.netflix.com/title/81045831,19.936,109,0,...,‘Your Place or Mine’ Review: Try Neither,,,They Have a Humdrum Kind of Love,,,,By Amy Nicholson,"[{'firstname': 'Amy', 'middlename': None, 'las...",
6,Love in the Time of Fentanyl,Love in the Time of Fentanyl,0,[Documentary],en,[English],,0.64,85,0,...,‘Love in the Time of Fentanyl’ Review: Heartbr...,,,Love in the Time Of Fentanyl,,,,By Concepción de León,"[{'firstname': 'Concepción', 'middlename': Non...",
7,After Love,After Love,0,[Drama],en,"[English, Arabic, French, Urdu]",,7.059,89,0,...,‘After Love’ Review: The Other Woman,Critic’s Pick,,After Love,,,,By Beatrice Loayza,"[{'firstname': 'Beatrice', 'middlename': None,...",
8,Alcarràs,Alcarràs,3,[Drama],ca,[Catalan],https://www.alcarras-film.com/,10.042,120,2,...,‘Alcarràs’ Review: Labor of Love,,,Alcarràs,,,,By Devika Girish,"[{'firstname': 'Devika', 'middlename': None, '...",
9,The Sound of Christmas,The Sound of Christmas,0,"[TV Movie, Drama]",en,[English],,1.613,0,0,...,‘The Sound of Christmas’ Review: A Gospel Sing...,,,The Sound Of Christmas,,,,By Concepción de León,"[{'firstname': 'Concepción', 'middlename': Non...",


In [60]:
# Remove list brackets and quotation marks on the columns containing lists

nyt_tmdb_clean_file_df = nyt_tmdb_df.copy()


# Create a list of the columns that need fixing
def column_contains_lists(col):
    return col.apply(lambda x: isinstance(x, list)).any()

columns_to_fix = [col for col in nyt_tmdb_clean_file_df.columns if column_contains_lists(nyt_tmdb_clean_file_df[col])]

# Create a list of characters to remove

chars_to_remove = ['[', ']', "'", '"', '{','}',',']

def clean_string(s, chars):
    for char in chars:
        s = s.replace(char, '')
    return s

# Loop through the list of columns to fix

for column in columns_to_fix:
   
    # Convert the column to type 'str'
    # Loop through characters to remove

    nyt_tmdb_clean_file_df[column] = nyt_tmdb_clean_file_df[column].astype(str).apply(lambda x: clean_string(x, chars_to_remove))


# Display the fixed DataFrame

nyt_tmdb_clean_file_df



Unnamed: 0,title,original_title,budget,genre,language,spoken_languages,homepage,popularity,runtime,revenue,...,headline.main,headline.kicker,headline.content_kicker,headline.print_headline,headline.name,headline.seo,headline.sub,byline.original,byline.person,byline.organization
0,The Attachment Diaries,El apego,0,Drama Mystery Thriller Horror,es,Spanish,,1.287,102,0,...,"‘The Attachment Diaries’ Review: Love, Sick",,,The Attachment Diaries,,,,By Jeannette Catsoulis,firstname: Jeannette middlename: None lastname...,
1,You Can Live Forever,You Can Live Forever,0,Drama Romance,en,English French,https://gooddeedentertainment.com/you-can-live...,28.402,96,15055,...,‘You Can Live Forever’ Review: Do You Love Me ...,,,You Can Live Forever,,,,By Elisabeth Vincentelli,firstname: Elisabeth middlename: None lastname...,
2,One True Loves,One True Loves,0,Romance Comedy Drama,en,English Spanish,,10.023,100,37820,...,‘One True Loves’ Review: A Romance Lost at Sea,,,One True Loves,,,,By Brandon Yu,firstname: Brandon middlename: None lastname: ...,
3,The Lost Weekend: A Love Story,The Lost Weekend: A Love Story,0,Documentary,en,English,https://thelostweekendmovie.com/,4.287,95,77145,...,‘The Lost Weekend: A Love Story’ Review: When ...,,,The Lost Weekend: A Love Story,,,,By Glenn Kenny,firstname: Glenn middlename: None lastname: Ke...,
4,A Thousand and One,A Thousand and One,0,Drama Crime,en,English Spanish Portuguese,https://www.focusfeatures.com/a-thousand-and-one/,15.331,116,3395595,...,‘A Thousand and One’ Review: A New York Love S...,Critic’s Pick,,An Unbending Will Meets a Shifting City,,,,By Manohla Dargis,firstname: Manohla middlename: None lastname: ...,
5,Your Place or Mine,Your Place or Mine,0,Romance Comedy,en,English,https://www.netflix.com/title/81045831,19.936,109,0,...,‘Your Place or Mine’ Review: Try Neither,,,They Have a Humdrum Kind of Love,,,,By Amy Nicholson,firstname: Amy middlename: None lastname: Nich...,
6,Love in the Time of Fentanyl,Love in the Time of Fentanyl,0,Documentary,en,English,,0.64,85,0,...,‘Love in the Time of Fentanyl’ Review: Heartbr...,,,Love in the Time Of Fentanyl,,,,By Concepción de León,firstname: Concepción middlename: None lastnam...,
7,After Love,After Love,0,Drama,en,English Arabic French Urdu,,7.059,89,0,...,‘After Love’ Review: The Other Woman,Critic’s Pick,,After Love,,,,By Beatrice Loayza,firstname: Beatrice middlename: None lastname:...,
8,Alcarràs,Alcarràs,3,Drama,ca,Catalan,https://www.alcarras-film.com/,10.042,120,2,...,‘Alcarràs’ Review: Labor of Love,,,Alcarràs,,,,By Devika Girish,firstname: Devika middlename: None lastname: G...,
9,The Sound of Christmas,The Sound of Christmas,0,TV Movie Drama,en,English,,1.613,0,0,...,‘The Sound of Christmas’ Review: A Gospel Sing...,,,The Sound Of Christmas,,,,By Concepción de León,firstname: Concepción middlename: None lastnam...,


In [61]:
# Drop "byline.person" column
nyt_tmdb_clean_file_df = nyt_tmdb_clean_file_df.drop(columns=['byline.person'])
nyt_tmdb_clean_file_df

Unnamed: 0,title,original_title,budget,genre,language,spoken_languages,homepage,popularity,runtime,revenue,...,word_count,headline.main,headline.kicker,headline.content_kicker,headline.print_headline,headline.name,headline.seo,headline.sub,byline.original,byline.organization
0,The Attachment Diaries,El apego,0,Drama Mystery Thriller Horror,es,Spanish,,1.287,102,0,...,295,"‘The Attachment Diaries’ Review: Love, Sick",,,The Attachment Diaries,,,,By Jeannette Catsoulis,
1,You Can Live Forever,You Can Live Forever,0,Drama Romance,en,English French,https://gooddeedentertainment.com/you-can-live...,28.402,96,15055,...,294,‘You Can Live Forever’ Review: Do You Love Me ...,,,You Can Live Forever,,,,By Elisabeth Vincentelli,
2,One True Loves,One True Loves,0,Romance Comedy Drama,en,English Spanish,,10.023,100,37820,...,320,‘One True Loves’ Review: A Romance Lost at Sea,,,One True Loves,,,,By Brandon Yu,
3,The Lost Weekend: A Love Story,The Lost Weekend: A Love Story,0,Documentary,en,English,https://thelostweekendmovie.com/,4.287,95,77145,...,327,‘The Lost Weekend: A Love Story’ Review: When ...,,,The Lost Weekend: A Love Story,,,,By Glenn Kenny,
4,A Thousand and One,A Thousand and One,0,Drama Crime,en,English Spanish Portuguese,https://www.focusfeatures.com/a-thousand-and-one/,15.331,116,3395595,...,971,‘A Thousand and One’ Review: A New York Love S...,Critic’s Pick,,An Unbending Will Meets a Shifting City,,,,By Manohla Dargis,
5,Your Place or Mine,Your Place or Mine,0,Romance Comedy,en,English,https://www.netflix.com/title/81045831,19.936,109,0,...,569,‘Your Place or Mine’ Review: Try Neither,,,They Have a Humdrum Kind of Love,,,,By Amy Nicholson,
6,Love in the Time of Fentanyl,Love in the Time of Fentanyl,0,Documentary,en,English,,0.64,85,0,...,306,‘Love in the Time of Fentanyl’ Review: Heartbr...,,,Love in the Time Of Fentanyl,,,,By Concepción de León,
7,After Love,After Love,0,Drama,en,English Arabic French Urdu,,7.059,89,0,...,359,‘After Love’ Review: The Other Woman,Critic’s Pick,,After Love,,,,By Beatrice Loayza,
8,Alcarràs,Alcarràs,3,Drama,ca,Catalan,https://www.alcarras-film.com/,10.042,120,2,...,306,‘Alcarràs’ Review: Labor of Love,,,Alcarràs,,,,By Devika Girish,
9,The Sound of Christmas,The Sound of Christmas,0,TV Movie Drama,en,English,,1.613,0,0,...,277,‘The Sound of Christmas’ Review: A Gospel Sing...,,,The Sound Of Christmas,,,,By Concepción de León,


In [62]:
# Delete duplicate rows and reset index

nyt_tmdb_clean_file_df = nyt_tmdb_clean_file_df.drop_duplicates().reset_index()
nyt_tmdb_clean_file_df




Unnamed: 0,index,title,original_title,budget,genre,language,spoken_languages,homepage,popularity,runtime,...,word_count,headline.main,headline.kicker,headline.content_kicker,headline.print_headline,headline.name,headline.seo,headline.sub,byline.original,byline.organization
0,0,The Attachment Diaries,El apego,0,Drama Mystery Thriller Horror,es,Spanish,,1.287,102,...,295,"‘The Attachment Diaries’ Review: Love, Sick",,,The Attachment Diaries,,,,By Jeannette Catsoulis,
1,1,You Can Live Forever,You Can Live Forever,0,Drama Romance,en,English French,https://gooddeedentertainment.com/you-can-live...,28.402,96,...,294,‘You Can Live Forever’ Review: Do You Love Me ...,,,You Can Live Forever,,,,By Elisabeth Vincentelli,
2,2,One True Loves,One True Loves,0,Romance Comedy Drama,en,English Spanish,,10.023,100,...,320,‘One True Loves’ Review: A Romance Lost at Sea,,,One True Loves,,,,By Brandon Yu,
3,3,The Lost Weekend: A Love Story,The Lost Weekend: A Love Story,0,Documentary,en,English,https://thelostweekendmovie.com/,4.287,95,...,327,‘The Lost Weekend: A Love Story’ Review: When ...,,,The Lost Weekend: A Love Story,,,,By Glenn Kenny,
4,4,A Thousand and One,A Thousand and One,0,Drama Crime,en,English Spanish Portuguese,https://www.focusfeatures.com/a-thousand-and-one/,15.331,116,...,971,‘A Thousand and One’ Review: A New York Love S...,Critic’s Pick,,An Unbending Will Meets a Shifting City,,,,By Manohla Dargis,
5,5,Your Place or Mine,Your Place or Mine,0,Romance Comedy,en,English,https://www.netflix.com/title/81045831,19.936,109,...,569,‘Your Place or Mine’ Review: Try Neither,,,They Have a Humdrum Kind of Love,,,,By Amy Nicholson,
6,6,Love in the Time of Fentanyl,Love in the Time of Fentanyl,0,Documentary,en,English,,0.64,85,...,306,‘Love in the Time of Fentanyl’ Review: Heartbr...,,,Love in the Time Of Fentanyl,,,,By Concepción de León,
7,7,After Love,After Love,0,Drama,en,English Arabic French Urdu,,7.059,89,...,359,‘After Love’ Review: The Other Woman,Critic’s Pick,,After Love,,,,By Beatrice Loayza,
8,8,Alcarràs,Alcarràs,3,Drama,ca,Catalan,https://www.alcarras-film.com/,10.042,120,...,306,‘Alcarràs’ Review: Labor of Love,,,Alcarràs,,,,By Devika Girish,
9,9,The Sound of Christmas,The Sound of Christmas,0,TV Movie Drama,en,English,,1.613,0,...,277,‘The Sound of Christmas’ Review: A Gospel Sing...,,,The Sound Of Christmas,,,,By Concepción de León,


In [64]:
# Export data to CSV without the index

nyt_tmdb_clean_file_df.to_csv('nyt_tmdb_movies.csv', index=False)
