# Content-Based Movie Recommendation

Dataset Source:

[wikipedia-movie-plots](https://www.kaggle.com/datasets/jrobischon/wikipedia-movie-plots/)

In [2]:
# Import dependencies
import pandas as pd
import numpy as np

from nltk.tokenize import RegexpTokenizer
from nltk.stem import WordNetLemmatizer,PorterStemmer
from nltk.corpus import stopwords

from sklearn.feature_extraction.text import TfidfVectorizer

import warnings
from tqdm.notebook import tqdm

# hide pandas warning messages
warnings.filterwarnings('ignore')

In [3]:
pd.set_option('display.max_columns', None)
pd.set_option('display.max_rows', None)

In [4]:
df = pd.read_csv('wiki_movie_plots_deduped.csv')

df.shape

(34886, 8)

In [5]:
from google.colab import drive
drive.mount('/content/drive')

Drive already mounted at /content/drive; to attempt to forcibly remount, call drive.mount("/content/drive", force_remount=True).


In [6]:
df.sample(4)

Unnamed: 0,Release Year,Title,Origin/Ethnicity,Director,Cast,Genre,Wiki Page,Plot
11465,1990,Mermaids,American,Richard Benjamin,"Cher, Winona Ryder, Bob Hoskins, Michael Schoe...",comedy,https://en.wikipedia.org/wiki/Mermaids_(1990_f...,"The film is narrated by Charlotte Flax, a quir..."
30884,2008,Thiruvannamalai,Tamil,Perarasu,"Arjun Sarja, Pooja Gandhi",action,https://en.wikipedia.org/wiki/Thiruvannamalai_...,Easwaran (Arjun Sarja) is upright and honest y...
19127,1954,The Beachcomber,British,Muriel Box,"Donald Sinden, Glynis Johns",comedy/drama,https://en.wikipedia.org/wiki/The_Beachcomber_...,The new British Resident of the Welcome Island...
2043,1936,Colleen,American,Alfred E. Green,"Dick Powell, Joan Blondell, Hugh Herbert","comedy, musical",https://en.wikipedia.org/wiki/Colleen_(film),"Colleen is the manager of a dress shop named ""..."


In [7]:
# Checking datatypes
df.dtypes

Release Year         int64
Title               object
Origin/Ethnicity    object
Director            object
Cast                object
Genre               object
Wiki Page           object
Plot                object
dtype: object

### PreProcessing

**Converting all datatypes to string**

In [8]:
df.columns

Index(['Release Year', 'Title', 'Origin/Ethnicity', 'Director', 'Cast',
       'Genre', 'Wiki Page', 'Plot'],
      dtype='object')

In [9]:
df =  df.astype(str)

df.dtypes

Release Year        object
Title               object
Origin/Ethnicity    object
Director            object
Cast                object
Genre               object
Wiki Page           object
Plot                object
dtype: object

### Data Cleaning

Action Items:
* Lower-Case the whole data frame
* Director: Removing 'Director:' and 'Cast:'
* Director, Cast: Removing '\r\n', '\n' and '\r'
* Genre: Replacing '/' with Space
* Director, Cast, Genre: Removing 'Uknonwn' and 'Nan'
* Director: Separating Directors and Actors names
* Director, Cast: Checking if the names are separated with ' and ', ' & '
* Director, Cast: Merging the first names and last names together
* Director, Cast: Adding the words of 'Director' and 'Actor' as prefix
* Plot: Removing English Stopwords
* Doc: Removing special characters

In [10]:
df = df.applymap(lambda x: x.lower() if isinstance(x,str) else x)

In [11]:
# Remove prefixes "director:" and "cast:" in the "Director" column
df["Director"] = df["Director"].str.replace("director:", "", regex=False)
df["Director"] = df["Director"].str.replace("cast:", "", regex=False)


# Replace carriage returns and newlines with a space
df["Director"] = df["Director"].str.replace("\r\n", " ", regex=False)
df["Cast"] = df["Cast"].str.replace("\r\n", " ", regex=False)

df["Director"] = df["Director"].str.replace("\n", " ", regex=False)
df["Cast"] = df["Cast"].str.replace("\n", " ", regex=False)


# Replace slashes with spaces in the "Genre" column
df["Genre"] = df["Genre"].str.replace("/", " ", regex=False)


# Remove the word "unknown" in the "Director", "Cast", and "Genre" columns
df["Director"] = df["Director"].str.replace("unknown", "", regex=False)
df["Cast"] = df["Cast"].str.replace("unknown", "", regex=False)
df["Genre"] = df["Genre"].str.replace("unknown", "", regex=False)


# Remove the word "nan" in the "Director", "Cast", and "Genre" columns
df["Director"] = df["Director"].str.replace("nan", "", regex=False)
df["Cast"] = df["Cast"].str.replace("nan", "", regex=False)
df["Genre"] = df["Genre"].str.replace("nan", "", regex=False)


# Replace " and " and " & " with commas in the "Director" and "Cast" columns
df["Director"] = df["Director"].str.replace(" and ", ",", regex=False)
df["Cast"] = df["Cast"].str.replace(" and ", ",", regex=False)
df["Director"] = df["Director"].str.replace(" & ", ",", regex=False)
df["Cast"] = df["Cast"].str.replace(" & ", ",", regex=False)

# Remove all whitespace in the "Director" and "Cast" columns
df["Director"] = df["Director"].str.replace(" ", "", regex=False)
df["Cast"] = df["Cast"].str.replace(" ", "", regex=False)

# Replace commas with spaces in the "Director" and "Cast" columns
df["Director"] = df["Director"].str.replace(",", " ", regex=False)
df["Cast"] = df["Cast"].str.replace(",", " ", regex=False)

In [12]:
# Add 'director' prefix to non-empty "Director" entries
df["Director"] = np.where(df["Director"].str.len() > 0,
                          'director' + df["Director"],
                          df["Director"])

# Add 'actor' prefix to non-empty "Cast" entries
df["Cast"] = np.where(df["Cast"].str.len() > 0,
                      'actor' + df["Cast"],
                      df["Cast"])

# Replace spaces with ' director' in the "Director" column:
df["Director"] = df["Director"].str.replace(" ", " director", regex=False)


# Replace spaces with ' actor' in the "Cast" column
df["Cast"] = df["Cast"].str.replace(" ", " actor", regex=False)

In [13]:
df.sample(5)

Unnamed: 0,Release Year,Title,Origin/Ethnicity,Director,Cast,Genre,Wiki Page,Plot
32353,2008,baladur,telugu,directorudayasankar,actorraviteja actorkrishna actoranushkashetty ...,drama,https://en.wikipedia.org/wiki/baladur,chanti (ravi teja) respects his uncle rama kri...
14513,2004,never die alone,american,directorernestr.dickerson,actordmx actordavidarquette,crime drama,https://en.wikipedia.org/wiki/never_die_alone,hardened criminal and drug dealer king david (...
2700,1939,undercover doctor,american,directorlouisking,actorlloydnolan actorjanicelogan,drama,https://en.wikipedia.org/wiki/undercover_doctor,dr. bartley morgan appears to be a highly resp...
30832,2008,sila nerangalil,tamil,directorjayaraj,actorvincentasokan actornavyanair actorvineeth,thriller,https://en.wikipedia.org/wiki/sila_nerangalil,a murder case that took place in mid sixties i...
4513,1947,magic town,american,directorwilliamwellman,actorjamesstewart actorjanewyman,drama,https://en.wikipedia.org/wiki/magic_town,"lawrence ""rip"" smith (james stewart) is a form..."


### Merging the document

In [14]:
column_weights = {"Release Year": 10,
                  "Title": 1,
                  "Origin/Ethnicity": 5,
                  "Director": 5,
                  "Cast": 1,
                  "Genre": 10,
                  "Plot": 1}

df["doc"] = ""

for col in column_weights.keys():
    df["doc"] += column_weights[col] * (df[col] + ' ')

df.head()

Unnamed: 0,Release Year,Title,Origin/Ethnicity,Director,Cast,Genre,Wiki Page,Plot,doc
0,1901,kansas saloon smashers,american,,,,https://en.wikipedia.org/wiki/kansas_saloon_sm...,"a bartender is working at a saloon, serving dr...",1901 1901 1901 1901 1901 1901 1901 1901 1901 1...
1,1901,love by the light of the moon,american,,,,https://en.wikipedia.org/wiki/love_by_the_ligh...,"the moon, painted with a smiling face hangs ov...",1901 1901 1901 1901 1901 1901 1901 1901 1901 1...
2,1901,the martyred presidents,american,,,,https://en.wikipedia.org/wiki/the_martyred_pre...,"the film, just over a minute long, is composed...",1901 1901 1901 1901 1901 1901 1901 1901 1901 1...
3,1901,"terrible teddy, the grizzly king",american,,,,"https://en.wikipedia.org/wiki/terrible_teddy,_...",lasting just 61 seconds and consisting of two ...,1901 1901 1901 1901 1901 1901 1901 1901 1901 1...
4,1902,jack and the beanstalk,american,directorgeorges.fleming directoredwins.porter,,,https://en.wikipedia.org/wiki/jack_and_the_bea...,the earliest known adaptation of the classic f...,1902 1902 1902 1902 1902 1902 1902 1902 1902 1...


### Removing Special Characters

In [15]:
df["doc"] = df["doc"].str.replace("[^a-z 0-9]+", "", regex=True)

In [16]:
pd.set_option('display.max_colwidth', None)
df[["doc"]].sample(10)

Unnamed: 0,doc
10229,1984 1984 1984 1984 1984 1984 1984 1984 1984 1984 just the way you are american american american american american directordouardmolinaro directordouardmolinaro directordouardmolinaro directordouardmolinaro directordouardmolinaro actorkristymcnichol actormichaelontkean comedy comedy comedy comedy comedy comedy comedy comedy comedy comedy susan is a professional flautist in boston who has been handicapped since childhood and is forced to wear a leg brace to get around she is all set to enter into a lavender marriage with her gay investment banker friend frank in order to help him hide his sexuality so he can get ahead in business and get a big promotion but decides not to when she realizes that the marriage wont meet her or his sexual needs shortly afterwards she accepts the offer to travel to europe on a concert tour while in paris she comes up with an idea to disguise her leg by putting it in a cast and travel on her own to the french alps to be treated without pity not looking to find romance susan however has become the interest of peter a news photographer they soon fall in love and peter dumps his insufferable and narcissistic girlfriend bobbie for her susan is forced to decide if she should tell peter the truth about herself
12394,1995 1995 1995 1995 1995 1995 1995 1995 1995 1995 catherine the great american american american american american directormarvinjchomsky directorjohngoldsmith directormarvinjchomsky directorjohngoldsmith directormarvinjchomsky directorjohngoldsmith directormarvinjchomsky directorjohngoldsmith directormarvinjchomsky directorjohngoldsmith actorcatherinezetajones actorjeannemoreau biography biography biography biography biography biography biography biography biography biography a young german princess catherine zetajones gets married to the immature future czar peter iii hannes jaenicke she gradually becomes a skillful politician and rises to become catherine the great
34373,1992 1992 1992 1992 1992 1992 1992 1992 1992 1992 madame aema 7 southkorean southkorean southkorean southkorean southkorean directorsukdowon directorsukdowon directorsukdowon directorsukdowon directorsukdowon actorkangseungmi in this episode in the longrunning madame aema series aema leaves her selfish middleaged husband to pursue a career as an actress she meets a performance artist who persuades her to perform perverted sex acts in the name of art finally repenting of her decision she returns to her husband1
3413,1942 1942 1942 1942 1942 1942 1942 1942 1942 1942 road to happiness american american american american american directorphilrosen directorphilrosen directorphilrosen directorphilrosen directorphilrosen actorjohnboles actormonabarrie drama drama drama drama drama drama drama drama drama drama a bittersweet story of a familys road to happiness jeff carter john boles has just returned from europe eager to see his family charley grady roscoe karns his agent informs jeff that his wife millie mona barrie has divorced him and has remarried to a millionaire sam rankin jeff has discovered that his narcissistic ex has sent danny to military boarding school because she would rather socialize with her friendsdanny is glad his father is home from his twoyear baritone opera studies and is happy to live with him again although they share one room in a boarding house jeff and danny have no money and jeff cannot find a singing job he finds a radio job with an acting part as an indian on a cowboy showdanny realizes he is in the way of his fathers dream to sing and tries to push him away but admits to his father that he cant lie to him his father insists on continuing to act so that they can spend more time togetherjeff gets his long awaited chance
21246,2012 2012 2012 2012 2012 2012 2012 2012 2012 2012 dredd british british british british british directorpetetravis directorpetetravis directorpetetravis directorpetetravis directorpetetravis actordirectorpetetraviscastkarlurban actoroliviathirlby actorwoodharris actorlenaheadey the future united states is a dystopic irradiated wasteland known as the cursed earth on the east coast lies megacity one a violent metropolis with 800 million residents and 17000 crimes reported daily the only force for order are the judges who act as judge jury and executioner judge dredd is tasked by the chief judge with evaluating new recruit cassandra anderson a powerful psychic who failed the aptitude tests to become a judgein peach trees a 200storey slum tower block drug lord madeline madrigal also known as mama executes three rogue drug dealers by having them skinned alive infused with slomo an addictive new drug which reduces the users perception of time to 1 of normal and thrown down the atrium from the top floor dredd and anderson are sent in to investigate and learn of a drug den which they raid they arrest a thug named kay whom andersons mind probe reveals to be the one who carried out the drug dealers executions dredd decides to take him in for questioning in response mamas forces seize the towers security control room and seal the building using its blast shields under the pretence of a security test preventing the judges from leaving or summoning helpmama orders dredd and anderson killed forcing the judges to fight their way through dozens of armed thugs arriving at the 76th floor the judges are assaulted by mama and her men with vulcan cannons that rip through the walls killing numerous residents the judges breach an outer wall and call for backup meanwhile mama sends her henchman caleb to search for the judges when they meet dredd throws caleb off the tower in full view of mamadredd suspects mama is desperate to keep kay quiet and beats him for information anderson reads kays mind and learns that peach trees is the centre of slomo production and distribution anderson suggests they hide while awaiting assistance but dredd insists they move up the tower and pursue mama judges volt and guthrie respond to dredds call but mamas computer expert denies them entry by persuading them the security system is malfunctioning a pair of armed teens confront dredd and anderson allowing kay to disarm and overpower anderson kay then escapes with her as hostage and takes her to mamas base on the top floorwhile dredd works his way towards mama she calls in the corrupt judges lex kaplan chan and alvarez the four relieve volt and guthrie from duty and are allowed into the building dredd encounters chan and is suspicious that he does not ask about andersons status seeing his cover blown chan attacks dredd but is killed meanwhile kay tries to execute anderson with her own weapon but the pistols dna scanner does not recognise him and explodes taking his arm off she escapes and later encounters kaplan whom she promptly kills after reading kaplans mind elsewhere dredd kills alvarez but runs out of ammunition and is shot by lex in the abdomen lex moves in to execute dredd but dredd stalls him long enough for anderson to arrive and kill lexanderson and dredd obtain the code to mamas apartment from her computer expert and confront her mama tells dredd that in the case of her death a device on her wrist will detonate explosives on the top floors destroying the building dredd reasons that the detonators signal will not reach the explosives from the ground floor so he forces mama to inhale slomo and throws her down the atrium to her deathin the aftermath anderson accepts that she has failed her evaluation by getting disarmed and leaves the chief judge asks dredd about andersons performance he responds that she has passed
24429,1956 1956 1956 1956 1956 1956 1956 1956 1956 1956 chori chori bollywood bollywood bollywood bollywood bollywood directoratthakur directoratthakur directoratthakur directoratthakur directoratthakur actorrajkapoor actornargis actorpran actorjohnnywalker actorgope actorbhagwan actorrajasulochana romantic comedy romantic comedy romantic comedy romantic comedy romantic comedy romantic comedy romantic comedy romantic comedy romantic comedy romantic comedy kammo nargis lives a very wealthy lifestyle with her widowed multimillionaire dad girhdarilal gope who would like her to get married to someone who is not after their wealth to his dismay she chooses to marry a pilot named sumankumar pran who is known for womanizing and for his greed when he disapproves she runs away he advertises for her safe return and offers to pay rs125 lakh to the finderfour days later kammo returns and she is not the same anymore she is more humble sober and respectful fully appreciative of this girdharilal agrees to her marriage to sumankumar just before the marriage a man named sagar raj kapoor approaches them this visit will change their lives forever
25521,1989 1989 1989 1989 1989 1989 1989 1989 1989 1989 hum intezaar karenge bollywood bollywood bollywood bollywood bollywood hum intezaar karenge is an action drama featuring mithun chakraborty and padmini kolhapure in lead roles well supported by vinod mehra jagdeep shakti kapoor vinod mehra and shafi inamdar
8192,1967 1967 1967 1967 1967 1967 1967 1967 1967 1967 common law cabin american american american american american directorrussmeyer directorrussmeyer directorrussmeyer directorrussmeyer directorrussmeyer actoralainacapri actoradelerein comedy comedy comedy comedy comedy comedy comedy comedy comedy comedy dewey hoople jack moran runs a broken down tourist trap along the colorado river along with his french wife babette babette bardot and his daughter coral adele rein business is so bad that hoople must pay a local alcoholic frank bolger as cracker to entice tourists called suckers to spend some time and money there
12679,1996 1996 1996 1996 1996 1996 1996 1996 1996 1996 the english patient american american american american american directoranthonyminghella directoranthonyminghella directoranthonyminghella directoranthonyminghella directoranthonyminghella actorralphfiennes actorkristinscottthomas actorjuliettebinoche actorwillemdafoe drama drama drama drama drama drama drama drama drama drama in the final days of the italian campaign of world war ii hana a frenchcanadian nurse working and living in a bombedout italian monastery looks after a critically burned man who speaks english but cannot remember his name they are joined by kip a sikh sapper in the british army who defuses bombs and has a love affair with hana before leaving for florence and david caravaggio a canadian intelligence corps operative who was questioned by germans and has had his thumbs cut off during a german interrogation caravaggio questions the patient who gradually reveals his pastthe patient tells hana and caravaggio that in the late 1930s he was exploring the desert of libya he is revealed to be hungarian cartographer count lszl de almsy who was mapping the sahara as part of a royal geographical society archeological and surveying expedition in egypt and libya with englishman peter madox and others their expedition is joined by a british couple geoffrey and katharine clifton almsy falls in love with katharine and writes about her in his book which katharine reads the two thereafter begin an affair which eventually katharine ends almsy declares that he has found the cave of swimmers an archaeological survey is conducted on it and the surrounding area until they are stopped due to the onset of the war madox leaves his tiger moth plane at kufra oasis before his intended return to britainwhile almsy is packing up their base camp geoffrey in attempted murdersuicide after apparently deducing almsy and katharine were in an affair deliberately crashes the plane narrowly missing almsy geoffrey is killed instantly and katharine is seriously injured almsy carries her to the cave of swimmers leaving her with provisions and begins a threeday walk to get help at britishheld el tag he attempts to explain the situation but is detained as a possible german spy and transported on a train he escapes from the train and trades the geographical society maps to the germans for gasoline he finds madoxs tiger moth and flies back to the cave but katharine has died as he flies himself and katharines body away they are shot down by german antiaircraft guns almsy is badly burned and is rescued by the bedouinafter he has related the story almsy indicates to hana that he wants a lethal dose of morphine she complies and reads katharines final journal entries to him as he dies she and caravaggio leave the monastery for florence
2618,1939 1939 1939 1939 1939 1939 1939 1939 1939 1939 the magnificent fraud american american american american american directorrobertflorey directorrobertflorey directorrobertflorey directorrobertflorey directorrobertflorey actorakimtamiroff actorpatriciamorison comedy comedy comedy comedy comedy comedy comedy comedy comedy comedy akim tamiroff plays an actor performing in a nameless latin american country who is pressed into service when the president is fatally injured by a bomb impersonating the president the actor balances the pleasures and temptations of office dangerous palace intrigue and his duty to the people of the countrythe plot is identical to the 1988 richard dreyfuss film moon over parador both are based on a short story by charles g booth called caviar for his excellencyparts of the film were shot in balboa park in san diego


### Removing Stopwords

In [17]:
import nltk
nltk.download('stopwords')
nltk.download('wordnet')

[nltk_data] Downloading package stopwords to /root/nltk_data...
[nltk_data]   Package stopwords is already up-to-date!
[nltk_data] Downloading package wordnet to /root/nltk_data...
[nltk_data]   Package wordnet is already up-to-date!


True

In [18]:
stops = stopwords.words('english')
print(stops)

['i', 'me', 'my', 'myself', 'we', 'our', 'ours', 'ourselves', 'you', "you're", "you've", "you'll", "you'd", 'your', 'yours', 'yourself', 'yourselves', 'he', 'him', 'his', 'himself', 'she', "she's", 'her', 'hers', 'herself', 'it', "it's", 'its', 'itself', 'they', 'them', 'their', 'theirs', 'themselves', 'what', 'which', 'who', 'whom', 'this', 'that', "that'll", 'these', 'those', 'am', 'is', 'are', 'was', 'were', 'be', 'been', 'being', 'have', 'has', 'had', 'having', 'do', 'does', 'did', 'doing', 'a', 'an', 'the', 'and', 'but', 'if', 'or', 'because', 'as', 'until', 'while', 'of', 'at', 'by', 'for', 'with', 'about', 'against', 'between', 'into', 'through', 'during', 'before', 'after', 'above', 'below', 'to', 'from', 'up', 'down', 'in', 'out', 'on', 'off', 'over', 'under', 'again', 'further', 'then', 'once', 'here', 'there', 'when', 'where', 'why', 'how', 'all', 'any', 'both', 'each', 'few', 'more', 'most', 'other', 'some', 'such', 'no', 'nor', 'not', 'only', 'own', 'same', 'so', 'than', '

In [19]:
lemmatizer = WordNetLemmatizer()
stemmer = PorterStemmer()

def preprocess(sentence):
    tokenizer = RegexpTokenizer(r'\w+')
    tokens = tokenizer.tokenize(sentence)

    # Filters out tokens that are shorter than 3 characters and tokens that are in the list of stopwords
    filtered_words = [w for w in tokens if len(w) > 2 if not w in stopwords.words('english')]

    # Applies the PorterStemmer to each filtered word to reduce it to its stem
    stem_words=[stemmer.stem(w) for w in filtered_words]

    # Applies the WordNetLemmatizer to each stemmed word to reduce it to its base form.
    lemma_words=[lemmatizer.lemmatize(w) for w in stem_words]

    # Joins the lemmatized words back into a single string, separated by spaces.
    return " ".join(lemma_words)

df['doc_clean'] = df['doc'].map(lambda s:preprocess(s))

In [20]:
df[["doc", 'doc_clean']].sample(10)

Unnamed: 0,doc,doc_clean
29207,1959 1959 1959 1959 1959 1959 1959 1959 1959 1959 vaazha vaitha deivam tamil tamil tamil tamil tamil directormathirumugam directormathirumugam directormathirumugam directormathirumugam directormathirumugam actorgeminiganesan actorbsarojadevi actortsbalaiah actorsvsubbaiah actorkuladheivamvrrajagopal actortsmuthaiah actorsandowmmachinnappathevar actorrajabahadhoor actorpkannamba actorgsakunthala actork actormalathi actortpmuthulakshmi the story rather complicated is set against a rural backdrop it is about two families with certain individuals who create misunderstandings between them a young man and a women from the two families fall in love and undergo tribulations which include kidnapping and attempts to murder the mother is a unifying force who has her own struggles before she brings all of them together in a happy ending1,1959 1959 1959 1959 1959 1959 1959 1959 1959 1959 vaazha vaitha deivam tamil tamil tamil tamil tamil directormathirumugam directormathirumugam directormathirumugam directormathirumugam directormathirumugam actorgeminiganesan actorbsarojadevi actortsbalaiah actorsvsubbaiah actorkuladheivamvrrajagop actortsmuthaiah actorsandowmmachinnappathevar actorrajabahadhoor actorpkannamba actorgsakunthala actork actormalathi actortpmuthulakshmi stori rather complic set rural backdrop two famili certain individu creat misunderstand young man woman two famili fall love undergo tribul includ kidnap attempt murder mother unifi forc struggl bring togeth happi ending1
90,1914 1914 1914 1914 1914 1914 1914 1914 1914 1914 making a living american american american american american directorhenrylehrman directorhenrylehrman directorhenrylehrman directorhenrylehrman directorhenrylehrman actorcharliechaplin actorvirginiakirtley actoralicedavenport comedy comedy comedy comedy comedy comedy comedy comedy comedy comedy chaplins character attempts to convince a passerby director henry lehrman to give him money chaplin is then shown flirting with a woman and proposes to her which she accepts lehrman enters to present the woman with flowers and a ring which the woman refuses citing shes engaged lerhman sees chaplin and a slapstick fight between the two ensues later lehrmans character takes a photograph of an automobile accident chaplins character steals the camera whilst the journalist is helping a trapped motorist and rushes back to the paper with it to claim the photograph as his own a short pursuit with the keystone kops follows2,1914 1914 1914 1914 1914 1914 1914 1914 1914 1914 make live american american american american american directorhenrylehrman directorhenrylehrman directorhenrylehrman directorhenrylehrman directorhenrylehrman actorcharliechaplin actorvirginiakirtley actoralicedavenport comedi comedi comedi comedi comedi comedi comedi comedi comedi comedi chaplin charact attempt convinc passerbi director henri lehrman give money chaplin shown flirt woman propos accept lehrman enter present woman flower ring woman refus cite she engag lerhman see chaplin slapstick fight two ensu later lehrman charact take photograph automobil accid chaplin charact steal camera whilst journalist help trap motorist rush back paper claim photograph short pursuit keyston kop follows2
31858,1986 1986 1986 1986 1986 1986 1986 1986 1986 1986 veta telugu telugu telugu telugu telugu directorakodandaramireddy directorakodandaramireddy directorakodandaramireddy directorakodandaramireddy directorakodandaramireddy actorchiranjeevi actorjayapradha actorsumalatha actorjaggayya chiranjeevi is a sailor working on a ship during the british rule of india he is in love with a wealthy woman jayaprada jayapradas cousin who works for the british army also wants to marry her when the captain of the ship csrao is poisoned and killed jayapradas cousin uses his power to put chiru away for good at the secluded andaman jail chiru is trapped in this nightmare that lasts for thirteen years haunted by the baffling course his life has taken over time everything he ever believed about right and wrong is abandoned and replaced by allconsuming thoughts of vengeance against those who betrayed him with the help of an equally innocent fellow inmate jaggaiah who was once a jamindar that opposed the british only to lose his wealth wife and daughter sumalatha chiru plots and succeeds in his mission to escape from prison whereupon he transforms himself into the mysterious and wealthy jamindar he finds the daughter of jaggayya and shelters her with him with cunning ruthlessness he cleverly insinuates himself into the highclass nobility and systematically destroys the men who manipulated and enslaved him,1986 1986 1986 1986 1986 1986 1986 1986 1986 1986 veta telugu telugu telugu telugu telugu directorakodandaramireddi directorakodandaramireddi directorakodandaramireddi directorakodandaramireddi directorakodandaramireddi actorchiranjeevi actorjayapradha actorsumalatha actorjaggayya chiranjeevi sailor work ship british rule india love wealthi woman jayaprada jayaprada cousin work british armi also want marri captain ship csrao poison kill jayaprada cousin use power put chiru away good seclud andaman jail chiru trap nightmar last thirteen year haunt baffl cours life taken time everyth ever believ right wrong abandon replac allconsum thought vengeanc betray help equal innoc fellow inmat jaggaiah jamindar oppos british lose wealth wife daughter sumalatha chiru plot succe mission escap prison whereupon transform mysteri wealthi jamindar find daughter jaggayya shelter cun ruthless cleverli insinu highclass nobil systemat destroy men manipul enslav
28406,2013 2013 2013 2013 2013 2013 2013 2013 2013 2013 zachariayude garbhinikal malayalam malayalam malayalam malayalam malayalam directoraneeshanvar directoraneeshanvar directoraneeshanvar directoraneeshanvar directoraneeshanvar actorlal actorrimakallingal actorsanusha comedy comedy comedy comedy comedy comedy comedy comedy comedy comedy the film narrates the incidents in the life of a gynaecologist and five women who come into his life each with unconventionalillegitimate pregnancies lal acts as the gynaecologist and asha sharreth does the role of doctors wife sanusha plays the role of an eighteenyearold girl who refuses to abort her child and reveal the childs father in the end she gives her baby to the gynaecologist and his wife who dont have children of their own after some months she visits the doctors house and leaves him a book and from reading one of the story in the book that she specially marked he figures out that she bore the child of her father rimas character is a nurse while geetha plays an elderly woman who gets pregnant through artificial insemination7 aju varghese appears as ajmal who has strong feelings for fatima however due to their height difference he is unable to confide his love for her sandra thomas plays the role of another expectant woman who bears her boyfriends child which she wants to conceive only if her husband dies and joy mathew acts as her husband6,2013 2013 2013 2013 2013 2013 2013 2013 2013 2013 zachariayud garbhinik malayalam malayalam malayalam malayalam malayalam directoraneeshanvar directoraneeshanvar directoraneeshanvar directoraneeshanvar directoraneeshanvar actorl actorrimakalling actorsanusha comedi comedi comedi comedi comedi comedi comedi comedi comedi comedi film narrat incid life gynaecologist five woman come life unconventionalillegitim pregnanc lal act gynaecologist asha sharreth role doctor wife sanusha play role eighteenyearold girl refus abort child reveal child father end give babi gynaecologist wife dont child month visit doctor hous leav book read one stori book special mark figur bore child father rima charact nurs geetha play elderli woman get pregnant artifici insemination7 aju varghes appear ajmal strong feel fatima howev due height differ unabl confid love sandra thoma play role anoth expect woman bear boyfriend child want conceiv husband die joy mathew act husband6
27843,2003 2003 2003 2003 2003 2003 2003 2003 2003 2003 war and love malayalam malayalam malayalam malayalam malayalam directorvinayan directorvinayan directorvinayan directorvinayan directorvinayan actordileep actorprabhu the film begins with major rajendran suresh krishna being killed by the pakistani terrorists in the indopak border and the war between india and pakistan begins pakistani army led by general jaffer khan mukesh rishi sends a battalion to capture a village on the indian side of the line of control indian army brigadier nayar captain raju sends the madras regiment to recapture the village madras regiment contains ltcol sharath chandran prabhu captain gopinath dileep major prabhakar saikumar captain kabir siddique captain vijayan vijayaraghavan havildar kurian jagadish private basheer kalabhavan mani naik haneefa havildar prashanthan naik kunjunni machan varghese captain hema indraja and private shankar they recapture the village after a fierce gun battle that kill all the pakistani soldiers but prabhakar and kunjunni die during this battle jaffer khan is angered by this defeat and hatch a plan to capture the entire madrasi regiment alive he calls colonel mushtaq muhammad an isi agent in the indian army and pays him 5 crores rupees for capturing the madras regimentmushtaq muhammad hatch a plan in which all of the madras regiment except gopinath and vijayan were captured gopi kills mushtaq but is captured by the pakistanis all the prisoners of war are sent to a pakistani camp where they get tourtured they are forced to work like slaves kabir haneefa kurian and hema sharaths love interest are killed by the pakis meanwhile notorious pakistani terrorist leader mansoor akthar arrive in the camp jaffer khans daughter beautiful serina laila also arrive there she was about to be raped by mansoor but gopi kills him by dropping a big rock on the terrorists head serina falls in love with gopi while he decides to use it to save his country serina knows malayalam since jaffer khans father migrated from malappuram to pakistan during the partition meanwhile captain vijayan has infiltrated the pak military and gets information that pakistan is going to use nuclear weapons in the wake of a lost war with india gopi with the help of serina gets access to the defusing codes of the missile the climax is fully war between indian pows freed by vijayan and pak armyterrorists finally the nuclear bomb is defused by gopi and entire pak army is killed jaffer khan is killed by sharath who also dies due to injuries entire pak camp is blown up and only gopi serina and vijayan survive the holocaust india wins the war and gopi is given param vir chakra on his return to india gopi marries serina movie ends with serina chanting bharat mata ki jai,2003 2003 2003 2003 2003 2003 2003 2003 2003 2003 war love malayalam malayalam malayalam malayalam malayalam directorvinayan directorvinayan directorvinayan directorvinayan directorvinayan actordileep actorprabhu film begin major rajendran suresh krishna kill pakistani terrorist indopak border war india pakistan begin pakistani armi led gener jaffer khan mukesh rishi send battalion captur villag indian side line control indian armi brigadi nayar captain raju send madra regiment recaptur villag madra regiment contain ltcol sharath chandran prabhu captain gopinath dileep major prabhakar saikumar captain kabir siddiqu captain vijayan vijayaraghavan havildar kurian jagadish privat basheer kalabhavan mani naik haneefa havildar prashanthan naik kunjunni machan varghes captain hema indraja privat shankar recaptur villag fierc gun battl kill pakistani soldier prabhakar kunjunni die battl jaffer khan anger defeat hatch plan captur entir madrasi regiment aliv call colonel mushtaq muhammad isi agent indian armi pay crore rupe captur madra regimentmushtaq muhammad hatch plan madra regiment except gopinath vijayan captur gopi kill mushtaq captur pakistani prison war sent pakistani camp get tourtur forc work like slave kabir haneefa kurian hema sharath love interest kill paki meanwhil notori pakistani terrorist leader mansoor akthar arriv camp jaffer khan daughter beauti serina laila also arriv rape mansoor gopi kill drop big rock terrorist head serina fall love gopi decid use save countri serina know malayalam sinc jaffer khan father migrat malappuram pakistan partit meanwhil captain vijayan infiltr pak militari get inform pakistan go use nuclear weapon wake lost war india gopi help serina get access defus code missil climax fulli war indian pow freed vijayan pak armyterrorist final nuclear bomb defus gopi entir pak armi kill jaffer khan kill sharath also die due injuri entir pak camp blown gopi serina vijayan surviv holocaust india win war gopi given param vir chakra return india gopi marri serina movi end serina chant bharat mata jai
30463,2002 2002 2002 2002 2002 2002 2002 2002 2002 2002 charlie chaplin tamil tamil tamil tamil tamil directorsakthichidambaram directorsakthichidambaram directorsakthichidambaram directorsakthichidambaram directorsakthichidambaram actorprabhu actorprabhudeva actorabhirami actorgayathriraguram ramakrishnan prabhu is a rich businessman in ooty who owns an advertising company and is married to mythili abirami who is very possessive about her husband mythili always suspects her husband fearing that he would end up having an affair with some other girl and this brings frequent quarrels between the couple but ramakrishnan is a kind hearter gentleman and he takes care of his wife with great lovethirunavukkarasu prabhu deva is a poor photographer in the same town and initially ramakrishnan minunderstands thiru to be a rogue later understands his good nature and provides him a job in his own company thiru is very loyal to ramakrishnan and mythili and respects ramakrishnan as his brother ramakrishnan is also very kind to thiru one day thiru meets a girl susi gayathri raghuram and the both fall in love with each other susi is a social activist who voices for women empowermentvishwa livingston is a close friend of ramakrishnan and is married to amudha vindhya but vishwa is a play boy and has affairs with so many girls one day a small quarrel erupts between ramakrishnan and mythili following which ramakrishnan worries thinking about his wifes continuous suspecting behaviour vishwa plans to relax ramakrishnan by engaging a call girl thilothama monalramakrishnan although not interested in it finally decides to spend some time with thiliothama when mythili is away to tirupathi thilothama comes to ramakrishnans guest house where thiru lives suddenly mythili cancels her trip and returns home on the way she finds ramakrishnans car in thirus home and she also comes to thirus home mythili gets shocked to see thilothama and ramakrishnan in thirus home ramakrishnan suddenly manages the situation by lying that thilothama is none other than thirus lover mythili believes this while thiru does not reveal the truth knowing this as it would separate ramakrishnan from his mythilithen it is cat and mouse game where thiru tries to act as thilothamas love in front of mythili at the same time tries hard not to get caught by susi as she is short tempered and hates some lying to her finally mythili and susi get to know about the lies told by thiru and ramakrishnan ramakrishnan and thiru try hard to find thilothama and make her tell all the truth that nothing happened between them but to their surprise thilothama passes away and the two guys have no other proof nowsusi decides to break up with thiru while mythili applies for divorce with ramakrishnan finally in the court ramakrishnan expresses how much he loves mythili and tells all the truth and requests her to believe him also amudha and vishwa convince susi and mythili whereby amudha says that she very well knows about vishwas affair with so many girls but she still lives with a hope of getting him back as a loyal husband some day mythili and susi understand ramakrishnan and thirus good nature and they unite in the end,2002 2002 2002 2002 2002 2002 2002 2002 2002 2002 charli chaplin tamil tamil tamil tamil tamil directorsakthichidambaram directorsakthichidambaram directorsakthichidambaram directorsakthichidambaram directorsakthichidambaram actorprabhu actorprabhudeva actorabhirami actorgayathriraguram ramakrishnan prabhu rich businessman ooti own advertis compani marri mythili abirami posse husband mythili alway suspect husband fear would end affair girl bring frequent quarrel coupl ramakrishnan kind hearter gentleman take care wife great lovethirunavukkarasu prabhu deva poor photograph town initi ramakrishnan minunderstand thiru rogu later understand good natur provid job compani thiru loyal ramakrishnan mythili respect ramakrishnan brother ramakrishnan also kind thiru one day thiru meet girl susi gayathri raghuram fall love susi social activist voic woman empowermentvishwa livingston close friend ramakrishnan marri amudha vindhya vishwa play boy affair mani girl one day small quarrel erupt ramakrishnan mythili follow ramakrishnan worri think wife continu suspect behaviour vishwa plan relax ramakrishnan engag call girl thilothama monalramakrishnan although interest final decid spend time thiliothama mythili away tirupathi thilothama come ramakrishnan guest hous thiru live suddenli mythili cancel trip return home way find ramakrishnan car thiru home also come thiru home mythili get shock see thilothama ramakrishnan thiru home ramakrishnan suddenli manag situat lie thilothama none thiru lover mythili believ thiru reveal truth know would separ ramakrishnan mythilithen cat mous game thiru tri act thilothama love front mythili time tri hard get caught susi short temper hate lie final mythili susi get know lie told thiru ramakrishnan ramakrishnan thiru tri hard find thilothama make tell truth noth happen surpris thilothama pas away two guy proof nowsusi decid break thiru mythili appli divorc ramakrishnan final court ramakrishnan express much love mythili tell truth request believ also amudha vishwa convinc susi mythili wherebi amudha say well know vishwa affair mani girl still live hope get back loyal husband day mythili susi understand ramakrishnan thiru good natur unit end
20137,1972 1972 1972 1972 1972 1972 1972 1972 1972 1972 our miss fred british british british british british directorbobkellett directorbobkellett directorbobkellett directorbobkellett directorbobkellett actordannylarue comedy comedy comedy comedy comedy comedy comedy comedy comedy comedy shakespearean actor fred wimbush is called up during world war ii and is performing in drag entertaining the troops in france when the nazis advance unless he continues his disguise in womens clothes fred fears he will be shot as a spy the double entendres and bullets fly as he attempts his escape in the company of the pupils from an english girls finishing school45,1972 1972 1972 1972 1972 1972 1972 1972 1972 1972 miss fred british british british british british directorbobkellett directorbobkellett directorbobkellett directorbobkellett directorbobkellett actordannylaru comedi comedi comedi comedi comedi comedi comedi comedi comedi comedi shakespearean actor fred wimbush call world war perform drag entertain troop franc nazi advanc unless continu disguis woman cloth fred fear shot spi doubl entendr bullet fli attempt escap compani pupil english girl finish school45
31674,1966 1966 1966 1966 1966 1966 1966 1966 1966 1966 aastiparulu telugu telugu telugu telugu telugu directorvmadhusudanrao directorvmadhusudanrao directorvmadhusudanrao directorvmadhusudanrao directorvmadhusudanrao actorkongarajaggaiah actorakkineninageswararao actorjayalalitha actorgummadi actorgvaralakshmi drama drama drama drama drama drama drama drama drama drama zamindar jannardhan rao gummadi is a rich and wealthy man he has two sons the elder son is krishna akkineni nageswara rao and is good virtuous and devoted to his family and expected to marry radha jayalalitha and younger one is bhaskar baachi jaggayya is a vagabond wayward person having all bad habits while disciplining baachi jannardhan rao has a heart attack and passes away leaving the administration of the estate to krishna this does not auger well with baachi and they attempt to force krishna to sign the estate over to them when they fail they conspire to kill him and take over the estate krishna overhears this and goes along with baachis plan to kill him he then returns as seenu his lookalike in order to set things right things seem to be going well until krishna finds himself in a tight corner when he is accused of killing himself rest of the story is how krishna comes out of the tight loop,1966 1966 1966 1966 1966 1966 1966 1966 1966 1966 aastiparulu telugu telugu telugu telugu telugu directorvmadhusudanrao directorvmadhusudanrao directorvmadhusudanrao directorvmadhusudanrao directorvmadhusudanrao actorkongarajaggaiah actorakkineninageswararao actorjayalalitha actorgummadi actorgvaralakshmi drama drama drama drama drama drama drama drama drama drama zamindar jannardhan rao gummadi rich wealthi man two son elder son krishna akkineni nageswara rao good virtuou devot famili expect marri radha jayalalitha younger one bhaskar baachi jaggayya vagabond wayward person bad habit disciplin baachi jannardhan rao heart attack pas away leav administr estat krishna auger well baachi attempt forc krishna sign estat fail conspir kill take estat krishna overhear goe along baachi plan kill return seenu lookalik order set thing right thing seem go well krishna find tight corner accus kill rest stori krishna come tight loop
30109,1995 1995 1995 1995 1995 1995 1995 1995 1995 1995 puthiya aatchi tamil tamil tamil tamil tamil directorveluprabhakaran directorveluprabhakaran directorveluprabhakaran directorveluprabhakaran directorveluprabhakaran actoradaraj actorraadhika actorradharavi actorsarathbabu marappan anandaraj is the rebel leader of puratchi padai the rebel group only kills corrupted politicians who spoil the poors lives whereas a corrupted politician valluvadasan radha ravi misuses their name and he perpetrates murders of innocent people under their namevivekanandan sarath babu an ips officer lives happily with his wife raadhika and his son vivekanandan is charged to arrest the members of puratchi padai,1995 1995 1995 1995 1995 1995 1995 1995 1995 1995 puthiya aatchi tamil tamil tamil tamil tamil directorveluprabhakaran directorveluprabhakaran directorveluprabhakaran directorveluprabhakaran directorveluprabhakaran actoradaraj actorraadhika actorradharavi actorsarathbabu marappan anandaraj rebel leader puratchi padai rebel group kill corrupt politician spoil poor live wherea corrupt politician valluvadasan radha ravi misus name perpetr murder innoc peopl namevivekanandan sarath babu ip offic live happili wife raadhika son vivekanandan charg arrest member puratchi padai
5688,1952 1952 1952 1952 1952 1952 1952 1952 1952 1952 my pal gus american american american american american directorrobertparrish directorrobertparrish directorrobertparrish directorrobertparrish directorrobertparrish actorrichardwidmark actorjoannedru comedy comedy comedy comedy comedy comedy comedy comedy comedy comedy dave jennings is so focused on his los angelesbased business that he neglects his precocious fiveyearold son gus who is constantly creating havoc in order to get his fathers attention after guss latest escapade is cleaned up and paid for dave orders his longsuffering secretary ivy tolliver to find a new nurse for gus then leaves on a business trip upon his return dave learns that ivy has placed gus in the playtime school and that he must meet with the teacher lydia marble to enroll gus formally rushed as usual dave tells the attractive lydia that he will pay whatever it takes to keep gus in line but when lydia explains that parents are required to participate in their childs education at playtime dave indignantly states that he knows all he needs to about gus dave is amazed by how well gus responds to lydias instructions however after he smacks a schoolmate believing that gus can benefit from lydias tutelage dave agrees to keep him at playtime as the next three weeks pass gus becomes contented and wellbehaved but on daves scheduled parent participation day the businessman instead sends a truckload of toys to the school lydia returns the toys with a note admonishing dave that as a substitute for his attention the toys are not enough and when dave comes to the school to protest lydia assumes that he is there to helpdave tells lydia that he has fallen in love with her and although lydia returns daves affections she tells him that his feelings stem from his dependence upon her for help with gus that night dave comforts a frightened gus by allowing him to sleep in his bed and realizing that he no longer needs lydia for instruction on child care confronts her with his new knowledge secure that dave does indeed love her for herself lydia enjoys his embrace as time passes dave becomes a devoted father and his romance with lydia blossoms into an engagement on guss birthday however joyce daves exwife appears and asks dave to visit her at her hotel fearing the worst dave keeps the appointment and discovers that the moneygrubbing immoral joyce is broke and claims that their mexican divorce is not legal daves lawyer farley norris confirms the upsetting news but dave infuriated by joyces reappearance refuses to give her money to obtain a legal divorcedetermined to win no matter what is revealed about joyce in court dave does not listen to the pleas of his friends that he think of gus and end the confrontation quietly dave instead hires private detectives to gather ammunition against joyce until the day before the trial begins needing a rest dave drives to his new beach house and spends the night unknown to dave lydia and gus have also spent the night there and in court the next day joyces lawyer charges dave with adultery and names lydia as the corespondent the resulting publicity horrifies lydia and she is forced to close her school lydia confronts dave accusing him of caring more about his fortune than about his son and breaks their engagement as the trial continues farley proves that joyce abandoned dave and the judge upholds daves request for a divorce although he does not award joyce any of daves property the judge sickened by daves tactics grants joyce custody of gus dave is heartbroken and on the morning that he drives gus to joyces hotel is overcome when gus pleads to remain with him realizing that gus is more important to him than anything else dave marches to joyces room and agrees to give her everything he owns in exchange for permanent custody of gus as he returns to the car dave is met by lydia who promises to help him fight for his son assuring her that the matter is settled dave embraces lydia and gus then asks lydia if she can pay for lunch,1952 1952 1952 1952 1952 1952 1952 1952 1952 1952 pal gu american american american american american directorrobertparrish directorrobertparrish directorrobertparrish directorrobertparrish directorrobertparrish actorrichardwidmark actorjoannedru comedi comedi comedi comedi comedi comedi comedi comedi comedi comedi dave jen focus lo angelesbas busi neglect precoci fiveyearold son gu constantli creat havoc order get father attent gu latest escapad clean paid dave order longsuff secretari ivi tolliv find new nurs gu leav busi trip upon return dave learn ivi place gu playtim school must meet teacher lydia marbl enrol gu formal rush usual dave tell attract lydia pay whatev take keep gu line lydia explain parent requir particip child educ playtim dave indignantli state know need gu dave amaz well gu respond lydia instruct howev smack schoolmat believ gu benefit lydia tutelag dave agre keep playtim next three week pas gu becom content wellbehav dave schedul parent particip day businessman instead send truckload toy school lydia return toy note admonish dave substitut attent toy enough dave come school protest lydia assum helpdav tell lydia fallen love although lydia return dave affect tell feel stem depend upon help gu night dave comfort frighten gu allow sleep bed realiz longer need lydia instruct child care confront new knowledg secur dave inde love lydia enjoy embrac time pas dave becom devot father romanc lydia blossom engag gu birthday howev joyc dave exwif appear ask dave visit hotel fear worst dave keep appoint discov moneygrub immor joyc broke claim mexican divorc legal dave lawyer farley norri confirm upset news dave infuri joyc reappear refus give money obtain legal divorcedetermin win matter reveal joyc court dave listen plea friend think gu end confront quietli dave instead hire privat detect gather ammunit joyc day trial begin need rest dave drive new beach hous spend night unknown dave lydia gu also spent night court next day joyc lawyer charg dave adulteri name lydia corespond result public horrifi lydia forc close school lydia confront dave accus care fortun son break engag trial continu farley prove joyc abandon dave judg uphold dave request divorc although award joyc dave properti judg sicken dave tactic grant joyc custodi gu dave heartbroken morn drive gu joyc hotel overcom gu plead remain realiz gu import anyth el dave march joyc room agre give everyth own exchang perman custodi gu return car dave met lydia promis help fight son assur matter settl dave embrac lydia gu ask lydia pay lunch


### TF-IDF

In [None]:
vectorizer = TfidfVectorizer()
X = vectorizer.fit_transform(df["doc_clean"])
column_names = vectorizer.get_feature_names_out()

df_tf_idf = pd.DataFrame(X.toarray(), columns=column_names)
df_tf_idf.shape

### Cosine Similarity

In [None]:
df_cos_sim = pd.DataFrame(cosine_similarity(df_tf_idf, dense_output=True))
df_cos_sim.shape

In [None]:
# saving cosine similarity matrix

df_cos_sim.to_parquet("../data/movie_cos_sim.parquet")

### Converting Cosine Similarity Dataframe to Top-K Items

In [None]:
K = 10

df_top_k = pd.DataFrame()
movie_indices = df_cos_sim.columns

for col in tqdm(movie_indices):
    df_test = df_cos_sim[[col]].sort_values(by=[col], ascending=False).head(K+1).copy()

    record = []
    for index, row in df_test.iterrows():
        if index != col:
            item = [int(index), float(row[col])]
            record.append(item)
        if len(record) == K:
            break

    df_top_k[col] = record

df_top_k.shape

In [None]:
# Transpose
df_top_k = df_top_k.T

df_top_k.sample(10)

In [None]:
# saving similarity top-k dataframe

df_top_k.to_parquet("../data/movie_top_k_t.parquet")

### Testing

In [None]:
pd.set_option('display.max_colwidth', 50)

In [None]:
query = 'titanic'

df[df["Title"].str.contains("titanic")]

In [None]:
movie_index = 13153 # Titanic Movie

df_query = df_cos_sim[[movie_index]].sort_values(by=[movie_index]).tail(5)
df_query.shape

In [None]:
df[df.index == 6275]

In [None]:
df[df.index == 16392]