In [1]:
import pandas as pd
from sklearn.feature_extraction.text import TfidfVectorizer
from sklearn.metrics.pairwise import cosine_similarity
# Sample theatre dataset, written as one (name, description) record per
# theatre so each description sits next to the theatre it describes.
_theatre_records = [
    (
        "Vetri Cinemas",
        "A popular theatre known for its high-quality visuals and sound, providing a great movie experience.",
    ),
    (
        "INOX Vishaal De Mall",
        "A premium multiplex with modern seating, excellent sound, and a comfortable ambience.",
    ),
    (
        "Jazz Cinemas",
        "A well-maintained cinema offering a high-definition movie experience with superior sound quality.",
    ),
    (
        "Ambiga Cinemas",
        "A well-established theatre, popular among locals for its affordability and good movie screening.",
    ),
    (
        "CinePriya Cinemas",
        "A budget-friendly theatre with good seating arrangements and decent sound quality.",
    ),
    (
        "Mani Impala Theatre",
        "One of the oldest and most renowned theatres in Madurai, known for its large screen and traditional charm.",
    ),
    (
        "Balaganesh Theatre",
        "A comfortable cinema hall with good projection and sound systems, attracting a loyal audience.",
    ),
    (
        "Tamil Jaya Cinemas",
        "A well-known theatre screening mostly Tamil movies, providing an enjoyable experience for regional cinema lovers.",
    ),
    (
        "Simmakkal New Theatre",
        "A popular choice for watching both mainstream and regional movies with a decent sound system.",
    ),
    (
        "Meenakshi Cinemas",
        "A simple yet comfortable theatre offering an affordable and good movie-watching experience.",
    ),
]

# Column-oriented view of the records: two parallel lists keyed by column name.
theatre_data = {
    "names": [name for name, _ in _theatre_records],
    "descriptions": [description for _, description in _theatre_records],
}

In [2]:
# Turn the column-oriented dict into a two-column table
# ('names', 'descriptions') and echo it as plain text.
theatre_df = pd.DataFrame.from_dict(theatre_data)
print(theatre_df)

                   names                                       descriptions
0          Vetri Cinemas  A popular theatre known for its high-quality v...
1   INOX Vishaal De Mall  A premium multiplex with modern seating, excel...
2           Jazz Cinemas  A well-maintained cinema offering a high-defin...
3         Ambiga Cinemas  A well-established theatre, popular among loca...
4      CinePriya Cinemas  A budget-friendly theatre with good seating ar...
5    Mani Impala Theatre  One of the oldest and most renowned theatres i...
6     Balaganesh Theatre  A comfortable cinema hall with good projection...
7     Tamil Jaya Cinemas  A well-known theatre screening mostly Tamil mo...
8  Simmakkal New Theatre  A popular choice for watching both mainstream ...
9      Meenakshi Cinemas  A simple yet comfortable theatre offering an a...


In [4]:
def get_content_based_recommendations(theatre_name, theatre_df, n_recommendations=3):
    """Recommend the theatres whose descriptions best match one theatre's.

    Every description is converted to a TF-IDF vector (English stop words
    removed) and the other theatres are ranked by cosine similarity to the
    description of ``theatre_name``.

    Parameters
    ----------
    theatre_name : str
        Theatre to find neighbours for; must appear in ``theatre_df['names']``.
        If the name occurs more than once, the first occurrence's description
        is used as the query.
    theatre_df : pandas.DataFrame
        Frame with a ``'names'`` column and a ``'descriptions'`` column.
    n_recommendations : int, default 3
        Maximum number of theatres to return.

    Returns
    -------
    pandas.Series
        Similarity scores in descending order, indexed by theatre name (index
        named after the ``'names'`` column, series named ``theatre_name``).
        Rows whose name equals ``theatre_name`` are never returned.

    Raises
    ------
    ValueError
        If ``n_recommendations`` is negative.
    KeyError
        If ``theatre_name`` is not present in ``theatre_df['names']``.
    """
    # A negative count would make ``head`` silently return "all but the last
    # n" rows, which is never what a caller asking for recommendations wants.
    if n_recommendations < 0:
        raise ValueError(
            f"n_recommendations must be non-negative, got {n_recommendations!r}"
        )

    names = theatre_df['names']
    is_target = (names == theatre_name).to_numpy()
    # Fail fast, before any vectorisation work, with a message that says
    # which lookup failed.
    if not is_target.any():
        raise KeyError(f"Theatre {theatre_name!r} not found in theatre_df['names']")
    # argmax on a boolean mask gives the position of the first match, so the
    # lookup stays well defined even when names are duplicated.
    target_pos = int(is_target.argmax())

    tfidf = TfidfVectorizer(stop_words='english')
    tfidf_matrix = tfidf.fit_transform(theatre_df['descriptions'])

    # Only the target's row of the similarity matrix is needed; slicing
    # (rather than integer indexing) keeps the query two-dimensional.
    target_scores = cosine_similarity(
        tfidf_matrix[target_pos:target_pos + 1], tfidf_matrix
    ).ravel()

    sim_scores = pd.Series(
        target_scores,
        index=pd.Index(names, name=names.name),
        name=theatre_name,
    )
    # A stable sort keeps tied theatres in dataset order, making the ranking
    # deterministic.
    ranked = sim_scores.sort_values(ascending=False, kind='stable')
    similar_theatre = ranked[ranked.index != theatre_name].head(n_recommendations)
    return similar_theatre

In [7]:
# Demo: rank the other theatres against one chosen theatre and print the
# header line followed by the resulting score series.
theatre_to_recommend = 'Tamil Jaya Cinemas'
recommendations = get_content_based_recommendations(
    theatre_name=theatre_to_recommend,
    theatre_df=theatre_df,
)
print(f"Recommendations for '{theatre_to_recommend}':", recommendations, sep="\n")

Recommendations for 'Tamil Jaya Cinemas':
names
Vetri Cinemas            0.287705
Simmakkal New Theatre    0.216338
Ambiga Cinemas           0.164267
Name: Tamil Jaya Cinemas, dtype: float64
