<a href="https://colab.research.google.com/github/Prithiksha-V/hackton/blob/main/hackton.ipynb" target="_parent"><img src="https://colab.research.google.com/assets/colab-badge.svg" alt="Open In Colab"/></a>

In [1]:
import pandas as pd
from sklearn.feature_extraction.text import TfidfVectorizer
from sklearn.metrics.pairwise import cosine_similarity

# Load the dataset (ensure movies.csv exists in the working directory).
# Only the title and genre columns are needed. .copy() makes the selection an
# independent frame, so the column assignment below does not raise pandas'
# SettingWithCopyWarning.
movies = pd.read_csv('movies.csv')
movies = movies[['title', 'genre']].copy()

# Preprocess genres:
#   * missing genres become empty strings, because TfidfVectorizer refuses
#     NaN documents;
#   * "|" separators become spaces. regex=False makes the replacement a
#     literal one regardless of the installed pandas version's default
#     ("|" is the alternation operator when interpreted as a regex).
movies['genre'] = movies['genre'].fillna('').str.replace('|', ' ', regex=False)

# Convert genres into numerical features using TF-IDF.
# NOTE(review): the default tokenizer splits hyphenated genres such as
# "Sci-Fi" into separate tokens — confirm this is acceptable for the data.
vectorizer = TfidfVectorizer(stop_words='english')
genre_matrix = vectorizer.fit_transform(movies['genre'])

# Pairwise cosine similarity between every pair of movies; row i / column j
# correspond to the i-th and j-th rows of `movies` (by position).
similarity_matrix = cosine_similarity(genre_matrix)

# Function to recommend movies
def recommend_movie(movie_title, movies, similarity_matrix, top_n=5):
    """Return the titles most similar to ``movie_title``.

    Args:
        movie_title: Exact title to look up in ``movies['title']``.
        movies: DataFrame with a ``'title'`` column whose row order matches
            the rows/columns of ``similarity_matrix``.
        similarity_matrix: Square matrix where entry ``[i][j]`` is the
            similarity between the i-th and j-th rows of ``movies``.
        top_n: Maximum number of recommendations to return (default 5).

    Returns:
        A list of up to ``top_n`` titles ordered from most to least similar,
        or the string ``"Movie not found in dataset."`` when the title is
        absent. If the title occurs more than once, the first occurrence is
        used as the query.
    """
    # Work with row *positions*, not index labels: the similarity matrix and
    # .iloc are positional, so labels would be wrong for a non-default index.
    matches = (movies['title'] == movie_title).to_numpy().nonzero()[0]
    if matches.size == 0:
        return "Movie not found in dataset."
    idx = int(matches[0])

    # Drop the query movie explicitly instead of assuming it sorts first:
    # other movies can tie with it at similarity 1.0, and a stable sort
    # would then place an earlier-positioned tie ahead of the query itself.
    candidates = [
        (position, score)
        for position, score in enumerate(similarity_matrix[idx])
        if position != idx
    ]
    candidates.sort(key=lambda pair: pair[1], reverse=True)

    titles = movies['title']
    return [titles.iloc[position] for position, _ in candidates[:max(top_n, 0)]]

# Demo: query one title and print whatever recommend_movie returns
# (a list of titles, or its "not found" message).
movie_to_search = "Inception"
recommended_movies = recommend_movie(
    movie_title=movie_to_search,
    movies=movies,
    similarity_matrix=similarity_matrix,
)
print(f"Movies similar to '{movie_to_search}': {recommended_movies}")

Movies similar to 'Inception': ['Interstellar', 'Avatar', 'Guardians of the Galaxy', 'Blade Runner', 'Star Wars: A New Hope']
