In [1]:

# Internship Domain Recommendation Engine using Content-Based Filtering

import pandas as pd
from sklearn.feature_extraction.text import TfidfVectorizer
from sklearn.metrics.pairwise import linear_kernel

# Step 1: Internship Domain Data
data = {
    'Domain': [
        'Web Development',
        'Data Science',
        'Cybersecurity',
        'Artificial Intelligence',
        'Cloud Computing',
        'Mobile App Development',
        'Digital Marketing'
    ],
    'Description': [
        'HTML CSS JavaScript Frontend Backend React Node',
        'Python Machine Learning Data Analysis Statistics Pandas',
        'Network Security Hacking Cryptography Risk Management',
        'AI Deep Learning Neural Networks NLP Python',
        'AWS Azure DevOps Cloud Architecture Serverless',
        'Android iOS Flutter Kotlin Swift Mobile Apps',
        'SEO SEM Social Media Analytics Campaigns Branding'
    ]
}

df = pd.DataFrame(data)

# Step 2: Vectorize descriptions
tfidf = TfidfVectorizer(stop_words='english')
tfidf_matrix = tfidf.fit_transform(df['Description'])

# Step 3: Simulated User Input
user_input = "I am interested in Python, Machine Learning, and Data Analysis"
user_vec = tfidf.transform([user_input])

# Step 4: Compute Similarity and Recommend
cosine_sim = linear_kernel(user_vec, tfidf_matrix).flatten()
top_indices = cosine_sim.argsort()[-3:][::-1]
recommendations = df.iloc[top_indices]

# Step 5: Print Recommendations
print("Top Internship Domain Recommendations:")
print(recommendations[['Domain', 'Description']])


Top Internship Domain Recommendations:
                    Domain                                        Description
1             Data Science  Python Machine Learning Data Analysis Statisti...
3  Artificial Intelligence        AI Deep Learning Neural Networks NLP Python
6        Digital Marketing  SEO SEM Social Media Analytics Campaigns Branding
