In [10]:
import pandas as pd
from sklearn.feature_extraction.text import TfidfVectorizer
from sklearn.metrics.pairwise import cosine_similarity
# Sample academy dataset.
# Each record keeps an academy's name next to its description so the two
# column lists derived below cannot drift out of alignment.
_academy_records = [
    (
        "V-Stars Academy",
        "Provides training in computer courses, typewriting, tailoring, and spoken languages with government-approved certifications.",
    ),
    (
        "Dexter Academy",
        "Offers coaching for banking exams, TNPSC, SSC, and railway recruitment with expert faculty.",
    ),
    (
        "SEN IAS Academy",
        "Specializes in IAS coaching for UPSC Civil Services, along with CAT, MAT, and IBPS PO exam preparation.",
    ),
    (
        "Kalvi Higher Education & Research Institute",
        "A higher education and research institute offering IELTS, GRE, and certification courses in various domains.",
    ),
    (
        "BroadMind Consultant",
        "A study-abroad consultant providing training for IELTS, PTE, TOEFL, GMAT, and other international entrance exams.",
    ),
    (
        "Arena Animation",
        "One of the best institutes for animation and multimedia courses, including VFX, gaming, and 3D animation.",
    ),
    (
        "Elysium Academy",
        "A premier institute offering software, networking, and IT certification training in Madurai.",
    ),
    (
        "Sri Sai Coaching Centre",
        "Renowned for NEET and medical entrance exam coaching with a high success rate.",
    ),
    (
        "Kingmakers IAS Academy",
        "A well-known IAS coaching institute that prepares students for UPSC Prelims, Mains, and Interview stages.",
    ),
    (
        "Mazenet Solution",
        "Provides software training, IT certification programs, and corporate training solutions.",
    ),
]

# Column-oriented view of the records: one list per future DataFrame column.
academy_data = {
    "names": [name for name, _ in _academy_records],
    "descriptions": [description for _, description in _academy_records],
}

In [11]:
# Turn the column-oriented dict into a table: each key becomes a column,
# each list position becomes a row.
academy_df = pd.DataFrame.from_dict(academy_data, orient="columns")
print(academy_df)

                                         names  \
0                              V-Stars Academy   
1                               Dexter Academy   
2                              SEN IAS Academy   
3  Kalvi Higher Education & Research Institute   
4                         BroadMind Consultant   
5                              Arena Animation   
6                              Elysium Academy   
7                      Sri Sai Coaching Centre   
8                       Kingmakers IAS Academy   
9                             Mazenet Solution   

                                        descriptions  
0  Provides training in computer courses, typewri...  
1  Offers coaching for banking exams, TNPSC, SSC,...  
2  Specializes in IAS coaching for UPSC Civil Ser...  
3  A higher education and research institute offe...  
4  A study-abroad consultant providing training f...  
5  One of the best institutes for animation and m...  
6  A premier institute offering software, network...  
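7  Renowned for NEET and medical entrance exam co...  
8  A well-known IAS coaching institute that prepa...  
9  Provides software training, IT certification p...  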

In [12]:
def get_content_based_recommendations(academy_name, academy_df, n_recommendations=3):
    """Rank the academies whose descriptions are most similar to a given academy.

    Descriptions are vectorised with TF-IDF (English stop words removed) and
    the query academy's vector is compared with every description using
    cosine similarity.

    Parameters
    ----------
    academy_name : str
        Name of the query academy. It must equal a value in
        ``academy_df['names']`` exactly.
    academy_df : pandas.DataFrame
        Frame with a ``names`` column and a ``descriptions`` column.
    n_recommendations : int, default 3
        Maximum number of academies to return.

    Returns
    -------
    pandas.Series
        Similarity scores in descending order, indexed by academy name
        (index name ``names``) and named after ``academy_name``. Entries
        carrying the query name itself are excluded.

    Raises
    ------
    KeyError
        If ``academy_name`` does not occur in ``academy_df['names']``.
    """
    names = academy_df['names']

    # Resolve the query row by position before doing any expensive work, so an
    # unknown name fails fast with a readable message. Positional lookup also
    # keeps the function working when several rows share the same name (the
    # first match is used as the query).
    is_query = (names == academy_name).to_numpy()
    if not is_query.any():
        raise KeyError(f"Academy {academy_name!r} not found in academy_df['names']")
    query_pos = int(is_query.argmax())

    tfidf = TfidfVectorizer(stop_words='english')
    tfidf_matrix = tfidf.fit_transform(academy_df['descriptions'])

    # Only the query row is needed, so compute a single 1 x n similarity row
    # instead of the full n x n matrix. The slice keeps the operand 2-D.
    query_scores = cosine_similarity(
        tfidf_matrix[query_pos:query_pos + 1], tfidf_matrix
    )[0]

    sim_scores = pd.Series(
        query_scores,
        index=pd.Index(names, name='names'),
        name=academy_name,
    ).sort_values(ascending=False)

    # Drop the query academy itself (similarity 1.0 with its own description).
    similar_academy = sim_scores[sim_scores.index != academy_name].head(n_recommendations)
    return similar_academy

In [13]:
# Query academy; the function looks this name up in academy_df['names'],
# so the spelling has to match an entry there exactly.
academy_to_recommend = 'Elysium Academy'
recommendations = get_content_based_recommendations(
    academy_name=academy_to_recommend,
    academy_df=academy_df,
)
# One print call: header line first, then the ranked similarity scores.
print(f"Recommendations for '{academy_to_recommend}':", recommendations, sep="\n")

Recommendations for 'Elysium Academy':
names
Mazenet Solution                               0.338259
Kalvi Higher Education & Research Institute    0.247681
Kingmakers IAS Academy                         0.073582
Name: Elysium Academy, dtype: float64
