In [1]:
import pandas as pd
from sklearn.feature_extraction.text import TfidfVectorizer
from sklearn.metrics.pairwise import cosine_similarity
# Sample doctor dataset: each record pairs a doctor's name with a short
# free-text description that is later used as the text feature.
_doctor_records = [
    ("Dr. Praveen Kumar C",
     "Specialist in liver and digestive disorders at Apollo Hospitals, Madurai"),
    ("Dr. Madhusudhanan J",
     "Expert in chronic gastrointestinal conditions at Apollo Speciality Hospitals, Madurai"),
    ("Dr. A.G. Alwar Ramanujam",
     "Surgical gastroenterologist specializing in pediatric and adult care"),
    ("Dr. Rajesh Prabhu",
     "Oncologist with expertise in gastrointestinal cancers"),
    ("Dr. A.C. Arun",
     "Digestive system disorders specialist at Pandian Advanced Medical Centre, Madurai"),
    ("Dr. M Annamalai Swamy",
     "Experienced general physician in Madurai"),
    ("Dr. Sanjay Nagral",
     "Gastrointestinal surgery and hepatology specialist"),
    ("Dr. S Ravi",
     "Expert in endoscopic retrograde cholangiopancreatography (ERCP)"),
    ("Dr. Krishna Mohan",
     "Renowned gastroenterologist at Meenakshi Mission Hospital"),
    ("Dr. Arulprakash",
     "Specialist in hepatology and liver-related disorders"),
]

# Column-oriented view of the records: two parallel lists in record order.
doctors_data = {
    "names": [name for name, _ in _doctor_records],
    "descriptions": [description for _, description in _doctor_records],
}

In [2]:
# Tabulate the raw dictionary: one row per doctor, with a "names" column
# and a "descriptions" column, then show the table as plain text.
doctors_df = pd.DataFrame(data=doctors_data)
print(doctors_df)

                      names                                       descriptions
0       Dr. Praveen Kumar C  Specialist in liver and digestive disorders at...
1       Dr. Madhusudhanan J  Expert in chronic gastrointestinal conditions ...
2  Dr. A.G. Alwar Ramanujam  Surgical gastroenterologist specializing in pe...
3         Dr. Rajesh Prabhu  Oncologist with expertise in gastrointestinal ...
4             Dr. A.C. Arun  Digestive system disorders specialist at Pandi...
5     Dr. M Annamalai Swamy           Experienced general physician in Madurai
6         Dr. Sanjay Nagral  Gastrointestinal surgery and hepatology specia...
7                Dr. S Ravi  Expert in endoscopic retrograde cholangiopancr...
8         Dr. Krishna Mohan  Renowned gastroenterologist at Meenakshi Missi...
9           Dr. Arulprakash  Specialist in hepatology and liver-related dis...


In [3]:
def get_content_based_recommendations(doctor_name, doctors_df, n_recommendations=3):
    """Recommend the doctors whose descriptions are most similar to one doctor's.

    Descriptions are vectorised with TF-IDF (English stop words removed) and
    every doctor is scored against the requested doctor by cosine similarity.

    Parameters
    ----------
    doctor_name : str
        Value from ``doctors_df['names']`` identifying the doctor to match.
    doctors_df : pandas.DataFrame
        Frame with a ``'names'`` column and a ``'descriptions'`` text column.
    n_recommendations : int, default 3
        Number of entries to keep from the top of the ranking
        (passed to ``Series.head``).

    Returns
    -------
    pandas.Series
        Similarity scores indexed by doctor name (index name ``'names'``),
        sorted in descending order, with every entry named ``doctor_name``
        removed. The Series itself is named ``doctor_name``.

    Raises
    ------
    KeyError
        If ``doctor_name`` does not occur in ``doctors_df['names']``.
    """
    names = doctors_df['names']

    # Validate before fitting anything so an unknown name fails fast with a
    # readable message (still a KeyError, as the column lookup used to raise).
    match_positions = (names == doctor_name).to_numpy().nonzero()[0]
    if len(match_positions) == 0:
        raise KeyError(f"Doctor {doctor_name!r} not found in doctors_df['names']")
    # If the name is duplicated, the first occurrence is used as the query.
    query_pos = int(match_positions[0])

    # Turn each description into a TF-IDF weighted term vector.
    tfidf = TfidfVectorizer(stop_words='english')
    tfidf_matrix = tfidf.fit_transform(doctors_df['descriptions'])

    # Only the similarities to the query doctor are needed, so score all rows
    # against that single row instead of building the full N x N matrix.
    # The slice (rather than a scalar index) keeps the query two-dimensional.
    query_vector = tfidf_matrix[query_pos:query_pos + 1]
    query_scores = cosine_similarity(tfidf_matrix, query_vector).ravel()

    sim_scores = pd.Series(query_scores, index=names, name=doctor_name)
    sim_scores = sim_scores.sort_values(ascending=False)

    # Drop the query doctor, who would otherwise rank first with a score of 1.
    similar_doctors = sim_scores[sim_scores.index != doctor_name].head(n_recommendations)
    return similar_doctors

In [4]:
# Doctor to use as the query for the similarity ranking.
doctor_to_recommend = 'Dr. Praveen Kumar C'

# Rank the remaining doctors by description similarity (default top-N).
recommendations = get_content_based_recommendations(
    doctor_name=doctor_to_recommend,
    doctors_df=doctors_df,
)

print(f"Recommendations for '{doctor_to_recommend}':")
print(recommendations)

Recommendations for 'Dr. Praveen Kumar C':
names
Dr. Arulprakash        0.444737
Dr. A.C. Arun          0.417243
Dr. Madhusudhanan J    0.365057
Name: Dr. Praveen Kumar C, dtype: float64
