In [3]:
import pandas as pd
from bs4 import BeautifulSoup
import csv
import requests as req
from collections import Counter

# Keyword categorisation: Disease

In [2]:
# Keyword lists, one per disease category. Each keyword is lower-cased here so it can be
# compared directly against lower-cased assay text.
# A keyword may deliberately appear in more than one category (e.g. 'Stroke',
# 'Tuberculosis', 'Celiac', 'Hemophilia'), but must appear only once within a single
# list: every list entry that matches adds one to that category's score.
infection = [keyword.lower() for keyword in ['Infection', 'Cholera', 'Pathogen']]
virus = [keyword.lower() for keyword in ['Dengue', 'Measles', 'Rabies', 'viral', 'Influenza', 'Herpes']]
bacteria = [keyword.lower() for keyword in ['Tuberculosis', 'Syphilis', 'Leprosy', 'Antibiotics', 'Bacteria', 'Bacterial']]
parasite = [keyword.lower() for keyword in ['Malaria', 'Protozoa', 'Helminths', 'Ectoparasite', 'Endoparasite', 'Tapeworm', 'Giardiasis', 'Toxoplasmosis', 'parasite']]
fungal = [keyword.lower() for keyword in ['Fungal', 'Yeast', 'Mould', 'Antifungal']]
aging = [keyword.lower() for keyword in ['Aging', 'Oxidative']]
# 'Apoptosis' was previously misspelled 'Aptosis', which can never match real text.
cancer = [keyword.lower() for keyword in ['Stem', 'Oncogenes', 'Cancer', 'Tumor', 'Melanoma', 'Carcinoma', 'Chemotherapy', 'Sarcoma', 'malignant', 'gliomas', 'Apoptosis']]
diabetes = [keyword.lower() for keyword in ['Diabetes', 'Insulin', 'Diabetic']]
# Single definition of `obesity`. It used to be assigned twice, with the later assignment
# silently discarding the earlier keywords. 'Overweight' is restored from the discarded
# list; the bare keyword 'Weight' stays out (as it effectively was) because as a substring
# it would also match unrelated phrases such as "molecular weight".
obesity = [keyword.lower() for keyword in ['Obesity', 'Overweight', 'BMI', 'Adipose']]
cardiovascular = [keyword.lower() for keyword in ['Vascular', 'Angina', 'Coronary', 'Atherosclerosis', 'Cardiovascular', 'Heart', 'Stroke', 'Hypertension']]
genetic = [keyword.lower() for keyword in ['DNA', 'Genetic', 'Cystic Fibrosis', 'Genetics', 'Epigenetics', 'Mutation', 'Hereditary', 'Inherited', 'Sickle', 'Hemophilia', 'Dystrophy', 'MS', 'Marfan', 'Wilson', 'Thalassemia', 'Tay-Sachs', 'Duchenne', 'Hemochromatosis']]
# 'Guillain-Barré' was previously stored with a mis-encoded final character.
autoimmune = [keyword.lower() for keyword in ['T-cell', 'Psoriasis', 'HIV', 'AIDS', 'Immune', 'Autoimmune', 'Autoimmunity', 'Allergies', 'Inflammation', 'Immunodeficiency', 'Lupus', 'Rheumatoid', "Crohn's", 'Celiac', "Hashimoto's", 'Thyroiditis', 'Guillain-Barré']]
# 'Epilepsy' used to be listed twice here, which double-counted a single match.
neurological = [keyword.lower() for keyword in ['Brain', 'Epilepsy', 'Neurodegeneration', 'Nervous', 'Neurological', "Alzheimer's", "Parkinson's", 'Schizophrenia', 'Autism', 'Sclerosis', 'Bipolar', "Huntington's", 'Dementia', 'Stroke', 'Migraine', 'Tourettes']]
gastrointestinal = [keyword.lower() for keyword in ['Gastrointestinal', 'Digestive', 'IBS', 'IBD', 'Gastroenteritis', 'Colitis', 'Appendicitis', 'Celiac', "Barrett's"]]
respiratory = [keyword.lower() for keyword in ['Bronchitis', 'COPD', 'Lung', 'Pulmonary', 'Respiratory', 'Asthma', 'Pneumonia', 'Tuberculosis', 'Emphysema', 'Pneumothorax']]
hormonal = [keyword.lower() for keyword in ['Endocrine', 'Hormone', 'Hormonal', 'Thyroid', 'Hyperthyroidism', 'Hypothyroidism', "Cushing's", "Addison's"]]
renal_kidney = [keyword.lower() for keyword in ['Urology', 'Nephrology', 'Renal', 'Polycystic', 'Kidney']]
musculoskeletal = [keyword.lower() for keyword in ['Bone', 'Osteoporosis', 'Osteoarthritis', 'Musculoskeletal', 'Arthritis', 'Fibromyalgia']]
eye = [keyword.lower() for keyword in ['Eye', 'Retinal', 'Optic', 'Ophthalmic', 'Glaucoma', 'Cataracts', 'Macular', 'Retinitis', 'Pigmentosa']]
blood = [keyword.lower() for keyword in ['Blood', 'Thrombosis', 'Lymphocytes', 'Hematology', 'Anemia', 'Leukemia', 'Hemophilia', 'Hemolytic']]
metabolic = [keyword.lower() for keyword in ['Metabolic', 'Metabolism']]
toxicity = [keyword.lower() for keyword in ['Toxicity', 'Toxic']]





In [3]:
# Ordered list of (label, keywords) pairs: element 0 is the category label and
# element 1 is that category's lower-cased keyword list.
# Label capitalisation is kept exactly as it was ('genetic' and 'autoimmune' are
# lower-case) because these strings are the values returned as results.
disease_categories = [
    ('Infection', infection),
    ('Virus', virus),
    ('Bacteria', bacteria),
    ('Parasite', parasite),
    ('Fungal', fungal),
    ('Aging', aging),
    ('Cancer', cancer),
    ('Diabetes', diabetes),
    ('Obesity', obesity),
    ('Cardiovascular', cardiovascular),
    ('genetic', genetic),
    ('autoimmune', autoimmune),
    ('Neurological', neurological),
    ('Gastrointestinal', gastrointestinal),
    ('Respiratory', respiratory),
    ('Hormonal', hormonal),
    ('Renal/Kidney', renal_kidney),
    ('Musculoskeletal', musculoskeletal),
    ('Ocular', eye),
    ('Blood', blood),
    ('Metabolic', metabolic),
    ('Toxicity', toxicity),
]

def disease_type(aid, timeout=30):
    """
    Label a PubChem BioAssay with the disease category whose keywords best match its record.

    The assay's PUG View XML record is downloaded, reduced to lower-cased plain text, and
    every keyword of every entry in `disease_categories` is looked up in that text. A
    category scores one point per keyword that is present at least once (repeated
    occurrences of the same keyword do not add more points).

    Matching is plain substring containment, so short keywords also match inside longer
    words (e.g. 'ms' inside 'forms', 'stem' inside 'system').

    aid: AID of a PubChem BioAssay, as a str or an int
    timeout: seconds to wait for the PubChem server before giving up (passed to requests)

    return: str name of the highest-scoring category (on a tie, the category listed first
            in `disease_categories`), or None if no keyword matched or the server
            answered with an HTTP error status

    raises: requests exceptions (e.g. connection errors, timeouts) propagate to the caller
    """
    # str() so that an int AID works as well as the str form existing callers pass
    string = 'https://pubchem.ncbi.nlm.nih.gov/rest/pug_view/data/assay/' + str(aid) + '/XML' #URL with addition of specific aid
    # Requesting for the website. Certificate verification is left at the requests
    # default (enabled); the timeout stops a stalled connection from hanging the caller.
    Web = req.get(string, timeout=timeout)
    if not Web.ok:
        # An HTTP error body is not an assay description; do not keyword-match it
        return None
    # Creating a BeautifulSoup object and specifying the parser
    S = BeautifulSoup(Web.text, features="xml")
    # Extract and lower-case the text once rather than once per keyword
    text = S.get_text().lower()

    keyword_counter = Counter()  # category name -> number of its keywords found in text

    for category_name, category_keywords in disease_categories:
        hits = sum(1 for keyword in category_keywords if keyword in text)
        if hits:  # only categories with at least one match are recorded
            keyword_counter[category_name] += hits

    if keyword_counter: #if there has been a match, find the category with highest count and return the name
        most_common_category = keyword_counter.most_common(1)[0][0]
        return most_common_category
    else:
        return None  # Return None if no match is found




In [4]:
# Label every assay listed in the benchmark CSV with a disease category.
# disease_type() performs one HTTP request per call, so this loop makes one network
# round-trip per row of df['aids'].
# NOTE(review): the saved output of this cell shows "<aid> most common category: <label>"
# lines, but neither this cell nor disease_type() as written prints anything; the
# output looks like it came from an earlier version of the code. Re-run to confirm.
df=pd.read_csv('final_groups.csv') #open csv file of benchmark data 
disease_type_list=[]  # collects one disease_type() result (str or None) per assay, in row order
for aid in df['aids']: 
    aid=int(aid) #transform each assay id to an integer (presumably guards against float-typed ids such as 795.0; confirm the column dtype)
    result=disease_type(str(aid)) #label disease type by function; the id is passed as a str because it is concatenated into the request URL
    disease_type_list.append(result) #add to result list 
    



795 most common category: Cancer




1196 most common category: Cancer




1197 most common category: Cancer




1198 most common category: Cancer




1200 most common category: Cancer




1069 most common category: Cancer




1076 most common category: Cancer




588501 most common category: Bacteria




588461 most common category: Bacteria




602142 most common category: Bacteria




602178 most common category: Bacteria




602326 most common category: Bacteria




602327 most common category: Bacteria




624244 most common category: Bacteria




651901 most common category: Bacteria




720672 most common category: Bacteria




588459 most common category: Bacteria




588497 most common category: Bacteria




602140 most common category: Bacteria




602177 most common category: Bacteria




602336 most common category: Bacteria




602338 most common category: Bacteria




624245 most common category: Bacteria




651880 most common category: Bacteria




720671 most common category: Bacteria




588460 most common category: Bacteria




588499 most common category: Bacteria




602139 most common category: Bacteria




602176 most common category: Bacteria




602325 most common category: Bacteria




602328 most common category: Bacteria




624243 most common category: Bacteria




651879 most common category: Bacteria




652102 most common category: Bacteria




720673 most common category: Bacteria




441 most common category: Cancer




440 most common category: Cancer




519 most common category: Cancer




520 most common category: Cancer




698 most common category: Cancer




699 most common category: Cancer




722 most common category: Cancer




724 most common category: Cancer




527 most common category: Infection




700 most common category: Bacteria




1014 most common category: Infection




1015 most common category: Infection




1506 most common category: Infection




1500 most common category: Infection




1507 most common category: Infection




528 most common category: genetic




529 most common category: genetic




2557 most common category: Cancer




2674 most common category: Cancer




2813 most common category: Cancer




449766 most common category: Cancer




488791 most common category: Cancer




588412 most common category: Cancer




588446 most common category: Cancer




588448 most common category: Cancer




1841 most common category: genetic




1884 most common category: genetic




2311 most common category: genetic




1440 most common category: genetic




1415 most common category: genetic




1840 most common category: genetic




1872 most common category: genetic




2295 most common category: genetic




2829 most common category: genetic




1423 most common category: genetic




1836 most common category: genetic




1869 most common category: genetic




2307 most common category: genetic




2827 most common category: genetic




1439 most common category: genetic




1837 most common category: genetic




1871 most common category: genetic




2296 most common category: genetic




2826 most common category: genetic




1441 most common category: genetic




1838 most common category: genetic




1888 most common category: genetic




2298 most common category: genetic




2828 most common category: genetic




751 most common category: Cancer




1062 most common category: Cancer




1207 most common category: Cancer




2132 most common category: Cancer




757 most common category: genetic




764 most common category: genetic




1339 most common category: genetic




1340 most common category: genetic




2027 most common category: genetic




2039 most common category: genetic




2040 most common category: genetic




2048 most common category: genetic




2051 most common category: genetic




2055 most common category: genetic




758 most common category: genetic




1336 most common category: genetic




1760 most common category: genetic




2031 most common category: genetic




2036 most common category: genetic




2041 most common category: genetic




588393 most common category: genetic




588394 most common category: genetic




588631 most common category: genetic




759 most common category: genetic




1335 most common category: genetic




1341 most common category: genetic




1759 most common category: genetic




1761 most common category: genetic




2038 most common category: genetic




2042 most common category: genetic




2043 most common category: genetic




2047 most common category: genetic




2050 most common category: genetic




2053 most common category: genetic




588381 most common category: genetic




588383 most common category: genetic




588387 most common category: genetic




588388 most common category: genetic




588628 most common category: genetic




588630 most common category: genetic




760 most common category: genetic




1337 most common category: genetic




1763 most common category: genetic




2033 most common category: genetic




2045 most common category: genetic




2046 most common category: genetic




761 most common category: genetic




1333 most common category: genetic




1334 most common category: genetic




2009 most common category: genetic




2019 most common category: genetic




2020 most common category: genetic




2021 most common category: genetic




2022 most common category: genetic




588624 most common category: genetic




2037 most common category: genetic




588373 most common category: genetic




588377 most common category: genetic




588384 most common category: genetic




588385 most common category: genetic




588626 most common category: genetic




950 most common category: genetic




1328 most common category: genetic




2075 most common category: genetic




951 most common category: genetic




1327 most common category: genetic




2077 most common category: genetic




952 most common category: genetic




1330 most common category: genetic




2081 most common category: genetic




1007 most common category: genetic




1322 most common category: genetic




2084 most common category: genetic




1008 most common category: genetic




1320 most common category: genetic




2080 most common category: genetic




1009 most common category: genetic




1329 most common category: genetic




2086 most common category: genetic




1210 most common category: Cancer




1218 most common category: Cancer




1221 most common category: Cancer




1211 most common category: Cancer




1223 most common category: Cancer




1226 most common category: Cancer




1212 most common category: Cancer




1213 most common category: Cancer




1219 most common category: Cancer




1224 most common category: Cancer




1325 most common category: Cancer




1453 most common category: Cancer




1480 most common category: Cancer




1690 most common category: Cancer




489003 most common category: Cancer




1326 most common category: Cancer




1451 most common category: Cancer




1483 most common category: Cancer




1689 most common category: Cancer




489002 most common category: Cancer




504566 most common category: Cancer




504569 most common category: Cancer




1529 most common category: genetic




1894 most common category: genetic




1896 most common category: genetic




2145 most common category: genetic




1530 most common category: genetic




1531 most common category: genetic




1892 most common category: genetic




1893 most common category: genetic




1895 most common category: genetic




1897 most common category: genetic




2150 most common category: genetic




2151 most common category: genetic




1862 most common category: Cancer




2025 most common category: Cancer




2270 most common category: Cancer




2623 most common category: Cancer




2740 most common category: Cancer




488808 most common category: Cancer




488814 most common category: Cancer




504336 most common category: Cancer




504470 most common category: Cancer




1867 most common category: Cancer




2016 most common category: Cancer




2272 most common category: Cancer




2622 most common category: Cancer




2742 most common category: Cancer




488801 most common category: Cancer




488812 most common category: Cancer




504321 most common category: Cancer




504468 most common category: Cancer




1873 most common category: Cancer




2023 most common category: Cancer




2271 most common category: Cancer




2621 most common category: Cancer




2745 most common category: Cancer




488795 most common category: Cancer




488823 most common category: Cancer




504338 most common category: Cancer




504469 most common category: Cancer




1870 most common category: Cancer




2029 most common category: Cancer




2274 most common category: Cancer




2624 most common category: Cancer




2744 most common category: Cancer




488825 most common category: Cancer




488827 most common category: Cancer




504340 most common category: Cancer




504461 most common category: Cancer




1887 most common category: Cancer




2066 most common category: Cancer




2273 most common category: Cancer




2643 most common category: Cancer




2743 most common category: Cancer




488790 most common category: Cancer




488792 most common category: Cancer




504334 most common category: Cancer




504458 most common category: Cancer




2052 most common category: autoimmune




2523 most common category: autoimmune




2810 most common category: autoimmune




504565 most common category: autoimmune




485284 most common category: autoimmune




2690 most common category: Aging




2706 most common category: Aging




434994 most common category: Aging




504927 most common category: Aging




504931 most common category: Aging




449753 most common category: Aging




588518 most common category: Fungal




588608 most common category: Fungal




623992 most common category: Fungal




588520 most common category: Fungal




588604 most common category: Fungal




623994 most common category: Fungal




588522 most common category: Fungal




588606 most common category: Fungal




623996 most common category: Fungal




555 most common category: genetic




539 most common category: genetic




549 most common category: genetic




557 most common category: genetic




1000 most common category: genetic




550 most common category: genetic




556 most common category: genetic




1028 most common category: genetic




818 most common category: Cancer




1004 most common category: Cancer




1045 most common category: Cancer




823 most common category: Cancer




824 most common category: Cancer




827 most common category: Cancer




999 most common category: Cancer




1047 most common category: Cancer




868 most common category: genetic




869 most common category: genetic




1307 most common category: genetic




1239 most common category: Neurological




1241 most common category: Neurological




453 most common category: Cancer




488 most common category: genetic




523 most common category: Cancer




820 most common category: Cancer




830 most common category: genetic




460 most common category: Parasite




825 most common category: Parasite




1627 most common category: Parasite




1633 most common category: Parasite




501 most common category: genetic




831 most common category: genetic




538 most common category: genetic




787 most common category: genetic




829 most common category: genetic




581 most common category: genetic




832 most common category: genetic




679 most common category: genetic




680 most common category: genetic




687 most common category: genetic




721 most common category: genetic




798 most common category: genetic




846 most common category: genetic




684 most common category: genetic




701 most common category: genetic




716 most common category: genetic




728 most common category: genetic




800 most common category: genetic




852 most common category: genetic




686 most common category: Cancer




691 most common category: Cancer




688 most common category: genetic




792 most common category: genetic




873 most common category: Cancer




1431 most common category: Cancer




1046 most common category: genetic




1215 most common category: genetic




1230 most common category: Cancer




1394 most common category: Cancer




1442 most common category: Cancer




1444 most common category: Cancer




1385 most common category: Cancer




1435 most common category: Cancer




1436 most common category: Cancer




1437 most common category: Cancer




422 most common category: Cancer




711 most common category: Cancer




436 most common category: genetic




714 most common category: genetic




1068 most common category: Cancer




1134 most common category: Cancer




629 most common category: Cancer




639 most common category: Cancer




713 most common category: Cancer




737 most common category: Cancer




1078 most common category: Cancer




1079 most common category: Cancer




630 most common category: Cancer




715 most common category: Cancer




1058 most common category: Cancer




633 most common category: Cancer




733 most common category: Cancer




1060 most common category: Cancer




782 most common category: genetic




855 most common category: genetic




940 most common category: genetic




1421 most common category: genetic




1422 most common category: genetic




1021 most common category: genetic




1418 most common category: genetic




1022 most common category: genetic




1417 most common category: genetic




1085 most common category: Cancer




1419 most common category: Cancer




1236 most common category: Neurological




1420 most common category: Neurological




1274 most common category: genetic




1275 most common category: Cardiovascular




2732 most common category: genetic




504322 most common category: genetic




504437 most common category: genetic




438 most common category: autoimmune




462 most common category: autoimmune




1023 most common category: autoimmune




707 most common category: Cardiovascular




717 most common category: Cardiovascular




1026 most common category: Cardiovascular




1246 most common category: Cancer




1288 most common category: Cancer




487 most common category: Cancer




517 most common category: Cancer




808 most common category: Cancer




1249 most common category: Cancer




802 most common category: Cancer




1013 most common category: Cancer




449739 most common category: Neurological




504619 most common category: Neurological




489005 most common category: Neurological




493021 most common category: Neurological




493022 most common category: Neurological




493023 most common category: Neurological




493041 most common category: Neurological




1916 most common category: genetic




2753 most common category: genetic




435017 most common category: genetic




1918 most common category: genetic




626 most common category: Neurological




628 most common category: genetic




859 most common category: genetic




743391 most common category: Virus




743400 most common category: Virus




743409 most common category: Virus




602143 most common category: Virus




602147 most common category: Virus




602149 most common category: Virus




624000 most common category: Virus




624004 most common category: Virus




624009 most common category: Virus




602144 most common category: Virus




602150 most common category: Virus




602151 most common category: Virus




624001 most common category: Virus




624003 most common category: Virus




624008 most common category: Virus




743388 most common category: Virus




743389 most common category: Virus




743390 most common category: Virus




567 most common category: genetic




612 most common category: genetic




718 most common category: genetic




613 most common category: genetic




755 most common category: genetic




571 most common category: genetic




574 most common category: genetic




726 most common category: genetic




749 most common category: genetic




624169 most common category: genetic




624381 most common category: genetic




624503 most common category: genetic




720643 most common category: genetic




720582 most common category: Cancer




743208 most common category: Cancer




743254 most common category: Cancer




743256 most common category: Cancer




743259 most common category: Cancer




743338 most common category: Cancer




720648 most common category: Cancer




743214 most common category: Cancer




743253 most common category: Cancer




743257 most common category: Cancer




743260 most common category: Cancer




743337 most common category: Cancer




435030 most common category: Bacteria




449728 most common category: Bacteria




488942 most common category: Bacteria




488956 most common category: Bacteria




492958 most common category: Bacteria




492959 most common category: Bacteria




504677 most common category: Bacteria




504678 most common category: Bacteria




651942 most common category: Bacteria




651943 most common category: Bacteria




651572 most common category: Cancer




651608 most common category: Cancer




651763 most common category: Cancer




743243 most common category: Cancer




652035 most common category: autoimmune




686958 most common category: autoimmune




651800 most common category: autoimmune




652036 most common category: autoimmune




686957 most common category: autoimmune




1962 most common category: Fungal




2149 most common category: Fungal




2160 most common category: Fungal




2153 most common category: Fungal




2167 most common category: Fungal




2837 most common category: Fungal




2838 most common category: Fungal




434933 most common category: Fungal




434934 most common category: Fungal




2797 most common category: genetic




434964 most common category: genetic




434991 most common category: genetic




463108 most common category: genetic




463127 most common category: genetic




2796 most common category: genetic




2845 most common category: genetic




463088 most common category: genetic




493060 most common category: genetic




624377 most common category: Cancer




624431 most common category: Cancer




651680 most common category: Cancer




2129 most common category: Cancer




2166 most common category: Cancer




2218 most common category: Cancer




2790 most common category: Cancer




624268 most common category: Parasite




624412 most common category: Parasite




651607 most common category: Parasite




651971 most common category: Parasite




651989 most common category: Parasite




686967 most common category: Parasite




743060 most common category: Parasite




720622 most common category: Parasite




743061 most common category: Parasite




743068 most common category: Parasite




743153 most common category: Parasite




743154 most common category: Parasite




743301 most common category: Parasite




1053132 most common category: Parasite




1053134 most common category: Parasite




1053198 most common category: Parasite




1053201 most common category: Parasite




1053204 most common category: Parasite




1053203 most common category: Parasite




686969 most common category: Parasite




720623 most common category: Parasite




743299 most common category: Parasite




743300 most common category: Parasite




2234 most common category: Cancer




2328 most common category: Cancer




2361 most common category: Cancer




2377 most common category: Cancer




488998 most common category: Cancer




504707 most common category: Cancer




504799 most common category: Cancer




504800 most common category: Cancer




504887 most common category: Cancer




504896 most common category: Cancer




588839 most common category: Cancer




504700 most common category: Cancer




504796 most common category: Cancer




504797 most common category: Cancer




504888 most common category: Cancer




504893 most common category: Cancer




588841 most common category: Cancer




463141 most common category: Cancer




488954 most common category: Cancer




489014 most common category: Cancer




493114 most common category: Cancer




504328 most common category: Cancer




504816 most common category: Cancer




504824 most common category: Cancer




463210 most common category: Cancer




488941 most common category: Cancer




489013 most common category: Cancer




493115 most common category: Cancer




504330 most common category: Cancer




504814 most common category: Cancer




504822 most common category: Cancer




624267 most common category: genetic




624370 most common category: genetic




651553 most common category: genetic




651962 most common category: genetic




652166 most common category: genetic




1906 most common category: genetic




2178 most common category: genetic




2196 most common category: genetic




720577 most common category: Infection




720578 most common category: Infection




743296 most common category: Infection




651958 most common category: Infection




686976 most common category: Infection




493232 most common category: genetic




504717 most common category: genetic




624407 most common category: genetic




588814 most common category: Neurological




588819 most common category: Neurological




588852 most common category: Neurological




463079 most common category: genetic




492965 most common category: genetic




504718 most common category: genetic




624408 most common category: genetic




1879 most common category: Respiratory




1706 most common category: Respiratory




1890 most common category: Respiratory




488958 most common category: Respiratory




488999 most common category: Respiratory




588771 most common category: Respiratory




588786 most common category: Respiratory




602486 most common category: Respiratory




652067 most common category: genetic




743032 most common category: genetic




743038 most common category: genetic




743050 most common category: genetic




743059 most common category: genetic




687014 most common category: genetic




652126 most common category: genetic




720734 most common category: genetic




720509 most common category: Cancer




720621 most common category: Cancer




720631 most common category: Cancer




720729 most common category: Cancer




1053129 most common category: Cancer




1053202 most common category: Cancer




720508 most common category: Cancer




720628 most common category: Cancer




720730 most common category: Cancer




1053128 most common category: Cancer




504326 most common category: genetic




504357 most common category: genetic




504900 most common category: genetic




504904 most common category: genetic




588407 most common category: genetic




588411 most common category: genetic




602194 most common category: genetic




602264 most common category: genetic




651685 most common category: genetic




651686 most common category: genetic




651762 most common category: genetic




651764 most common category: genetic




651904 most common category: Toxicity




588435 most common category: genetic




624380 most common category: genetic




624499 most common category: genetic




720642 most common category: genetic




651689 most common category: genetic




651769 most common category: genetic




652034 most common category: genetic




652081 most common category: genetic




504411 most common category: genetic




504445 most common category: genetic




602354 most common category: genetic




602337 most common category: Neurological




602320 most common category: genetic




624468 most common category: genetic




1950 most common category: Cancer




2292 most common category: Cancer




2362 most common category: Cancer




2381 most common category: Cancer




489000 most common category: Cancer




493079 most common category: Cancer




588762 most common category: Cancer




1416 most common category: Cancer




1522 most common category: Cancer




1528 most common category: Cancer




651571 most common category: autoimmune




651604 most common category: autoimmune




651848 most common category: autoimmune




624416 most common category: autoimmune




651937 most common category: autoimmune




651939 most common category: autoimmune




488955 most common category: Bacteria




492957 most common category: Bacteria




504679 most common category: Bacteria




651944 most common category: Bacteria




651982 most common category: genetic




652151 most common category: genetic




651602 most common category: genetic




2174 most common category: Cancer




2233 most common category: Cancer




504510 most common category: Cancer




651998 most common category: Cancer




652003 most common category: Cancer




2177 most common category: Cancer




2232 most common category: Cancer




652001 most common category: Cancer




493110 most common category: Cancer




493161 most common category: Cancer




651990 most common category: Cancer




651991 most common category: Cancer




743118 most common category: Cancer




743119 most common category: Cancer




743127 most common category: Cancer




743132 most common category: Cancer




652145 most common category: Bacteria




588726 most common category: Bacteria




651616 most common category: Bacteria




652135 most common category: Bacteria




588504 most common category: genetic




588505 most common category: genetic




540364 most common category: genetic




588350 most common category: genetic




588351 most common category: genetic




651790 most common category: genetic




651792 most common category: genetic




651719 most common category: genetic




652245 most common category: genetic




687013 most common category: genetic




743095 most common category: genetic




652268 most common category: genetic




687015 most common category: genetic




743092 most common category: genetic




803 most common category: genetic




864 most common category: genetic




865 most common category: Cancer




1050 most common category: genetic




1228 most common category: Cancer




828 most common category: genetic




866 most common category: genetic




867 most common category: Cancer




1225 most common category: genetic




1238 most common category: Cancer




784 most common category: genetic




1268 most common category: genetic




2280 most common category: genetic




2459 most common category: genetic




2802 most common category: genetic




488797 most common category: genetic




1974 most common category: Cancer




2176 most common category: Cancer




463081 most common category: Cancer




463094 most common category: Cancer




463098 most common category: Cancer




463142 most common category: Cancer




651953 most common category: genetic




686987 most common category: genetic




686989 most common category: genetic




743237 most common category: genetic




434989 most common category: genetic




485270 most common category: genetic




492963 most common category: genetic




492964 most common category: genetic




504699 most common category: genetic




504701 most common category: genetic




624409 most common category: genetic




624410 most common category: genetic




1899 most common category: Cancer




2159 most common category: Cancer




463085 most common category: Cancer




485271 most common category: Cancer




2152 most common category: Cancer




485280 most common category: Cancer




2488 most common category: Cancer




651577 most common category: Cancer




504933 most common category: Cancer




651611 most common category: Cancer




651615 most common category: Cancer




651969 most common category: Cancer




651973 most common category: Cancer




651974 most common category: Cancer




651975 most common category: Cancer




588794 most common category: Cancer




602167 most common category: Cancer




651781 most common category: Cancer




588824 most common category: Cancer




602236 most common category: Cancer




651794 most common category: Cancer




624379 most common category: Ocular




624395 most common category: Ocular




651846 most common category: Ocular




687007 most common category: Cancer




720547 most common category: Cancer




743283 most common category: Cancer




651674 most common category: Cardiovascular




651760 most common category: Cardiovascular




652123 most common category: Cardiovascular




652137 most common category: Cardiovascular




1789 most common category: Cancer




1846 most common category: Cancer




1847 most common category: Cancer




1912 most common category: Cancer




1913 most common category: Cancer




2747 most common category: Cancer




2748 most common category: Cancer




652181 most common category: Cancer




1203 most common category: Neurological




1252 most common category: Neurological




434962 most common category: genetic




435028 most common category: genetic




449730 most common category: Diabetes




463220 most common category: genetic




588709 most common category: Diabetes




588711 most common category: genetic




588712 most common category: genetic




588718 most common category: Diabetes




493087 most common category: genetic




588439 most common category: genetic




588681 most common category: genetic




1825 most common category: Cancer




1905 most common category: Cancer




2749 most common category: Cancer




434956 most common category: Cancer




1907 most common category: Cancer




485336 most common category: Cancer




1700 most common category: Cancer




1834 most common category: Cancer




1973 most common category: Cancer




2750 most common category: Cancer




434957 most common category: Cancer




2165 most common category: genetic




1446 most common category: genetic




1521 most common category: genetic




1691 most common category: genetic




1699 most common category: genetic




624413 most common category: Parasite




651972 most common category: Parasite




686968 most common category: Parasite




686952 most common category: Cancer




720493 most common category: Cancer




652039 most common category: Cancer




686949 most common category: Cancer




720500 most common category: Cancer




746 most common category: genetic




1284 most common category: Neurological




686964 most common category: Cancer




720531 most common category: Cancer




720645 most common category: Cancer




1053169 most common category: Cancer




540295 most common category: genetic




540308 most common category: genetic




602298 most common category: genetic




602193 most common category: genetic




602195 most common category: genetic




602263 most common category: genetic




602305 most common category: genetic




651547 most common category: genetic




651555 most common category: genetic




651557 most common category: genetic




2057 most common category: Cancer




2168 most common category: Cancer




2217 most common category: Cancer




2791 most common category: Cancer




602165 most common category: Cancer




1448 most common category: genetic




1525 most common category: genetic




1526 most common category: genetic




1562 most common category: genetic




1660 most common category: genetic




2510 most common category: genetic




2694 most common category: genetic




2719 most common category: genetic




602128 most common category: genetic




602129 most common category: genetic




2148 most common category: genetic




2257 most common category: genetic




463250 most common category: genetic




588563 most common category: genetic




588581 most common category: genetic




1159602 most common category: genetic




1159604 most common category: genetic




1159605 most common category: genetic




602163 most common category: Respiratory




602270 most common category: Respiratory




623963 most common category: Respiratory




624497 most common category: Respiratory




651718 most common category: Respiratory




651822 most common category: Respiratory




651967 most common category: Respiratory




1792 most common category: Cancer




2154 most common category: Cancer




2532 most common category: Cancer




2538 most common category: Cancer




2539 most common category: Cancer




2541 most common category: Cancer




2545 most common category: Cancer




2556 most common category: Cancer




2664 most common category: Cancer




2752 most common category: Cancer




2773 most common category: Cancer




2808 most common category: Cancer




2819 most common category: Cancer




434953 most common category: Cancer




434974 most common category: Cancer




434997 most common category: Cancer




435002 most common category: Cancer




435009 most common category: Cancer




435013 most common category: Cancer




631 most common category: Cancer




1319 most common category: Cancer




1300 most common category: Cancer




1679 most common category: Cancer




588354 most common category: Cancer




588820 most common category: Cancer




602168 most common category: Cancer




602235 most common category: Cancer




651786 most common category: Cancer




651796 most common category: Cancer




651782 most common category: Cancer




651799 most common category: Cancer




651957 most common category: Cancer




652008 most common category: Cancer




651779 most common category: Cancer




731 most common category: Cancer




1301 most common category: Cancer




1331 most common category: Cancer




1684 most common category: Cancer




588352 most common category: Cancer




588792 most common category: Cancer




602166 most common category: Cancer




602234 most common category: Cancer




651788 most common category: Cancer




651797 most common category: Cancer




1861 most common category: genetic




1952 most common category: genetic




2251 most common category: genetic




463251 most common category: genetic




485339 most common category: genetic




588566 most common category: genetic




588583 most common category: genetic




1040 most common category: Cancer




1254 most common category: Cancer




1256 most common category: genetic




1277 most common category: Cancer




1279 most common category: genetic




1304 most common category: Cancer




1546 most common category: Cancer




1651 most common category: genetic




1697 most common category: Cancer




1702 most common category: genetic




2208 most common category: Cancer




2209 most common category: Cancer




2211 most common category: genetic




2212 most common category: genetic




793 most common category: genetic




1255 most common category: Cancer




1257 most common category: genetic




1272 most common category: genetic




1278 most common category: Cancer




1359 most common category: genetic




1539 most common category: genetic




1649 most common category: Cancer




1698 most common category: Cancer




1710 most common category: genetic




2142 most common category: Neurological




2207 most common category: Cancer




2210 most common category: genetic




2219 most common category: Cancer




2220 most common category: genetic




463143 most common category: Cardiovascular




463150 most common category: Cardiovascular




720737 most common category: genetic




743027 most common category: genetic




743037 most common category: genetic




743051 most common category: genetic




743052 most common category: genetic




434939 most common category: genetic




463086 most common category: genetic




493061 most common category: genetic




686940 most common category: Cancer




687008 most common category: Cancer




720548 most common category: Cancer




743284 most common category: Cancer




488782 most common category: Cancer




602396 most common category: Cancer




651613 most common category: Cancer




651970 most common category: Cancer




651976 most common category: Cancer




1800 most common category: Infection




1845 most common category: Infection




1943 most common category: Infection




1945 most common category: Infection




2172 most common category: Infection




2173 most common category: Infection




2474 most common category: Infection




2476 most common category: Infection




623966 most common category: Infection




623968 most common category: genetic




623970 most common category: Infection




623972 most common category: Infection




623973 most common category: Infection




504766 most common category: Cancer




588797 most common category: Cancer




588821 most common category: Cancer




588822 most common category: Cancer




624313 most common category: Cancer




652010 most common category: Cancer




652134 most common category: Cancer




687017 most common category: Cancer




652031 most common category: genetic




652032 most common category: genetic




652077 most common category: genetic




652084 most common category: genetic




2435 most common category: genetic




2445 most common category: genetic




434963 most common category: genetic




434969 most common category: genetic




434985 most common category: genetic




463103 most common category: genetic




463125 most common category: genetic




463128 most common category: genetic




492956 most common category: Cardiovascular




493030 most common category: Cardiovascular




504494 most common category: Cardiovascular




504496 most common category: Cardiovascular




493027 most common category: Cardiovascular




504317 most common category: Cardiovascular




651766 most common category: Cardiovascular




652125 most common category: Cardiovascular




493035 most common category: Cardiovascular




504319 most common category: Cardiovascular




602281 most common category: Cardiovascular




651612 most common category: Cardiovascular




651677 most common category: Cardiovascular




651733 most common category: Cardiovascular




651759 most common category: Cardiovascular




651761 most common category: Cardiovascular




652124 most common category: Cardiovascular




652130 most common category: Cardiovascular




652138 most common category: Cardiovascular




1822 most common category: genetic




2170 most common category: genetic




2195 most common category: genetic




2215 most common category: genetic




492974 most common category: genetic




492975 most common category: genetic




743126 most common category: genetic




743280 most common category: genetic




743457 most common category: genetic




2300 most common category: Ocular




2379 most common category: Ocular




2758 most common category: Ocular




463256 most common category: Ocular




602229 most common category: Ocular




624378 most common category: Ocular




624394 most common category: Ocular




651849 most common category: Ocular




463082 most common category: Cardiovascular




463230 most common category: Cardiovascular




588766 most common category: Cardiovascular




588769 most common category: Cardiovascular




588770 most common category: Cardiovascular




720704 most common category: Neurological




743261 most common category: Neurological




743328 most common category: Neurological




2759 most common category: Ocular




463257 most common category: Ocular




504787 most common category: Ocular




1032 most common category: Cancer




1297 most common category: Cancer




1323 most common category: Cancer




1681 most common category: Cancer




504446 most common category: Cancer




504447 most common category: Cancer




504452 most common category: Cancer




504453 most common category: Cancer




504939 most common category: Cancer




504943 most common category: Cancer




2130 most common category: Cancer




2171 most common category: Cancer




2291 most common category: Cancer




2363 most common category: Cancer




2368 most common category: Cancer




2369 most common category: Cancer




463124 most common category: Cancer




463130 most common category: Cancer




463131 most common category: Cancer




2235 most common category: Cancer




2355 most common category: Cancer




2358 most common category: Cancer




2394 most common category: Cancer




2403 most common category: Cancer




624446 most common category: Cancer




652112 most common category: Diabetes




652207 most common category: Diabetes




652216 most common category: Diabetes




652220 most common category: Diabetes




652222 most common category: Diabetes




652227 most common category: Diabetes




652232 most common category: Diabetes




1987 most common category: Cancer




2331 most common category: Cancer




2360 most common category: Cancer




2395 most common category: Cancer




2422 most common category: Cancer




463224 most common category: Cancer




624425 most common category: Cancer




624432 most common category: Cancer




624433 most common category: Cancer




624439 most common category: Cancer




624447 most common category: Cancer




624448 most common category: Cancer




652111 most common category: Diabetes




652225 most common category: Diabetes




652226 most common category: Diabetes




652230 most common category: Diabetes




463073 most common category: genetic




485272 most common category: genetic




488796 most common category: genetic




492970 most common category: genetic




588416 most common category: genetic




588417 most common category: genetic




588418 most common category: genetic




588419 most common category: genetic




588420 most common category: genetic




588421 most common category: genetic




588422 most common category: genetic




588423 most common category: genetic




743269 most common category: genetic




1053171 most common category: genetic




1053172 most common category: genetic




602125 most common category: genetic




602182 most common category: genetic




602397 most common category: genetic




624123 most common category: genetic




686965 most common category: genetic




588664 most common category: genetic




602124 most common category: genetic




602181 most common category: genetic




602398 most common category: genetic




624124 most common category: genetic




686966 most common category: genetic




651821 most common category: genetic




652065 most common category: genetic




652068 most common category: genetic




686959 most common category: genetic




686960 most common category: genetic




720649 most common category: genetic




2277 most common category: Cardiovascular




463148 most common category: Cardiovascular




561 most common category: genetic




463152 most common category: Cardiovascular




1509 most common category: Cardiovascular




1510 most common category: Cardiovascular




1523 most common category: Cardiovascular




1524 most common category: Cardiovascular




1686 most common category: Cardiovascular




1692 most common category: Cardiovascular




2332 most common category: Cardiovascular




2346 most common category: Cardiovascular




463107 most common category: Cardiovascular




463225 most common category: Cardiovascular




504460 most common category: Cardiovascular




504871 most common category: Cardiovascular




504876 most common category: Cardiovascular




504917 most common category: Cardiovascular




504918 most common category: Cardiovascular




504919 most common category: Cardiovascular




504921 most common category: Cardiovascular




504923 most common category: Cardiovascular




504924 most common category: Cardiovascular




624371 most common category: genetic




651961 most common category: genetic




651552 most common category: genetic




652017 most common category: Cancer




652260 most common category: Cancer




686939 most common category: Cancer




686991 most common category: Cancer




686995 most common category: Cancer




720660 most common category: Cancer




720661 most common category: Cancer




729 most common category: Cancer




736 most common category: Cancer




872 most common category: Cancer




874 most common category: Cancer




485 most common category: Cardiovascular




1429 most common category: Cardiovascular




1518 most common category: Cardiovascular




484 most common category: Cardiovascular




920 most common category: Cancer




1263 most common category: Cancer




1303 most common category: Cancer




1317 most common category: Cancer




1396 most common category: Cancer




1411 most common category: Cancer




2772 most common category: Cancer




932 most common category: Cancer




1262 most common category: Cancer




1306 most common category: Cancer




1318 most common category: Cancer




1397 most common category: Cancer




1406 most common category: Cancer




434932 most common category: Cancer




434988 most common category: Cancer




449760 most common category: Cancer




862 most common category: Cancer




1265 most common category: Cancer




1267 most common category: Cancer




1310 most common category: Cancer




2078 most common category: Cancer




2771 most common category: Cancer




871 most common category: Cancer




1316 most common category: Cancer




1398 most common category: Cancer




1404 most common category: Cancer




2049 most common category: Cancer




1399 most common category: Cancer




1409 most common category: Cancer




651614 most common category: Cancer




651968 most common category: Cancer




651977 most common category: Cancer




588341 most common category: autoimmune




540251 most common category: autoimmune




504734 most common category: autoimmune




540250 most common category: autoimmune




588336 most common category: autoimmune




588339 most common category: autoimmune




588340 most common category: autoimmune




624466 most common category: genetic




651785 most common category: genetic




651955 most common category: genetic




686986 most common category: genetic




686994 most common category: genetic




743234 most common category: genetic




743235 most common category: genetic




1053182 most common category: genetic




1117265 most common category: genetic




624467 most common category: genetic




651783 most common category: genetic




651951 most common category: genetic




686984 most common category: genetic




686985 most common category: genetic




743229 most common category: genetic




743231 most common category: genetic




743490 most common category: genetic




743491 most common category: genetic




1053177 most common category: genetic




1053178 most common category: genetic




1053181 most common category: genetic




1424 most common category: genetic




1538 most common category: genetic




1682 most common category: genetic




2583 most common category: genetic




2692 most common category: genetic




493244 most common category: genetic




504635 most common category: genetic




504742 most common category: genetic




1117267 most common category: genetic




1117279 most common category: genetic




1117280 most common category: genetic




1117296 most common category: genetic




1117297 most common category: genetic




720702 most common category: Cancer




743263 most common category: Cancer




743297 most common category: Cancer




1083212 most common category: Cancer




687016 most common category: Cancer




720530 most common category: Cancer




720644 most common category: Cancer




1053170 most common category: Cancer




1481 most common category: Cancer




1517 most common category: Cancer




1534 most common category: Cancer




1544 most common category: Cancer




1551 most common category: Cancer




1629 most common category: Cancer




2131 most common category: Cancer




1556 most common category: Bacteria




1857 most common category: Bacteria




1860 most common category: Bacteria




1919 most common category: Bacteria




1920 most common category: Bacteria




1925 most common category: Infection




1926 most common category: Bacteria




1927 most common category: Bacteria




2184 most common category: Bacteria




2187 most common category: Bacteria




2189 most common category: Bacteria




2317 most common category: Bacteria




2754 most common category: Bacteria




2755 most common category: Infection




2756 most common category: Bacteria




2767 most common category: Bacteria




2768 most common category: Bacteria




2769 most common category: Bacteria




1321 most common category: Cancer




1410 most common category: Cancer




1412 most common category: Cancer




1413 most common category: Cancer




2088 most common category: Cancer




463080 most common category: Cancer




463169 most common category: Cancer




651560 most common category: genetic




651700 most common category: genetic




652005 most common category: genetic




686962 most common category: genetic




686963 most common category: genetic




743307 most common category: genetic




743308 most common category: genetic




2544 most common category: genetic




434927 most common category: genetic




463135 most common category: genetic




488793 most common category: genetic




488874 most common category: genetic




493137 most common category: genetic




493142 most common category: genetic




540265 most common category: genetic




540274 most common category: genetic




813 most common category: genetic




1056 most common category: genetic




1136 most common category: genetic




1450 most common category: genetic




1659 most common category: genetic




1941 most common category: genetic




489030 most common category: Cancer




504614 most common category: Cancer




504615 most common category: Cancer




588524 most common category: Cancer




588538 most common category: Cancer




588555 most common category: Cancer




602460 most common category: Cancer




489031 most common category: Cancer




504616 most common category: Cancer




504617 most common category: Cancer




588554 most common category: Cancer




588572 most common category: Cancer




588592 most common category: Cancer




602469 most common category: Cancer




493011 most common category: genetic




493151 most common category: genetic




504714 most common category: genetic




504724 most common category: genetic




588857 most common category: genetic




624089 most common category: genetic




493012 most common category: genetic




493152 most common category: genetic




504715 most common category: genetic




504719 most common category: genetic




602135 most common category: genetic




602136 most common category: genetic




624087 most common category: genetic




504462 most common category: Cancer




504756 most common category: Cancer




504757 most common category: Cancer




588584 most common category: Cancer




435022 most common category: Cancer




489023 most common category: Cancer




504485 most common category: Cancer




504508 most common category: Cancer




504515 most common category: Cancer




504516 most common category: Cancer




504518 most common category: Cancer




504528 most common category: Toxicity




504641 most common category: Cancer




504690 most common category: Parasite




504753 most common category: Parasite




504765 most common category: Parasite




504862 most common category: Aging




504863 most common category: Aging




540252 most common category: Parasite




540269 most common category: Parasite




588415 most common category: Parasite




588588 most common category: Parasite




588593 most common category: Parasite




588671 most common category: Parasite




602131 most common category: Parasite




602132 most common category: Parasite




602133 most common category: Parasite




602423 most common category: Parasite




602425 most common category: Parasite




488857 most common category: autoimmune




488863 most common category: autoimmune




488901 most common category: genetic




488918 most common category: genetic




504488 most common category: genetic




588599 most common category: genetic




651565 most common category: Cancer




1496 most common category: genetic




1502 most common category: genetic




1550 most common category: genetic




1560 most common category: genetic




588473 most common category: genetic




602473 most common category: genetic




651648 most common category: genetic




588475 most common category: genetic




602180 most common category: genetic




651639 most common category: genetic




651649 most common category: genetic




493091 most common category: genetic




540281 most common category: genetic




540297 most common category: genetic




540313 most common category: genetic




588850 most common category: genetic




602472 most common category: genetic




624344 most common category: genetic




651592 most common category: genetic




686954 most common category: Cancer




720701 most common category: Cancer




588458 most common category: genetic




602382 most common category: genetic




602385 most common category: genetic




602386 most common category: genetic




602387 most common category: genetic




1957 most common category: Cancer




1958 most common category: Cancer




1992 most common category: Cancer




2684 most common category: Cancer




449733 most common category: Cancer




488861 most common category: Cancer




540288 most common category: Cancer




652176 most common category: genetic




652193 most common category: genetic




504720 most common category: genetic




588481 most common category: genetic




588502 most common category: genetic




588602 most common category: genetic




588603 most common category: genetic




602261 most common category: Cancer




624325 most common category: Cancer




624326 most common category: Cancer




624327 most common category: Cancer




651670 most common category: Cancer




652164 most common category: Cancer




652165 most common category: Cancer




652286 most common category: Cancer




652287 most common category: Cancer




1347040 most common category: Cancer




651636 most common category: genetic




651997 most common category: genetic




652000 most common category: genetic




743408 most common category: autoimmune




743410 most common category: genetic




743411 most common category: autoimmune




588413 most common category: Cancer




602428 most common category: Cancer




602464 most common category: Cancer




651836 most common category: Cancer




651837 most common category: Cancer




651994 most common category: Cancer




651995 most common category: Cancer




463219 most common category: genetic




504443 most common category: genetic




504422 most common category: Obesity




463191 most common category: Obesity




493092 most common category: Obesity




504440 most common category: Obesity




1656 most common category: Obesity




463183 most common category: Obesity




493160 most common category: Diabetes




504710 most common category: Diabetes




504729 most common category: Diabetes




504763 most common category: genetic




540304 most common category: Diabetes




588355 most common category: Diabetes




588452 most common category: Diabetes




624352 most common category: Cancer




651580 most common category: Cancer




651581 most common category: Cancer




652011 most common category: Cancer




624168 most common category: genetic




651671 most common category: genetic




651675 most common category: genetic




651684 most common category: genetic




485346 most common category: Cancer




489028 most common category: Cancer




504593 most common category: Cancer




504601 most common category: Cancer




504609 most common category: Cancer




504607 most common category: Cancer




651561 most common category: Aging




624504 most common category: Aging




60249 most common category: genetic




651647 most common category: Cancer




652235 most common category: Cancer




652242 most common category: Cancer




652244 most common category: Cancer




652246 most common category: Cancer




652252 most common category: Cancer




652267 most common category: Cancer




652271 most common category: Cancer




588492 most common category: Cardiovascular




588780 most common category: Cardiovascular




602210 most common category: Cardiovascular




602211 most common category: Cardiovascular




623867 most common category: Cardiovascular




623871 most common category: Cardiovascular




623872 most common category: Cardiovascular




623873 most common category: Cardiovascular




624454 most common category: Cardiovascular




624458 most common category: Cardiovascular




624460 most common category: Cardiovascular




651709 most common category: Bacteria




624309 most common category: Bacteria




624317 most common category: Bacteria




602399 most common category: Bacteria




651699 most common category: Cancer




652217 most common category: Cancer




652247 most common category: Cancer




493036 most common category: Cancer




504549 most common category: Cancer




504550 most common category: Cancer




588503 most common category: Cancer




602356 most common category: Cancer




602426 most common category: Cancer




602427 most common category: genetic




602459 most common category: genetic




602482 most common category: Cancer




588495 most common category: Cancer




602334 most common category: Cancer




651650 most common category: Cancer




602438 most common category: Cancer




2071 most common category: autoimmune




488841 most common category: autoimmune




488860 most common category: autoimmune




2825 most common category: autoimmune




435006 most common category: autoimmune




488784 most common category: autoimmune




488794 most common category: autoimmune




488799 most common category: autoimmune




488800 most common category: autoimmune




602274 most common category: genetic




623861 most common category: genetic




624145 most common category: genetic




651676 most common category: genetic




588405 most common category: Cancer




602417 most common category: Cancer




624167 most common category: Cancer




651549 most common category: Cancer




651551 most common category: Cancer




512194 most common category: Cancer




602361 most common category: Cancer




602318 most common category: Cancer




602330 most common category: Cancer




602333 most common category: Cancer




602368 most common category: Cancer




602369 most common category: Cancer




652285 most common category: Cancer




686916 most common category: Cancer




686917 most common category: Cancer




686918 most common category: Cancer




686932 most common category: Cancer




588621 most common category: genetic




602367 most common category: genetic




602372 most common category: genetic




602374 most common category: genetic




623866 most common category: genetic




624207 most common category: genetic




624241 most common category: genetic




2599 most common category: genetic




488915 most common category: genetic




488921 most common category: genetic




504492 most common category: genetic




588598 most common category: genetic




624204 most common category: Cancer




651678 most common category: Cancer




651690 most common category: Cancer




651693 most common category: Cancer




651697 most common category: Cancer




2540 most common category: genetic




488903 most common category: genetic




488912 most common category: genetic




602440 most common category: Cancer




624319 most common category: Cancer




624322 most common category: Cancer




651559 most common category: genetic




624304 most common category: genetic




624474 most common category: genetic




651563 most common category: genetic




651996 most common category: genetic




652140 most common category: genetic




652265 most common category: genetic




743022 most common category: genetic




602429 most common category: Cancer




624382 most common category: Cancer




624383 most common category: Cancer




624384 most common category: Cancer




624385 most common category: Cancer




434973 most common category: genetic




488904 most common category: genetic




488917 most common category: genetic




504497 most common category: genetic




588600 most common category: genetic




2069 most common category: Cancer




2006 most common category: Cancer




2018 most common category: Cancer




2614 most common category: Cancer




485337 most common category: Cancer




485374 most common category: Cancer




485391 most common category: Cancer




488777 most common category: Cancer




435003 most common category: Cancer




435020 most common category: Cancer




489033 most common category: Cancer




489035 most common category: Cancer




489041 most common category: Cancer




504487 most common category: Cancer




504489 most common category: Cancer




504514 most common category: Cancer




504517 most common category: Cancer




504671 most common category: Cancer




504664 most common category: Cancer




463190 most common category: Cancer




463195 most common category: Cancer




463213 most common category: Cancer




463215 most common category: Cancer




493003 most common category: Cancer




504542 most common category: Cancer




504657 most common category: Cancer




504672 most common category: Cancer




602378 most common category: Cancer




602380 most common category: Cancer




463212 most common category: Cancer




463218 most common category: Cancer




493002 most common category: Cancer




504544 most common category: Cancer




602375 most common category: Cancer




624354 most common category: Cancer




651596 most common category: Cancer




652002 most common category: Cancer




651582 most common category: Diabetes




651629 most common category: Diabetes




651630 most common category: Diabetes




743160 most common category: Diabetes




743161 most common category: Diabetes




743168 most common category: Diabetes




743170 most common category: Diabetes




2520 most common category: genetic




2764 most common category: genetic




488748 most common category: genetic




488811 most common category: genetic




488865 most common category: genetic




488881 most common category: genetic




488985 most common category: genetic




492985 most common category: genetic




492986 most common category: genetic




492982 most common category: genetic




493183 most common category: genetic




493202 most common category: genetic




504524 most common category: genetic




504532 most common category: genetic




2521 most common category: genetic




2766 most common category: genetic




2784 most common category: genetic




463109 most common category: genetic




488803 most common category: genetic




488992 most common category: genetic




504436 most common category: genetic




504455 most common category: genetic




493098 most common category: Cancer




504728 most common category: Cancer




540334 most common category: Cancer




651940 most common category: Cancer




602244 most common category: Cancer




602409 most common category: Cancer




624129 most common category: Cancer




651598 most common category: Cancer




651601 most common category: Cancer




651708 most common category: Cancer




651919 most common category: Cancer




449763 most common category: Cancer




463104 most common category: genetic




463112 most common category: Cancer




485299 most common category: genetic




489024 most common category: Cancer




489027 most common category: Cancer




489032 most common category: genetic




489040 most common category: genetic




540305 most common category: genetic




540306 most common category: Cancer




540311 most common category: genetic




540312 most common category: Cancer




588556 most common category: Cancer




588557 most common category: Cancer




588558 most common category: genetic




588565 most common category: genetic




588567 most common category: Cancer




588569 most common category: genetic




588570 most common category: genetic




588571 most common category: Cancer




588580 most common category: genetic




588582 most common category: genetic




588594 most common category: Cancer




588597 most common category: Cancer




485273 most common category: autoimmune




488859 most common category: autoimmune




493155 most common category: autoimmune




493182 most common category: autoimmune




504687 most common category: autoimmune




588390 most common category: autoimmune




602205 most common category: autoimmune




602404 most common category: autoimmune




1745852 most common category: genetic




1745853 most common category: genetic




2404 most common category: genetic




1672 most common category: Cardiovascular




2032 most common category: genetic




2105 most common category: genetic




2236 most common category: genetic




2345 most common category: genetic




2581 most common category: genetic




2591 most common category: genetic




2594 most common category: genetic




504555 most common category: genetic




504557 most common category: genetic




504559 most common category: genetic




504693 most common category: genetic




504694 most common category: genetic




504695 most common category: genetic




504828 most common category: genetic




488922 most common category: Cancer




492992 most common category: Cancer




492993 most common category: genetic




492997 most common category: Cancer




504846 most common category: Aging




504902 most common category: Aging




504922 most common category: genetic




540321 most common category: genetic




540323 most common category: genetic




540324 most common category: Aging




588724 most common category: Aging




588759 most common category: Aging




588760 most common category: genetic




623881 most common category: genetic




623884 most common category: Aging




623887 most common category: Aging




2156 most common category: genetic




493025 most common category: genetic




493026 most common category: genetic




493029 most common category: genetic




493037 most common category: genetic




493039 most common category: Neurological




588425 most common category: Neurological




588426 most common category: Neurological




588637 most common category: Neurological




2239 most common category: genetic




2282 most common category: genetic




2287 most common category: genetic




2408 most common category: genetic




2415 most common category: genetic




2432 most common category: genetic




2443 most common category: genetic




2548 most common category: genetic




2558 most common category: genetic




2603 most common category: genetic




2654 most common category: genetic




493038 most common category: Neurological




493042 most common category: Neurological




493043 most common category: Neurological




493044 most common category: Neurological




493113 most common category: Neurological




504416 most common category: genetic




504417 most common category: genetic




504418 most common category: genetic




463111 most common category: Cardiovascular




602282 most common category: genetic




602283 most common category: Aging




624166 most common category: Cardiovascular




488975 most common category: Neurological




493221 most common category: Neurological




493222 most common category: Neurological




504840 most common category: Neurological




588401 most common category: Neurological




602208 most common category: Neurological




488977 most common category: Neurological




651756 most common category: Neurological




504833 most common category: Neurological




602376 most common category: Neurological




623908 most common category: Neurological




651748 most common category: Neurological




504554 most common category: genetic




504866 most common category: genetic




2247 most common category: Cardiovascular




2636 most common category: genetic




2637 most common category: genetic




2776 most common category: Aging




2777 most common category: Aging




434942 most common category: genetic




434978 most common category: genetic




492988 most common category: genetic




492994 most common category: Cardiovascular




492995 most common category: Cardiovascular




492996 most common category: Cardiovascular




2553 most common category: genetic




2696 most common category: Aging




434948 most common category: Aging




488960 most common category: Aging




492981 most common category: Aging




492987 most common category: genetic




504567 most common category: Aging




504572 most common category: Aging




504885 most common category: Aging




2779 most common category: Aging




2780 most common category: Aging




449723 most common category: Aging




2237 most common category: Cardiovascular




2426 most common category: genetic




2461 most common category: genetic




434937 most common category: genetic




434977 most common category: genetic




493211 most common category: genetic




434950 most common category: Aging




2227 most common category: Cardiovascular




2554 most common category: genetic




2555 most common category: genetic




434941 most common category: genetic




434952 most common category: Aging




434979 most common category: genetic




449724 most common category: Aging




493223 most common category: genetic




488965 most common category: genetic




493231 most common category: genetic




602389 most common category: genetic




623951 most common category: genetic




623985 most common category: genetic




623991 most common category: genetic




623993 most common category: genetic




624011 most common category: genetic




624016 most common category: genetic




624018 most common category: genetic




624020 most common category: genetic




624058 most common category: genetic




624064 most common category: genetic




624070 most common category: genetic




624072 most common category: genetic




624073 most common category: genetic




624074 most common category: genetic




624075 most common category: genetic




624102 most common category: genetic




624104 most common category: genetic




624105 most common category: genetic




624106 most common category: genetic




624107 most common category: genetic




624109 most common category: genetic




623870 most common category: Cancer




651703 most common category: genetic




651705 most common category: Cancer




720560 most common category: Cancer




720561 most common category: Cancer




720563 most common category: genetic




720564 most common category: genetic




2097 most common category: genetic




434954 most common category: genetic




623989 most common category: genetic




623998 most common category: genetic




2453 most common category: genetic




2456 most common category: genetic




1814 most common category: genetic




2098 most common category: Cancer




2382 most common category: Cancer




493083 most common category: Cancer




493085 most common category: Cancer




588827 most common category: Cancer




602266 most common category: Cancer




602268 most common category: Cancer




602269 most common category: Cancer




1910 most common category: Cancer




2089 most common category: Cancer




2486 most common category: Cancer




434951 most common category: Cancer




488804 most common category: Cancer




488805 most common category: Cancer




488820 most common category: Cancer




488843 most common category: Cancer




493180 most common category: Cancer




493193 most common category: Cancer




493195 most common category: Cancer




493213 most common category: Cancer




493225 most common category: Cancer




493227 most common category: Cancer




493228 most common category: Cancer




493234 most common category: Cancer




493235 most common category: Cancer




493236 most common category: Cancer




493237 most common category: Cancer




493238 most common category: Cancer




493239 most common category: Cancer




493249 most common category: Cancer




504323 most common category: Cancer




504324 most common category: Cancer




504331 most common category: Cancer




504588 most common category: Cancer




504597 most common category: Cancer




2723 most common category: Bacteria




2727 most common category: Bacteria




2728 most common category: Bacteria




2735 most common category: Bacteria




434943 most common category: Bacteria




493096 most common category: Bacteria




1832 most common category: genetic




493130 most common category: genetic




2739 most common category: genetic




449745 most common category: genetic




493250 most common category: genetic




743445 most common category: Cancer




1053173 most common category: Cancer




2704 most common category: Fungal




2695 most common category: Toxicity




2683 most common category: Toxicity




1875 most common category: Toxicity




2096 most common category: Toxicity




2525 most common category: Toxicity




2717 most common category: Cancer




449748 most common category: Cancer




463074 most common category: Cancer




504535 most common category: Cancer




504667 most common category: Cancer




493226 most common category: Cancer




504449 most common category: Cancer




493176 most common category: Cancer




504788 most common category: Cancer




1900 most common category: Bacteria




504351 most common category: genetic




504396 most common category: genetic




1662 most common category: Bacteria




1902 most common category: Bacteria




1914 most common category: genetic




2511 most common category: Cancer




2518 most common category: Cancer




2655 most common category: Cancer




493068 most common category: Cancer




2656 most common category: Cancer




2657 most common category: Cancer


In [5]:
# Pad disease_type_list with empty strings so it has one entry per dataframe row.
# The target length is read from df instead of being hard-coded (previously 1864),
# so the padding stays correct if the number of rows changes.
num_empty_strings = max(len(df) - len(disease_type_list), 0)  # never negative
empty_strings = [""] * num_empty_strings
padded_list = disease_type_list + empty_strings


In [6]:
# Count how many distinct disease categories were assigned
num_of_unique_diseases = len(set(disease_type_list))
num_of_unique_diseases

16

In [7]:
# Show the distinct categories that were assigned (set order is arbitrary)
list(set(disease_type_list))

['Toxicity',
 'Cardiovascular',
 'Obesity',
 'Infection',
 'Fungal',
 'Virus',
 'Bacteria',
 'autoimmune',
 'Parasite',
 'Respiratory',
 'Ocular',
 'genetic',
 'Neurological',
 'Aging',
 'Diabetes',
 'Cancer']

In [8]:
# Add results to the dataframe and save to csv.
# A column assigned from a list needs exactly one value per row, so the labels
# are padded with empty strings when fewer labels than rows were produced
# (assigning the unpadded list would raise a length-mismatch ValueError).
# NOTE(review): padding at the end assumes the unlabeled rows are the trailing
# ones — confirm against the loop that builds disease_type_list.
num_missing_labels = len(df) - len(disease_type_list)
if num_missing_labels < 0:
    raise ValueError(
        "disease_type_list has {} entries but df has only {} rows".format(
            len(disease_type_list), len(df)
        )
    )
df['Disease Type'] = disease_type_list + [""] * num_missing_labels
df.to_csv('final_groups.csv', index=False)