In [2]:
import pandas as pd
import plotly.express as px
import matplotlib.pyplot as plt
import numpy as np
import seaborn as sns

# Load the linearized ATLAS phenotypic and demographic data (the CSV is >1.5 GB).
# low_memory=False has pandas infer each column's dtype from the whole file
# instead of chunk by chunk, which avoids mixed-dtype columns.
atlas = pd.read_csv(
    'atlas_2024.csv',
    low_memory=False,
)

In [None]:
# Lookup table: antibiotic name -> antibiotic class label.
# Used with Series.map, so any antibiotic name missing from this table
# maps to NaN.
antibiotics_groups = {
    'Amikacin': 'Aminoglycosides',
    'Cefepime': 'Cephalosporins',
    'Ceftazidime': 'Cephalosporins',
    'Levofloxacin': 'Fluoroquinolones',
    'Meropenem': 'Carbapenems',
    'Piperacillin tazobactam': 'Penicillins',
    'Amoxycillin clavulanate': 'Penicillins',
    'Ampicillin': 'Penicillins',
    'Ceftriaxone': 'Cephalosporins',
    'Minocycline': 'Tetracycline',
    'Tigecycline': 'Tetracycline',
    'Linezolid': 'Oxazolidinones',
    'Vancomycin': 'Glycopeptides',
    'Penicillin': 'Penicillins',
    'Azithromycin': 'Macrolides',
    'Clarithromycin': 'Macrolides',
    'Clindamycin': 'Lincosamide',
    'Erythromycin': 'Macrolides',
    'Metronidazole': 'Nitroimidazole',
    'Cefoxitin': 'Cephalosporins',
    'Imipenem': 'Carbapenems',
    'Ceftaroline': 'Cephalosporins',
    'Ceftazidime avibactam': 'Cephalosporins',
    'Doripenem': 'Carbapenems',
    'Ertapenem': 'Carbapenems',
    'Moxifloxacin': 'Fluoroquinolones',
    'Oxacillin': 'Penicillins',
    'Teicoplanin': 'Glycopeptides',
    'Ampicillin sulbactam': 'Penicillins',
    'Colistin': 'Colistin',
    'Gentamicin': 'Aminoglycosides',
    'Cefixime': 'Cephalosporins',
    'Ciprofloxacin': 'Fluoroquinolones',
    'Tetracycline': 'Tetracycline',
    'Ceftolozane tazobactam': 'Cephalosporins',
    'Meropenem vaborbactam': 'Carbapenems',
    'Aztreonam': 'Monobactams (Aztreonam)',
    'Daptomycin': 'Cyclic lipopeptides (Daptomycin)',
    'Trimethoprim sulfa': 'Sulfonamides (Cotrimoxazole)',
    'Quinupristin dalfopristin': 'Streptogramin (Quinupristin dalfopristin)',
}

# Lookup table: specimen source -> infection category.
# Runs of sources sharing a category are written as dict.fromkeys(...) groups
# and spliced in with ** so the insertion order of the keys is unchanged.
# Used with Series.map, so any source missing from this table maps to NaN.
source_to_infection = {
    'Urine': 'Urinary Tract Infections (UTIs)',
    'Ear': 'Ear Infections',
    'Skin': 'Skin Infections',
    'Blood': 'Blood Infections',
    **dict.fromkeys(
        [
            'Bronchus',
            'Sputum',
            'Lungs',
            'Trachea',
            'Respiratory: Other',
            'Bronchiole',
            'Endotracheal aspirate',
            'Nasopharyngeal Aspirate',
            'Transtracheal Aspirate',
            'Nasotracheal Aspirate',
            'Bronchoalveolar lavage',
        ],
        'Respiratory Infections',
    ),
    **dict.fromkeys(
        ['Brain', 'Spinal Cord', 'CSF'],
        'Central Nervous System (CNS) Infections',
    ),
    'Heart': 'Cardiovascular Infections',
    **dict.fromkeys(
        ['Kidney', 'Bladder', 'Ureter', 'Urethra'],
        'Urinary Tract Infections (UTIs)',
    ),
    **dict.fromkeys(
        [
            'Stomach',
            'Gastric Abscess',
            'Peritoneal Fluid',
            'Abdominal Fluid',
            'Pancreas',
            'Gall Bladder',
            'Liver',
            'Spleen',
            'Colon',
        ],
        'Intra-abdominal Infections',
    ),
    **dict.fromkeys(
        ['Wound', 'Decubitus', 'Ulcer', 'Cellulitis', 'Pyoderma Lesion'],
        'Soft Tissue Infections',
    ),
    'Genitourinary Infections': 'Genitourinary Infections',
}

In [None]:
# Add three derived columns to `atlas`, each produced by mapping an existing
# column through a lookup table (values absent from a table become NaN).
# NOTE(review): `countries_by_continent` is not defined in the cells visible
# here — confirm it is defined before this cell runs on a fresh kernel.
for derived_col, raw_col, value_map in (
    ('antibiotics_class', 'Antibiotics', antibiotics_groups),
    ('infection type', 'Source', source_to_infection),
    ('Continents', 'Country', countries_by_continent),
):
    atlas[derived_col] = atlas[raw_col].map(value_map)

In [None]:
# Keep only the rows whose mapped continent is Africa.
in_africa = atlas['Continents'].eq('Africa')
africa_data = atlas.loc[in_africa]

In [None]:
# ESKAPE-E pathogens plus other species of interest.
# Every entry must end with a comma: Python concatenates adjacent string
# literals, so a missing comma silently merges two species into one bogus
# name and neither of them matches in a membership test.
pathogens = [
    'Enterococcus faecium',
    'Staphylococcus aureus',
    'Klebsiella pneumoniae',
    'Acinetobacter baumannii',
    'Pseudomonas aeruginosa',
    'Enterobacter cloacae',
    'Escherichia coli',
    'Streptococcus pneumoniae',
    'Haemophilus influenzae',
    'Neisseria gonorrhoeae',
]

# Narrow the African subset to the species listed in `pathogens`, then write
# the result to disk without the DataFrame index.
is_target_species = africa_data['Species'].isin(pathogens)
africa_data = africa_data[is_target_species]
africa_data.to_csv('atlas_africa.csv', index=False)