In [2]:
import pandas as pd
import random
import datetime
import string
import pickle

In [3]:
# hospital addresses
addr = open('Data/addresses.txt')
addr_list = list(str(addr.read()).splitlines())
addr.close()

# hospital names
h_name = open('Data/hospital_names.txt')
hname_list = list(str(h_name.read()).splitlines())
h_name.close()

# hospital types
h_types = [
    'Acute care',
    'Addiction/substance abuse treatment',
    'Long-Term Care Hospital',
    'Psychiatric Hospital',
    'Rehabilitation Hospital',
    'Multi-specialization Hospital'
]

# doctor names
d_name = open('Data/doctor_names.txt')
dname_list = list(str(d_name.read()).splitlines())
d_name.close()

# doctor's specialization
d_type = open('Data/doctor_types.txt')
dtype_list = list(str(d_type.read()).splitlines())
d_type.close()

# phone numbers
ph_num = open('Data/contact_numbers.txt')
num_list = list(str(ph_num.read()).split('\n\n'))
ph_num.close()

# patient names
p_name = open('Data/patient_names.txt')
pname_list = list(str(p_name.read()).splitlines())
p_name.close()

# occupations
occ = open('Data/occupations.txt')
occ_list = list(str(occ.read()).splitlines())
occ.close()

# complaints
# comp = open('/home/sarthak/Desktop/Hackathon/complaints.txt')
# comp_list = list(str(comp.read()).splitlines())
# comp.close()

# chronic
chronic = open('Data/chronic_diseases.txt')
chronic_list = list(str(chronic.read()).splitlines())
chronic.close()

# disease_dict
with open('Data/disease_dict.pkl', 'rb') as f:
    disease_dict = pickle.load(f)

# surgeries
surg = open('Data/surgery_types.txt')
surg_list = list(str(surg.read()).splitlines())
surg.close()

# medication
med_df = pd.read_csv('Data/disease-medcation.csv')
med_df = med_df.dropna()

# auxiliary treatment
with open('Data/aux_dict.pkl', 'rb') as f:
    aux_dict = pickle.load(f)

In [4]:
# missing data
aux_dict['Heart attack'] = 'Medicines and tonics'
aux_dict['Allergy'] = 'Medicines and tonics'

## Hospital Table

- **h_id**: Contains a unique ID for the hospital
- **h_rno**: Contains hospital registeration number (might be redundant)
- **h_type/specialization**: Specialization of a hospital, should be 'none' if no specialization present
- **h_name**: Hospital name
- **no_doctors**: Number of doctors/surgeons present in the hospital
- **no_staff**: Number of staff present in the hospital
- **no_icus**: Number of ICUs present in the hospital
- **address**: Address of the hospital

In [5]:
hospital_dict = {
    'h_id':[],#primary key
    'h_rno':[],
    'h_name':[],
    'h_type':[],
    'no_doctors':[],
    'no_staff':[],
    'no_icus':[],
    'address':[]
}

hospital_df = pd.DataFrame(hospital_dict)





def random_long_num():
    return (''.join(random.SystemRandom().choice(string.ascii_letters) for _ in range(3))).upper()


for i in range(51):
    h_id = random.randint(1000,9000)
    h_rno = str(random_long_num()) + str(random.randint(100000,9999999))
    h_name = random.choice(hname_list)
    h_type = random.choice(h_types)
    no_doctors = random.randint(1,50)
    no_staff = random.randint(3,100)
    no_icus = random.randint(0,50)
    address = random.choice(addr_list)
    
    df_tmp = pd.DataFrame([(h_id,h_rno,h_name,h_type,no_doctors,no_staff,no_icus,address)],
                          columns=list(hospital_df.columns)
                         )
    hospital_df = hospital_df.append(df_tmp)
    
    
hospital_df = hospital_df.reset_index()
hospital_df = hospital_df.drop('index',axis=1)

In [6]:
hospital_df

Unnamed: 0,h_id,h_rno,h_name,h_type,no_doctors,no_staff,no_icus,address
0,1115.0,NFS7009675,Sacred Heart Clinic,Multi-specialization Hospital,3.0,36.0,29.0,"495 Flatbush Ave, Hartford CT 6106"
1,7691.0,HFK9745756,Greenlawn Medical Clinic,Addiction/substance abuse treatment,6.0,98.0,28.0,"515 Sawmill Road, West Haven CT 6516"
2,4409.0,WGJ7570303,Featherfall General Hospital,Rehabilitation Hospital,46.0,30.0,47.0,"8551 Whitfield Ave, Leeds AL 35094"
3,4250.0,QIV8187533,Green Hill Hospital,Multi-specialization Hospital,41.0,71.0,39.0,"200 Dutch Meadows Ln, Glenville NY 12302"
4,7366.0,VAX8892553,Silverwood Community Hospital,Long-Term Care Hospital,33.0,57.0,4.0,"495 Flatbush Ave, Hartford CT 6106"
5,1222.0,JOX3551909,Diamond Grove Community Hospital,Multi-specialization Hospital,32.0,16.0,50.0,"3371 S Alabama Ave, Monroeville AL 36460"
6,1545.0,NUU9849788,Repose Community Hospital,Addiction/substance abuse treatment,26.0,50.0,41.0,"2 Gannett Dr, Johnson City NY 13790"
7,8938.0,JBP5868131,West Valley General Hospital,Multi-specialization Hospital,41.0,7.0,21.0,"13858 Rt 31 W, Albion NY 14411"
8,5015.0,LEE1543243,Hope Valley Medical Center,Acute care,17.0,64.0,40.0,"135 Fairgrounds Memorial Pkwy, Ithaca NY 14850"
9,1439.0,TKP5353234,Rose Valley Hospital,Psychiatric Hospital,4.0,18.0,26.0,"3300 South Oates Street, Dothan AL 36301"


## Doctor Table

- **d_id**: Doctor's unique ID
- **d_name**: Doctor's name
- **specialization**: Doctor's specialization
- **office_no**: Office contact number of the doctor
- **mail_id**: Mail ID of the doctor
- **active_cases**: Number of active cases the doctor's working on

In [7]:
doctor_dict = {
    'h_id':[],#Forigen key
    'd_id':[],#Primary key
    'd_name':[],
    'specialization':[],
    'office_no':[],
    'mail_id':[],
    # 'active_cases':[], removed
    'timings':[],
}

doctor_df = pd.DataFrame(doctor_dict)




def random_time():
    beg = datetime.datetime(2020,12,1,00,00)
    curr = beg + datetime.timedelta(hours=random.randint(6,9)) + datetime.timedelta(minutes=random.choice([0,30]))
    return f'{curr.strftime("%H:%M")} - {(curr + datetime.timedelta(hours=1)).strftime("%H:%M")}' 

for i in range(51):
    h_id = hospital_df['h_id'][i]
    d_id = random.randint(1,30)
    d_name = random.choice(dname_list)
    specialization = random.choice(dtype_list)
    office_no = random.choice(num_list)
    mail_id = d_name.lower().replace(' ','_') + '@gmail.com' 
    timings = random_time()
    
    df_tmp = pd.DataFrame([(h_id,d_id,d_name,specialization,office_no,mail_id,timings)],
                         columns=list(doctor_df.columns))
    doctor_df = doctor_df.append(df_tmp)
    
    
doctor_df = doctor_df.reset_index()
doctor_df = doctor_df.drop('index',axis=1)

In [8]:
doctor_df

Unnamed: 0,h_id,d_id,d_name,specialization,office_no,mail_id,timings
0,1115.0,4.0,Dr. Howard Hrobsky,Pulmonologist,+1 206-874-9932,dr._howard_hrobsky@gmail.com,06:00 - 07:00
1,7691.0,29.0,Dr. Enrique Reimers,Hematologist,+1 332-800-9193,dr._enrique_reimers@gmail.com,09:00 - 10:00
2,4409.0,9.0,Dr. Alma Vopava,Dermatologist,+1 219-370-6752,dr._alma_vopava@gmail.com,06:30 - 07:30
3,4250.0,8.0,Dr. Delaney Garriga,Colon and Rectal Surgeon,+1 305-722-8372,dr._delaney_garriga@gmail.com,06:30 - 07:30
4,7366.0,2.0,Dr. Abraham Degooyer,Geriatric Medicine Specialist,+1 229-747-8219,dr._abraham_degooyer@gmail.com,08:00 - 09:00
5,1222.0,18.0,Dr. Skylar Schoener,Allergist/Immunologist,+1 423-734-0219,dr._skylar_schoener@gmail.com,08:30 - 09:30
6,1545.0,6.0,Dr. Cade Stokley,Osteopath,+1 310-797-9392,dr._cade_stokley@gmail.com,06:00 - 07:00
7,8938.0,28.0,Dr. Leroy Rabel,Radiologist,+1 310-998-1883,dr._leroy_rabel@gmail.com,08:00 - 09:00
8,5015.0,3.0,Dr. Julius Lifschitz,Physiatrist,+1 225-357-9127,dr._julius_lifschitz@gmail.com,09:30 - 10:30
9,1439.0,24.0,Dr. Miguel Woodland,Endocrinologist,+1 240-428-0729,dr._miguel_woodland@gmail.com,08:30 - 09:30


## Patient Personal Info Table

- **p_id**: Patient's ID
- **p_name**: Patient's name
- **dob**: DOB of the patient
- **dov**: Date of visit of the patient
- **gender**: Patient's gender
- **marital_status**: Marital status of the patient
- **occupation**: Current occupation of the patient
- **address**: Current address of the patient
- **contact_num**: Contact number of the patient
- **emergency_num**: Emergency contact number
- **adhaar**: Patient's adhaar number

In [9]:
patient_info_dict = {
   'd_id':[],#Foriegn key
    'p_id':[],#Primary
    'p_name':[],
    'dob':[],
    'dov':[],
    'gender':[],
    'marital_status':[],
    'occupation':[],
    'address':[],
    'contact_num':[],
    'emergency_num':[],
    # 'adhaar':[]
}

patient_info_df = pd.DataFrame(patient_info_dict)

from dateutil.relativedelta import relativedelta

def random_date(dtype):
    
    if dtype == 'dob':
        start = datetime.date(1920,1,1)
        y_inc = random.randint(10,100)
        
    else:
        start = datetime.date(1990,1,1)
        y_inc = random.randint(0,30)
        
    m_inc = random.randint(0,12)
    d_inc = random.randint(0,30)
        
    beg = start
    
    curr = beg + relativedelta(years=+y_inc) + relativedelta(months=+m_inc) + relativedelta(days=+d_inc)
    return curr.strftime("%y/%m/%d")

for i in range(51):
    d_id = doctor_df['d_id'][i]
    p_id = random.randint(1,999)
    p_name = random.choice(pname_list)
    dob = random_date('dob')
    dov = random_date('dov')
    gender = random.choice(['Male','Female'])
    marital_status = random.choice(['Married', 'Single', 'Divorced'])
    occupation = random.choice(occ_list)
    address = random.choice(addr_list)
    contact_num = random.choice(num_list)
    emergency_num = random.choice(num_list)
    # adhaar = str(random.randint(100000000000,999999999999))
    
    df_tmp = pd.DataFrame([(d_id,p_id,p_name,dob,dov,gender,marital_status,occupation,address,contact_num,emergency_num)],
                         columns=list(patient_info_df.columns))
    patient_info_df = patient_info_df.append(df_tmp)
    
    
patient_info_df = patient_info_df.reset_index()
patient_info_df= patient_info_df.drop('index',axis=1)

In [10]:
patient_info_df

Unnamed: 0,d_id,p_id,p_name,dob,dov,gender,marital_status,occupation,address,contact_num,emergency_num
0,4.0,420.0,Esmae Forrest,91/01/30,12/07/01,Male,Single,Radio & TV Newscaster,"1916 Center Point Rd, Center Point AL 35215",+1 208-687-4825,+1 201-636-4578
1,29.0,856.0,Sherman Hammond,92/01/12,96/01/07,Female,Married,Technological Espionage Intelligence Agent,"1501 Hwy 14 East, Selma AL 36703",+1 615-777-3018,+1 318-925-9688
2,9.0,42.0,Valeria Cordova,06/03/02,20/06/29,Male,Married,Forest Fire Inspector,"1501 Skyland Blvd E, Tuscaloosa AL 35405",+1 210-592-8941,+1 220-562-5024
3,8.0,36.0,Jerome Perkins,94/01/04,92/10/25,Male,Married,Photographic Process Workers,"1549 Rt 9, Halfmoon NY 12065",+1 215-654-9753,+1 203-554-1138
4,2.0,108.0,Alyson Mitchell,41/07/19,12/12/29,Female,Divorced,Cook (Restaurant),"141 Washington Ave Extension, Albany NY 12205",+1 281-404-6369,+1 225-589-0277
5,18.0,127.0,Lola Mcclain,10/11/09,90/03/06,Female,Married,Crop Workers Supervisor,"973 Gilbert Ferry Road Se, Attalla AL 35954",+1 202-830-6044,+1 443-499-6196
6,6.0,695.0,Jeff Levy,33/12/15,09/01/17,Female,Single,Zoologist,"601 Frank Stottile Blvd, Kingston NY 12401",+1 404-899-9061,+1 209-983-3611
7,28.0,993.0,Chasity Phillips,54/08/02,91/08/25,Male,Married,Tax Accountant,"4206 N College Ave, Jackson AL 36545",+1 229-747-8219,+1 714-952-0465
8,3.0,281.0,Fletcher Brooks,83/12/02,97/11/04,Female,Single,Technical Publications Writer,"2200 Sparkman Drive, Huntsville AL 35810",+1 201-636-4578,+1 518-726-0915
9,24.0,135.0,Gail Floyd,99/01/22,16/03/27,Male,Divorced,Newspaper/Magazines Writer,"6265 Brockport Spencerport Rd, Brockport NY 14420",+1 307-292-2852,+1 303-427-8734


## Pateint Medical Info

- **id**: Patient ID
- **comp_id**: Unique complaint ID
- **complaint**: Patient's main complaint
- **chronic**: Any chronic diseases
- **hist_cond**: Any disease/condition that runs in the family
- **habits**: Any habits, such as smoking, drinking, et cetera
- **weight**: Patient's weight
- **surgeries**: Past surgeries
- **allergies**: Known allergies

In [11]:
patient_med_dict = {
    'P_id': [],#Forignkey
    #'comp_id':[], remove this
    'complaint':[],
    'chronic':[],
    'fam_hist':[],
    'habits':[],
    'weight':[],
    'surgeries':[],
    'allergies':[]
}

patient_med_df = pd.DataFrame(patient_med_dict)

allerg_list = [None, 'Milk','Eggs','Fish','Shellfish','Tree nuts','Peanuts','Wheat','Soybeans', None]
habit_list = [None, None, 'Smoking', 'Drinking', 'Substance', 'Marijuana', 'Other']


complaints = []
for i in disease_dict.values():
    for j in i:
        complaints.append(j)

        

for i in range(51):
    p_id = patient_info_df['p_id'][i]
    complaint = random.choice(complaints)
    chronic = random.choice(chronic_list)
    fam_hist = random.choice(chronic_list)
    habits = random.choice(habit_list)
    weight = random.randint(10,150)
    surgeries = random.choice(surg_list)
    allergies = random.choice(allerg_list)
    
    df_tmp = pd.DataFrame([(p_id,complaint,chronic,fam_hist,habits,weight,surgeries,allergies)],
                         columns=list(patient_med_df.columns))
    patient_med_df = patient_med_df.append(df_tmp)
    
    
patient_med_df = patient_med_df.reset_index()
patient_med_df = patient_med_df.drop('index',axis=1)

In [12]:
patient_med_df

Unnamed: 0,P_id,complaint,chronic,fam_hist,habits,weight,surgeries,allergies
0,420.0,skin_rash,Atherosclerosis,Rheumatoid arthritis,Drinking,52.0,Prostatectomy,Soybeans
1,856.0,painful_walking,Asthma,Crohn's disease,Other,48.0,Tonsillectomy,Shellfish
2,42.0,high_fever,Atherosclerosis,Dysrhythmia (irregular heartbeat),,12.0,Partial colectomy,Shellfish
3,36.0,high_fever,Bipolar mood disease,Chronic kidney disease,Substance,34.0,Hysterectomy,Fish
4,108.0,stomach_pain,Glaucoma,Rheumatoid arthritis,Marijuana,28.0,Tonsillectomy,Milk
5,127.0,abdominal_pain,Hypothyroidism (inactive thyroid gland),Hypertension (high blood pressure),Marijuana,113.0,Appendectomy,
6,695.0,high_fever,Multiple sclerosis,Schizophrenia,Drinking,118.0,Prostatectomy,Wheat
7,993.0,nausea,Rheumatoid arthritis,Diabetes mellitus (type 1 and type 2),,132.0,Coronary artery bypass,
8,281.0,diarrhoea,Systemic lupus erythematosis,Coronary artery disease,Marijuana,35.0,Cesarean section,
9,135.0,muscle_weakness,Chronic obstructive pulmonary disease,Systemic lupus erythematosis,Other,83.0,Prostatectomy,Peanuts


## Patient Diagnosis

- **comp_id**: Complaint ID
- **diag_id**: Diagnosis ID
- **diag_date**: Diagnosis date
- **diagnosis**: Diagnosis of the patient
- **lab_test_1_id**: Lab test 1 ID (does not require picture of reports)
- **lab_test_2_id**: Lab test 2 ID (requires picture of report)
- **pres_id**: Prescription ID for the diagnosis
- **d_id**: ID of the doctor who diagnosed
- **surg_req**: Surgery required or not

In [13]:
diagnosis_dict = {
    'P_Id':[],#foriegn key
    #'comp_id': [],remove this
    #'diag_id':[],remove
    'diag_date':[],
    'diagnosis':[],
#     'lab_test_1_id':[],
#     'lab_test_2_id':[],
    #'pres_id':[],remove
    #'d_id':[],Remove
    'surg_req':[],
}

diagnosis_df = pd.DataFrame(diagnosis_dict)



for i in range(51):
    p_id = patient_info_df['p_id'][i]
    diag_date = patient_info_df['dov'][i]
    diagnosis = random.choice(list(disease_dict.keys()))
    surg_req = random.choice(['Yes','No'])
    
    df_tmp = pd.DataFrame([(p_id,diag_date,diagnosis,surg_req)],
                         columns=list(diagnosis_df.columns))
    diagnosis_df = diagnosis_df.append(df_tmp)
    
    
diagnosis_df = diagnosis_df.reset_index()
diagnosis_df = diagnosis_df.drop('index',axis=1)

In [14]:
diagnosis_df

Unnamed: 0,P_Id,diag_date,diagnosis,surg_req
0,420.0,12/07/01,Drug Reaction,Yes
1,856.0,96/01/07,Chronic cholestasis,No
2,42.0,20/06/29,Dimorphic hemmorhoids(piles),Yes
3,36.0,92/10/25,Common Cold,Yes
4,108.0,12/12/29,Peptic ulcer diseae,No
5,127.0,90/03/06,Osteoarthristis,No
6,695.0,09/01/17,AIDS,Yes
7,993.0,91/08/25,Hepatitis C,Yes
8,281.0,97/11/04,Hypothyroidism,Yes
9,135.0,16/03/27,Typhoid,No


## Prescription

- **pres_id**: Prescription ID
- **d_id**: Doctor's ID
- **p_id**: Patient's ID
- **mediacation**: [name] - [dosage] - [interval] (can be multiple)
- **aux_treatment**: Auxiliary treatmnet
- **follow_up**: Follow up date (date)
- **referral**: Referrals, if any

In [15]:
prescription_dict = {
    'pres_id': [],
    'd_id':[],#Foriegn key
    'p_id':[],
    'medication':[],
    'aux_treatment':[],
    'follow_up':[],
    'referrals':[]
}

prescription_df = pd.DataFrame(prescription_dict)


med_list = []
for i in diagnosis_df['diagnosis']:
    tmp_list = list(med_df[med_df['DISEASE'] == i]['Medication'])
    if len(tmp_list) == 0:
        med_list.append('tablets and a syrup')
        continue
    med_list.append(tmp_list[0])



for i in range(51):
    pres_id = random.randint(20,999)
    d_id = doctor_df['d_id'][i]
    p_id = patient_info_df['p_id'][i]
    medication = med_list[i]
    aux_treatment = str(aux_dict[diagnosis_df['diagnosis'][i]])
    follow_up = f'{random.randint(10,30)} days'
    referrals = random.choice(dname_list)
    
    df_tmp = pd.DataFrame([(pres_id,d_id,p_id,medication,aux_treatment,follow_up,referrals)],
                         columns=list(prescription_df.columns))
    prescription_df = prescription_df.append(df_tmp)
    
    
prescription_df = prescription_df.reset_index()
prescription_df = prescription_df.drop('index', axis=1)

In [16]:
prescription_df

Unnamed: 0,pres_id,d_id,p_id,medication,aux_treatment,follow_up,referrals
0,975.0,4.0,420.0,prednisone,"['follow up', 'consult nearest hospital', 'sto...",12 days,Dr. Summer Muhs
1,110.0,29.0,856.0,tablets and a syrup,"['eat healthy', 'consult doctor', 'cold baths']",23 days,Dr. Blake Henion
2,706.0,9.0,42.0,tablets and a syrup,"['warm bath with epsom salt', 'avoid fatty spi...",17 days,Dr. Brycen Fannell
3,401.0,8.0,36.0,Augmentin,"['take vapour', 'keep fever in check', 'avoid ...",27 days,Dr. Wesley Soltes
4,975.0,2.0,108.0,tablets and a syrup,"['consume probiotic food', 'limit alcohol', 'a...",19 days,Dr. Karter Meinerding
5,359.0,18.0,127.0,tablets and a syrup,"['acetaminophen', 'consult nearest hospital', ...",16 days,Dr. Alberto Nizo
6,959.0,6.0,695.0,clindamycin HCl,"['avoid open cuts', 'consult doctor', 'follow ...",13 days,Dr. Andrew Camps
7,647.0,28.0,993.0,interferon alfa-2b Solution,"['medication', 'vaccination', 'Consult nearest...",15 days,Dr. Andrew Camps
8,864.0,3.0,281.0,Synthroid,"['eat healthy', 'exercise', 'get proper sleep']",23 days,Dr. Leo Adhami
9,863.0,24.0,135.0,doxycycline hyclate,"['antiboitic therapy', 'consult doctor', 'medi...",14 days,Dr. Erick Rengifo


## Lab Tests - 1

- **test_1_id**: Lab test 1 ID
- **bl_test**: Blood test results
- **micro_test**: Microbiology test results
- **cyt_test**: Cytology test results
- **hi_p_test**: Histo-pathology test results
- **cyg_test**: Cytogenetics test results
- **ur_test**: Urine test results

In [17]:
lab_test_1_dict = {
    'p_id':[],#Forigen key
    #'test_1_id':[],remove
    'bl_test':[],
    'micro_test':[],
    'cyt_test':[],
    'hl_p_test':[],
    'cyg_test':[],
    'ur_test':[]
}

lab_test_1_df = pd.DataFrame(lab_test_1_dict)


bl_results = ['Low WBC count','Low RBC count','Normal']
micro_results = ['Normal']
cyt_results = ['Normal']
hi_p_results = ['Normal']
cyg_results = ['Normal']
ur_results = ['Normal']




for i in range(51):
    p_id = patient_info_df['p_id'][i]
    bl_test = random.choice(bl_results)
    micro_test = random.choice(micro_results)
    cyt_test = random.choice(cyt_results)
    hi_p_test = random.choice(hi_p_results)
    cyg_test = random.choice(cyg_results)
    ur_test = random.choice(ur_results)
    
    df_tmp = pd.DataFrame([(p_id,bl_test,micro_test,cyt_test,hi_p_test,cyg_test,ur_test)],
                         columns=list(lab_test_1_df.columns))
    lab_test_1_df = lab_test_1_df.append(df_tmp)
    
    
lab_test_1_df = lab_test_1_df.reset_index()
lab_test_1_df = lab_test_1_df.drop('index',axis=1)

In [18]:
lab_test_1_df

Unnamed: 0,p_id,bl_test,micro_test,cyt_test,hl_p_test,cyg_test,ur_test
0,420.0,Low RBC count,Normal,Normal,Normal,Normal,Normal
1,856.0,Low RBC count,Normal,Normal,Normal,Normal,Normal
2,42.0,Low WBC count,Normal,Normal,Normal,Normal,Normal
3,36.0,Low RBC count,Normal,Normal,Normal,Normal,Normal
4,108.0,Normal,Normal,Normal,Normal,Normal,Normal
5,127.0,Normal,Normal,Normal,Normal,Normal,Normal
6,695.0,Low WBC count,Normal,Normal,Normal,Normal,Normal
7,993.0,Normal,Normal,Normal,Normal,Normal,Normal
8,281.0,Normal,Normal,Normal,Normal,Normal,Normal
9,135.0,Low WBC count,Normal,Normal,Normal,Normal,Normal


## Lab Tests - 2

- **test_2_id**: Test ID
- **xray_results**: [img] report of X-Ray scan
- **mri_results**: [img] report if MRI scan
- **ct_results**: [img] report of CT scan
- **us_results**: [img] report of Ultra Sound scan

In [19]:
# INCOMPLETE

lab_test_2_dict = {
    'p_id':[],#Forigen key
    #'test_2_id':[],Remove
    'xray_results':[],
    'mri_results':[],
    'ct_results':[],
    'us_results':[]
}

lab_test_2_df = pd.DataFrame(lab_test_2_dict)