In [1]:
import pandas as pd
import matplotlib.pyplot as plt
import seaborn as sns

In [2]:
immr = pd.read_csv('../data/processed/immr_processed_2019.csv')
immr.head(2)

Unnamed: 0,id,immr_code,disease,neon_live_male,child_1_4_live_male,child_5_16_live_male,adult_17_49_live_male,adult_50_69_live_male,adult_ab70_live_male,no_age_live_male,...,neon_dead_female,child_1_4_dead_female,child_5_16_dead_female,adult_17_49_dead_female,adult_50_69_dead_female,adult_ab70_dead_female,no_age_dead_female,total_dead_female,group_index,disease_group
0,1,1,Cholera (A00),0,0,0,0,0,0,0,...,0,0,0,0,0,0,0,0,0,Certain Infectious and Parasitic Diseases
1,2,2,Typhoid and para typhoid fever (A01),5,34,91,145,57,20,0,...,0,0,0,0,0,0,0,0,0,Certain Infectious and Parasitic Diseases


In [3]:
immr['total_live_male'].sum()

3706458

In [4]:
immr['total_male'] = immr['total_live_male'] + immr['total_dead_male']
immr['total_female'] = immr['total_live_female'] + immr['total_dead_female']

In [5]:
total_male_patients_live = immr['total_live_male'].sum()
total_female_patients_live = immr['total_live_female'].sum()

total_male_patients_dead = immr['total_dead_male'].sum()
total_female_patients_dead = immr['total_dead_female'].sum()


all_males = total_male_patients_live + total_male_patients_dead
all_females = total_female_patients_live + total_female_patients_dead

In [6]:
print(f'Total male patients: {all_males}\nTotal Female Patients: {all_females}')

print(f'Ratio between male - female: {all_males / (all_males + all_females)} : {all_females / (all_males + all_females)}')

Total male patients: 3740535
Total Female Patients: 3737325
Ratio between male - female: 0.5002146335983825 : 0.4997853664016176


In [8]:

male_survival_rate = total_male_patients_live /(total_male_patients_live + total_male_patients_dead)
female_survival_rate = total_female_patients_live /(total_female_patients_live + total_female_patients_dead)

print(f'Male survival rate: {male_survival_rate * 100}%\nFemale Survival rate: {female_survival_rate * 100}%')

Male survival rate: 99.0889805870016%
Female Survival rate: 99.33377482557711%


In [9]:
group_sums = immr[['disease_group', 'group_index', 'total_live_male', 'total_dead_male', 'total_live_female', 'total_dead_female']].groupby('disease_group').sum()

In [10]:
group_sums['male_survival_rate'] = group_sums['total_live_male'] / (group_sums['total_live_male'] + group_sums['total_dead_male'])
group_sums['female_survival_rate'] = group_sums['total_live_female'] / (group_sums['total_live_female'] + group_sums['total_dead_female'])
group_sums

Unnamed: 0_level_0,group_index,total_live_male,total_dead_male,total_live_female,total_dead_female,male_survival_rate,female_survival_rate
disease_group,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1
Certain Conditions Originating in the Perinatal Period,90,25497,652,25951,537,0.975066,0.979727
Certain Infectious and Parasitic Diseases,0,280737,3675,237656,3411,0.987079,0.98585
"Congenital Malformation, deformations and chromosomal abnormalities",96,7600,296,5078,283,0.962513,0.947211
Disease of the Blood and Blood-forming Organs and Certain Disorders involving the Imune Mechanism,8,26015,46,27414,66,0.998235,0.997598
Disease of the Circulatory System,152,207743,9567,190764,7592,0.955975,0.961725
Disease of the Digestive System,140,197843,1829,174246,850,0.99084,0.995146
Disease of the Genitourinary System,156,258412,1938,265897,1207,0.992556,0.995481
Disease of the Musculoskeletal and connctive tissue,72,107365,43,97060,59,0.9996,0.999392
Diseases of ear and mastoid process,21,29950,0,36545,0,1.0,1.0
Diseases of the Eye and Adnexa,36,94790,0,93880,0,1.0,1.0


#### most common diseases

In [11]:
#most common diseases
group_sums['total_male'] = group_sums['total_live_male'] + group_sums['total_dead_male']
group_sums['total_female'] = group_sums['total_live_female'] + group_sums['total_dead_female']


for women

In [12]:
most_female_diseases = group_sums.sort_values(by=['total_female'], ascending=False).head(5)[['total_live_female', 'total_dead_female', 'total_female']]
most_female_diseases

Unnamed: 0_level_0,total_live_female,total_dead_female,total_female
disease_group,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1
Others,523442,1921,525363
"Pregnancy, Childbirth and the Puerperium",503768,41,503809
"Injury, Poisoning and Certain Other Consequences of External Causes",492312,901,493213
"Symptems, Signs and Abnormal Clinical and Laboratory findings, not elsewhere classified",381573,327,381900
Diseases of the Respiratory System,309258,4010,313268


In [13]:
group_sums.sort_values(by=['total_dead_female'], ascending=False).head(5)[['total_live_female', 'total_dead_female', 'total_female']]

Unnamed: 0_level_0,total_live_female,total_dead_female,total_female
disease_group,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1
Disease of the Circulatory System,190764,7592,198356
Diseases of the Respiratory System,309258,4010,313268
Certain Infectious and Parasitic Diseases,237656,3411,241067
Neoplasams,88387,2834,91221
Others,523442,1921,525363


In [14]:
group_sums['individual_survival_female'] = group_sums['total_live_female']/(group_sums['total_female'])

In [15]:
group_sums.sort_values(by=['individual_survival_female'], ascending=True).head(5)[['total_live_female', 'total_dead_female', 'total_female', 'individual_survival_female']]

Unnamed: 0_level_0,total_live_female,total_dead_female,total_female,individual_survival_female
disease_group,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1
"Congenital Malformation, deformations and chromosomal abnormalities",5078,283,5361,0.947211
Disease of the Circulatory System,190764,7592,198356,0.961725
Neoplasams,88387,2834,91221,0.968933
Certain Conditions Originating in the Perinatal Period,25951,537,26488,0.979727
Certain Infectious and Parasitic Diseases,237656,3411,241067,0.98585


for men

In [16]:
most_male_diseases = group_sums.sort_values(by=['total_male'], ascending=False).head(5)[['total_live_male', 'total_dead_male', 'total_male']]
most_male_diseases

Unnamed: 0_level_0,total_live_male,total_dead_male,total_male
disease_group,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1
"Injury, Poisoning and Certain Other Consequences of External Causes",872299,2111,874410
Others,561308,3105,564413
"Symptems, Signs and Abnormal Clinical and Laboratory findings, not elsewhere classified",356716,390,357106
Diseases of the Respiratory System,332911,6074,338985
Certain Infectious and Parasitic Diseases,280737,3675,284412


In [17]:
group_sums.sort_values(by=['total_dead_male'], ascending=False).head(5)[['total_live_male', 'total_dead_male', 'total_male']]

Unnamed: 0_level_0,total_live_male,total_dead_male,total_male
disease_group,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1
Disease of the Circulatory System,207743,9567,217310
Diseases of the Respiratory System,332911,6074,338985
Certain Infectious and Parasitic Diseases,280737,3675,284412
Neoplasams,68315,3462,71777
Others,561308,3105,564413


In [18]:
group_sums['individual_survival_male'] = group_sums['total_live_male']/(group_sums['total_male'])

In [19]:
group_sums.sort_values(by=['individual_survival_male'], ascending=True).head(5)[['total_live_male', 'total_dead_male', 'total_male', 'individual_survival_male']]

Unnamed: 0_level_0,total_live_male,total_dead_male,total_male,individual_survival_male
disease_group,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1
Neoplasams,68315,3462,71777,0.951767
Disease of the Circulatory System,207743,9567,217310,0.955975
"Congenital Malformation, deformations and chromosomal abnormalities",7600,296,7896,0.962513
Certain Conditions Originating in the Perinatal Period,25497,652,26149,0.975066
Diseases of the Respiratory System,332911,6074,338985,0.982082


In [52]:
group_sums[group_sums.index == 'Neoplasams '].transpose()

disease_group,Neoplasams
group_index,34.0
total_live_male,68315.0
total_dead_male,3462.0
total_live_female,88387.0
total_dead_female,2834.0
male_survival_rate,0.951767
female_survival_rate,0.968933
total_male,71777.0
total_female,91221.0
individual_survival_female,0.968933


Child diseases

In [32]:
immr['neon_mortality_rate_male'] = immr['neon_dead_male'] / (immr['neon_live_male'] + immr['neon_dead_male'])
immr['child_14_mortality_rate_male'] = immr['child_1_4_dead_male'] / (immr['child_1_4_live_male'] + immr['child_1_4_dead_male'])
immr['child_516_mortality_rate_male'] = immr['child_5_16_dead_male'] / (immr['child_5_16_live_male'] + immr['child_5_16_dead_male'])

immr['neon_mortality_rate_female'] = immr['neon_dead_female'] / (immr['neon_live_female'] + immr['neon_dead_female'])
immr['child_14_mortality_rate_female'] = immr['child_1_4_dead_female'] / (immr['child_1_4_live_female'] + immr['child_1_4_dead_female'])
immr['child_516_mortality_rate_female'] = immr['child_5_16_dead_female'] / (immr['child_5_16_live_female'] + immr['child_5_16_dead_male'])

In [47]:
selected = 'child_516_mortality_rate_male'
immr.sort_values(by=selected, ascending=False)[['immr_code', 'disease', selected]].head(10)

Unnamed: 0,immr_code,disease,child_516_mortality_rate_male
76,59,"Malignant neoplasm of trachea, bronchus and lu...",0.272727
42,28,Rabies (A82),0.25
77,60,Malignant neoplasm of other respiratory and in...,0.25
25,21,Meningococcal infections (A39),0.1
160,132,Heart failure (I50),0.086957
162,134,Cerebroavascular disease (I60-I69),0.054945
26,22,"Septicaemia (A40,A41)",0.044747
91,74,Malignant neoplasm of brain (C71),0.043902
133,105,Intracranial and intraspinal abscess and granu...,0.043478
43,29,Viral encephalitis (includes Japanese Encephal...,0.032258


In [39]:
immr['gender_ratio_admit'] = immr['total_live_male']/immr['total_live_female']
immr['gender_ratio_mortal'] = immr['total_dead_male']/immr['total_dead_female']


What are the most male specific diseases 
!! filtering for inf done with < 1000

In [44]:
immr[immr['gender_ratio_admit'] < 1000].sort_values(by='gender_ratio_admit', ascending=False)[['immr_code', 'disease', 'gender_ratio_admit', 'gender_ratio_mortal']].head(10)

Unnamed: 0,immr_code,disease,gender_ratio_admit,gender_ratio_mortal
123,095,Mental and behavioural disorders due to use of...,18.111111,
75,058,Malignant neoplasm of larnyx (C32),10.243094,15.0
124,096,Mental and behavioural disorders due to other ...,9.752809,
40,026H,Unspecified sexually transmitted disease (A64),8.333333,
190,162,Alcoholic liver disease (K70),7.839506,10.933333
52,038A,Rubella (B06),7.0,
159,131,Cor pulmonale (I27.9),4.924731,1.102564
18,015,Leptospirosis (A27),4.80044,2.8
88,071,Malignant neoplasm of bladder (C67),4.554935,4.75
67,050,"Malignant neoplasm of lip, oral cavity and pha...",4.362053,4.719512


In [45]:
immr[immr['gender_ratio_mortal'] < 1000].sort_values(by='gender_ratio_mortal', ascending=False)[['immr_code', 'disease', 'gender_ratio_admit', 'gender_ratio_mortal']].head(20)

Unnamed: 0,immr_code,disease,gender_ratio_admit,gender_ratio_mortal
75,058,Malignant neoplasm of larnyx (C32),10.243094,15.0
266,236,Toxic effects of other pesticides (T60.1-T60.9),1.51332,14.333333
190,162,Alcoholic liver disease (K70),7.839506,10.933333
49,035,Varicella (Chickenpox) (B01),1.77894,8.0
177,149,"Bronchitis, emphysema and other chronic obstru...",4.242546,7.668874
265,235,Toxic effects of organophosphate and carbamate...,1.695253,5.05
19,016,Leprosy (A30),2.993007,5.0
88,071,Malignant neoplasm of bladder (C67),4.554935,4.75
67,050,"Malignant neoplasm of lip, oral cavity and pha...",4.362053,4.719512
79,062,Melanoma and other malignant neoplasm of skin ...,1.4,4.5
