In [1]:
# Import SQL Alchemy
from sqlalchemy import create_engine
import pandas as pd
# Import and establish Base for which classes will be constructed 
from sqlalchemy.ext.declarative import declarative_base
Base = declarative_base()
from sqlalchemy.ext.automap import automap_base
from sqlalchemy.orm import Session
from sqlalchemy import create_engine, func
from sqlalchemy import create_engine, inspect
from config import username, password

# Import modules to declare columns and column data types
from sqlalchemy import Column, Integer, String, Float

In [2]:
# Create a connection to a SQLite database

engine = create_engine(f'postgresql://{username}:{password}@localhost:5432/ETL')

In [3]:
conn = engine.connect()

In [4]:
total_data = pd.read_sql("SELECT * FROM total", conn)
cancer_data = pd.read_sql("SELECT * FROM cancer", conn)
cerebro_data = pd.read_sql("SELECT * FROM cerebrovascular_disease", conn)
clrd_data = pd.read_sql("SELECT * FROM chronic_lower_respiratory_disease", conn)
dementia_data = pd.read_sql("SELECT * FROM dementia", conn)
diabetes_data = pd.read_sql("SELECT * FROM diabetes", conn)
heart_data = pd.read_sql("SELECT * FROM heart_disease", conn)
pneumonia_data = pd.read_sql("SELECT * FROM pneumonia", conn)
respiratory_data = pd.read_sql("SELECT * FROM respiratory_disease", conn)

In [5]:
total_data['COVID-19 new infections'] = total_data['COVID-19 new infections'].fillna(0).astype(int)
total_data.head()

Unnamed: 0,date,2015-19 range,COVID-19 new infections,2015-19 average deaths,2020-21 deaths
0,05-Jan-20,2452|2573,0,2498,2498
1,12-Jan-20,2369|2601,0,2490,2511
2,19-Jan-20,2368|2607,0,2465,2501
3,26-Jan-20,2328|2565,4,2446,2597
4,02-Feb-20,2270|2550,8,2451,2510


In [6]:
# dropping redundant columns
new_total_data = total_data.drop(['COVID-19 new infections'], axis=1)

#cleaning total_data table
#adding new columns of total and percent change
new_total_data['total change'] = new_total_data['2020-21 deaths'] - new_total_data['2015-19 average deaths']
new_total_data['percent total change'] = (new_total_data['2020-21 deaths'] / new_total_data['2015-19 average deaths']) * 100 - 100
new_total_data = new_total_data.round(2)

#renaming columns for future joins
new_total_data = new_total_data.rename({'2015-19 average deaths': '2015-19 avg total deaths',
                               '2020-21 deaths': '2020-21 total deaths'}, axis=1)

new_total_data.head()

Unnamed: 0,date,2015-19 range,2015-19 avg total deaths,2020-21 total deaths,total change,percent total change
0,05-Jan-20,2452|2573,2498,2498,0,0.0
1,12-Jan-20,2369|2601,2490,2511,21,0.84
2,19-Jan-20,2368|2607,2465,2501,36,1.46
3,26-Jan-20,2328|2565,2446,2597,151,6.17
4,02-Feb-20,2270|2550,2451,2510,59,2.41


In [7]:
#cleaning total_data table
#adding new columns of total and percent change
cancer_data['total change'] = cancer_data['2020-21 deaths'] - cancer_data['2015-19 average deaths']
cancer_data['percent total change'] = (cancer_data['2020-21 deaths'] / cancer_data['2015-19 average deaths']) * 100 - 100
cancer_data = cancer_data.round(2)

#renaming columns for future joins
cancer_data = cancer_data.rename({'2015-19 average deaths': '2015-19 avg cancer deaths',
                               '2020-21 deaths': '2020-21 cancer deaths'}, axis=1)

cancer_data.head()

Unnamed: 0,date,2015-19 range,2015-19 avg cancer deaths,2020-21 cancer deaths,total change,percent total change
0,05-Jan-20,847|906,868,849,-19,-2.19
1,12-Jan-20,817|917,869,899,30,3.45
2,19-Jan-20,853|915,874,912,38,4.35
3,26-Jan-20,806|942,870,931,61,7.01
4,02-Feb-20,762|933,864,830,-34,-3.94


In [8]:
#cleaning total_data table
#adding new columns of total and percent change
cerebro_data['total change'] = cerebro_data['2020-21 deaths'] - cerebro_data['2015-19 average deaths']
cerebro_data['percent total change'] = (cerebro_data['2020-21 deaths'] / cerebro_data['2015-19 average deaths']) * 100 - 100
cerebro_data = cerebro_data.round(2)

#renaming columns for future joins
cerebro_data = cerebro_data.rename({'2015-19 average deaths': '2015-19 cerebrovascular disease deaths',
                               '2020-21 deaths': '2020-21 cerebrovascular disease deaths'}, axis=1)

cerebro_data.head()

Unnamed: 0,date,2015-19 range,2015-19 cerebrovascular disease deaths,2020-21 cerebrovascular disease deaths,total change,percent total change
0,05-Jan-20,159|200,182,139,-43,-23.63
1,12-Jan-20,162|190,178,166,-12,-6.74
2,19-Jan-20,144|179,167,141,-26,-15.57
3,26-Jan-20,165|203,176,159,-17,-9.66
4,02-Feb-20,156|175,168,162,-6,-3.57


In [9]:
#cleaning total_data table
#adding new columns of total and percent change
clrd_data['total change'] = clrd_data['2020-21 deaths'] - clrd_data['2015-19 average deaths']
clrd_data['percent total change'] = (clrd_data['2020-21 deaths'] / clrd_data['2015-19 average deaths']) * 100 - 100
clrd_data = clrd_data.round(2)

#renaming columns for future joins
clrd_data = clrd_data.rename({'2015-19 average deaths': '2015-19 avg chronic lower respiratory disease deaths',
                               '2020-21 deaths': '2020-21 chronic lower respiratory disease deaths'}, axis=1)

clrd_data.head()

Unnamed: 0,date,2015-19 range,2015-19 avg chronic lower respiratory disease deaths,2020-21 chronic lower respiratory disease deaths,total change,percent total change
0,05-Jan-20,117|157,133,127,-6,-4.51
1,12-Jan-20,110|144,124,145,21,16.94
2,19-Jan-20,104|138,118,120,2,1.69
3,26-Jan-20,113|141,126,132,6,4.76
4,02-Feb-20,114|134,125,134,9,7.2


In [10]:
#cleaning total_data table
#adding new columns of total and percent change
dementia_data['total change'] = dementia_data['2020-21 deaths'] - dementia_data['2015-19 average deaths']
dementia_data['percent total change'] = (dementia_data['2020-21 deaths'] / dementia_data['2015-19 average deaths']) * 100 - 100
dementia_data = dementia_data.round(2)

#renaming columns for future joins
dementia_data = dementia_data.rename({'2015-19 average deaths': '2015-19 avg dementia deaths',
                               '2020-21 deaths': '2020-21 dementia deaths'}, axis=1)

dementia_data.head()

Unnamed: 0,date,2015-19 range,2015-19 avg dementia deaths,2020-21 dementia deaths,total change,percent total change
0,05-Jan-20,217|256,232,255,23,9.91
1,12-Jan-20,208|240,224,265,41,18.3
2,19-Jan-20,206|237,220,257,37,16.82
3,26-Jan-20,186|247,218,248,30,13.76
4,02-Feb-20,196|234,220,276,56,25.45


In [11]:
#cleaning total_data table
#adding new columns of total and percent change
diabetes_data['total change'] = diabetes_data['2020-21 deaths'] - diabetes_data['2015-19 average deaths']
diabetes_data['percent total change'] = (diabetes_data['2020-21 deaths'] / diabetes_data['2015-19 average deaths']) * 100 - 100
diabetes_data = diabetes_data.round(2)

#renaming columns for future joins
diabetes_data = diabetes_data.rename({'2015-19 average deaths': '2015-19 avg diabetes deaths',
                               '2020-21 deaths': '2020-21 diabetes deaths'}, axis=1)

diabetes_data.head()

Unnamed: 0,date,2015-19 range,2015-19 avg diabetes deaths,2020-21 diabetes deaths,total change,percent total change
0,05-Jan-20,66|78,71,86,15,21.13
1,12-Jan-20,69|79,74,71,-3,-4.05
2,19-Jan-20,74|97,83,71,-12,-14.46
3,26-Jan-20,62|99,80,77,-3,-3.75
4,02-Feb-20,63|88,78,80,2,2.56


In [12]:
#cleaning total_data table
#adding new columns of total and percent change
heart_data['total change'] = heart_data['2020-21 deaths'] - heart_data['2015-19 average deaths']
heart_data['percent total change'] = (heart_data['2020-21 deaths'] / heart_data['2015-19 average deaths']) * 100 - 100
heart_data = heart_data.round(2)

#renaming columns for future joins
heart_data = heart_data.rename({'2015-19 average deaths': '2015-19 avg heart disease deaths',
                               '2020-21 deaths': '2020-21 heart disease deaths'}, axis=1)

heart_data.head()

Unnamed: 0,date,2015-19 range,2015-19 avg heart disease deaths,2020-21 heart disease deaths,total change,percent total change
0,05-Jan-20,245|291,269,215,-54,-20.07
1,12-Jan-20,246|272,258,218,-40,-15.5
2,19-Jan-20,244|304,272,234,-38,-13.97
3,26-Jan-20,210|271,245,244,-1,-0.41
4,02-Feb-20,257|276,267,235,-32,-11.99


In [13]:
#cleaning total_data table
#adding new columns of total and percent change
pneumonia_data['total change'] = pneumonia_data['2020-21 deaths'] - pneumonia_data['2015-19 average deaths']
pneumonia_data['percent total change'] = (pneumonia_data['2020-21 deaths'] / pneumonia_data['2015-19 average deaths']) * 100 - 100
pneumonia_data = pneumonia_data.round(2)

#renaming columns for future joins
pneumonia_data = pneumonia_data.rename({'2015-19 average deaths': '2015-19 avg pneumonia deaths',
                               '2020-21 deaths': '2020-21 pneumonia deaths'}, axis=1)

pneumonia_data.head()

Unnamed: 0,date,2015-19 range,2015-19 avg pneumonia deaths,2020-21 pneumonia deaths,total change,percent total change
0,05-Jan-20,37|58,45,42,-3,-6.67
1,12-Jan-20,37|49,42,40,-2,-4.76
2,19-Jan-20,33|44,37,37,0,0.0
3,26-Jan-20,29|40,35,44,9,25.71
4,02-Feb-20,31|50,37,31,-6,-16.22


In [14]:
#cleaning total_data table
#adding new columns of total and percent change
respiratory_data['total change'] = respiratory_data['2020-21 deaths'] - respiratory_data['2015-19 average deaths']
respiratory_data['percent total change'] = (respiratory_data['2020-21 deaths'] / respiratory_data['2015-19 average deaths']) * 100 - 100
respiratory_data = respiratory_data.round(2)

#renaming columns for future joins
respiratory_data = respiratory_data.rename({'2015-19 average deaths': '2015-19 avg respiratory deaths',
                               '2020-21 deaths': '2020-21 respiratory disease deaths'}, axis=1)

respiratory_data.head()

Unnamed: 0,date,2015-19 range,2015-19 avg respiratory deaths,2020-21 respiratory disease deaths,total change,percent total change
0,05-Jan-20,215|263,233,240,7,3.0
1,12-Jan-20,203|251,220,240,20,9.09
2,19-Jan-20,193|233,206,222,16,7.77
3,26-Jan-20,197|242,218,242,24,11.01
4,02-Feb-20,200|229,219,226,7,3.2


In [15]:
data = [total_data["date"], cancer_data["2015-19 avg cancer deaths"], cerebro_data["2015-19 cerebrovascular disease deaths"], clrd_data["2015-19 avg chronic lower respiratory disease deaths"], dementia_data["2015-19 avg dementia deaths"], diabetes_data["2015-19 avg diabetes deaths"], heart_data["2015-19 avg heart disease deaths"], pneumonia_data["2015-19 avg pneumonia deaths"], respiratory_data["2015-19 avg respiratory deaths"]]
Deaths_Summary2015_19 = pd.DataFrame(data)
print(Deaths_Summary2015_19)

                                                           0          1   \
date                                                05-Jan-20  12-Jan-20   
2015-19 avg cancer deaths                                 868        869   
2015-19 cerebrovascular disease deaths                    182        178   
2015-19 avg chronic lower respiratory disease d...        133        124   
2015-19 avg dementia deaths                               232        224   
2015-19 avg diabetes deaths                                71         74   
2015-19 avg heart disease deaths                          269        258   
2015-19 avg pneumonia deaths                               45         42   
2015-19 avg respiratory deaths                            233        220   

                                                           2          3   \
date                                                19-Jan-20  26-Jan-20   
2015-19 avg cancer deaths                                 874        870   
2015-19 cer

In [16]:
Deaths_Summary2015_19 = Deaths_Summary2015_19.T
Deaths_Summary2015_19

Unnamed: 0,date,2015-19 avg cancer deaths,2015-19 cerebrovascular disease deaths,2015-19 avg chronic lower respiratory disease deaths,2015-19 avg dementia deaths,2015-19 avg diabetes deaths,2015-19 avg heart disease deaths,2015-19 avg pneumonia deaths,2015-19 avg respiratory deaths
0,05-Jan-20,868,182,133,232,71,269,45,233
1,12-Jan-20,869,178,124,224,74,258,42,220
2,19-Jan-20,874,167,118,220,83,272,37,206
3,26-Jan-20,870,176,126,218,80,245,35,218
4,02-Feb-20,864,168,125,220,78,267,37,219
...,...,...,...,...,...,...,...,...,...
56,31-Jan-21,870,176,126,218,80,245,35,218
57,07-Feb-21,864,168,125,220,78,267,37,219
58,14-Feb-21,858,165,119,224,85,265,35,212
59,21-Feb-21,858,170,118,226,75,250,43,216


In [17]:
data = [total_data["date"], new_total_data["2020-21 total deaths"], total_data["COVID-19 new infections"], cancer_data["2020-21 cancer deaths"], cancer_data["percent total change"], cerebro_data["2020-21 cerebrovascular disease deaths"], cerebro_data["percent total change"], clrd_data["2020-21 chronic lower respiratory disease deaths"], clrd_data["percent total change"], dementia_data["2020-21 dementia deaths"], dementia_data["percent total change"], diabetes_data["2020-21 diabetes deaths"], diabetes_data["percent total change"], heart_data["2020-21 heart disease deaths"], heart_data["percent total change"], pneumonia_data["2020-21 pneumonia deaths"], pneumonia_data["percent total change"], respiratory_data["2020-21 respiratory disease deaths"], respiratory_data["percent total change"]]
Deaths_Summary2020_21 = pd.DataFrame(data)
print(Deaths_Summary2020_21)

                                                         0          1   \
date                                              05-Jan-20  12-Jan-20   
2020-21 total deaths                                   2498       2511   
COVID-19 new infections                                   0          0   
2020-21 cancer deaths                                   849        899   
percent total change                                  -2.19       3.45   
2020-21 cerebrovascular disease deaths                  139        166   
percent total change                                 -23.63      -6.74   
2020-21 chronic lower respiratory disease deaths        127        145   
percent total change                                  -4.51      16.94   
2020-21 dementia deaths                                 255        265   
percent total change                                   9.91       18.3   
2020-21 diabetes deaths                                  86         71   
percent total change                  

In [18]:
Deaths_Summary2020_21 = Deaths_Summary2020_21.T
Deaths_Summary2020_21

Unnamed: 0,date,2020-21 total deaths,COVID-19 new infections,2020-21 cancer deaths,percent total change,2020-21 cerebrovascular disease deaths,percent total change.1,2020-21 chronic lower respiratory disease deaths,percent total change.2,2020-21 dementia deaths,percent total change.3,2020-21 diabetes deaths,percent total change.4,2020-21 heart disease deaths,percent total change.5,2020-21 pneumonia deaths,percent total change.6,2020-21 respiratory disease deaths,percent total change.7
0,05-Jan-20,2498,0,849,-2.19,139,-23.63,127,-4.51,255,9.91,86,21.13,215,-20.07,42,-6.67,240,3
1,12-Jan-20,2511,0,899,3.45,166,-6.74,145,16.94,265,18.3,71,-4.05,218,-15.5,40,-4.76,240,9.09
2,19-Jan-20,2501,0,912,4.35,141,-15.57,120,1.69,257,16.82,71,-14.46,234,-13.97,37,0,222,7.77
3,26-Jan-20,2597,4,931,7.01,159,-9.66,132,4.76,248,13.76,77,-3.75,244,-0.41,44,25.71,242,11.01
4,02-Feb-20,2510,8,830,-3.94,162,-3.57,134,7.2,276,25.45,80,2.56,235,-11.99,31,-16.22,226,3.2
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
56,31-Jan-21,2527,44,894,2.76,156,-11.36,113,-10.32,289,32.57,61,-23.75,221,-9.8,26,-25.71,211,-3.21
57,07-Feb-21,2650,39,926,7.18,165,-1.79,127,1.6,261,18.64,83,6.41,249,-6.74,37,0,231,5.48
58,14-Feb-21,2534,46,914,6.53,159,-3.64,107,-10.08,240,7.14,78,-8.24,250,-5.66,27,-22.86,199,-6.13
59,21-Feb-21,2512,25,907,5.71,174,2.35,110,-6.78,257,13.72,74,-1.33,208,-16.8,37,-13.95,197,-8.8


In [19]:
Deaths_Summary2020_21['Percentage of Total Deaths'] = (Deaths_Summary2020_21['2020-21 cancer deaths']/Deaths_Summary2020_21['2020-21 total deaths'])*100
Deaths_Summary2020_21 = Deaths_Summary2020_21.round(2)
Deaths_Summary2020_21

Unnamed: 0,date,2020-21 total deaths,COVID-19 new infections,2020-21 cancer deaths,percent total change,2020-21 cerebrovascular disease deaths,percent total change.1,2020-21 chronic lower respiratory disease deaths,percent total change.2,2020-21 dementia deaths,percent total change.3,2020-21 diabetes deaths,percent total change.4,2020-21 heart disease deaths,percent total change.5,2020-21 pneumonia deaths,percent total change.6,2020-21 respiratory disease deaths,percent total change.7,Percentage of Total Deaths
0,05-Jan-20,2498,0,849,-2.19,139,-23.63,127,-4.51,255,9.91,86,21.13,215,-20.07,42,-6.67,240,3,33.9872
1,12-Jan-20,2511,0,899,3.45,166,-6.74,145,16.94,265,18.3,71,-4.05,218,-15.5,40,-4.76,240,9.09,35.8025
2,19-Jan-20,2501,0,912,4.35,141,-15.57,120,1.69,257,16.82,71,-14.46,234,-13.97,37,0,222,7.77,36.4654
3,26-Jan-20,2597,4,931,7.01,159,-9.66,132,4.76,248,13.76,77,-3.75,244,-0.41,44,25.71,242,11.01,35.8491
4,02-Feb-20,2510,8,830,-3.94,162,-3.57,134,7.2,276,25.45,80,2.56,235,-11.99,31,-16.22,226,3.2,33.0677
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
56,31-Jan-21,2527,44,894,2.76,156,-11.36,113,-10.32,289,32.57,61,-23.75,221,-9.8,26,-25.71,211,-3.21,35.3779
57,07-Feb-21,2650,39,926,7.18,165,-1.79,127,1.6,261,18.64,83,6.41,249,-6.74,37,0,231,5.48,34.9434
58,14-Feb-21,2534,46,914,6.53,159,-3.64,107,-10.08,240,7.14,78,-8.24,250,-5.66,27,-22.86,199,-6.13,36.0695
59,21-Feb-21,2512,25,907,5.71,174,2.35,110,-6.78,257,13.72,74,-1.33,208,-16.8,37,-13.95,197,-8.8,36.1067


In [24]:
data = [cancer_data['date'], new_total_data['2015-19 avg total deaths'], cancer_data['2015-19 avg cancer deaths']]
cancer_data_2015_19 = pd.DataFrame(data)
cancer_data_2015_19 = cancer_data_2015_19.T
cancer_data_2015_19

Unnamed: 0,date,2015-19 avg total deaths,2015-19 avg cancer deaths
0,05-Jan-20,2498,868
1,12-Jan-20,2490,869
2,19-Jan-20,2465,874
3,26-Jan-20,2446,870
4,02-Feb-20,2451,864
...,...,...,...
56,31-Jan-21,2446,870
57,07-Feb-21,2451,864
58,14-Feb-21,2456,858
59,21-Feb-21,2463,858


In [25]:
cancer_data_2015_19['Percentage of Total Deaths'] = (cancer_data_2015_19['2015-19 avg cancer deaths'] / cancer_data_2015_19['2015-19 avg total deaths']) * 100
cancer_data_2015_19

Unnamed: 0,date,2015-19 avg total deaths,2015-19 avg cancer deaths,Percentage of Total Deaths
0,05-Jan-20,2498,868,34.7478
1,12-Jan-20,2490,869,34.8996
2,19-Jan-20,2465,874,35.4564
3,26-Jan-20,2446,870,35.5683
4,02-Feb-20,2451,864,35.2509
...,...,...,...,...
56,31-Jan-21,2446,870,35.5683
57,07-Feb-21,2451,864,35.2509
58,14-Feb-21,2456,858,34.9349
59,21-Feb-21,2463,858,34.8356


In [26]:
data = [cancer_data['date'], new_total_data['2020-21 total deaths'], cancer_data['2020-21 cancer deaths']]
cancer_data_2020_21 = pd.DataFrame(data)
cancer_data_2020_21 = cancer_data_2020_21.T
cancer_data_2020_21

Unnamed: 0,date,2020-21 total deaths,2020-21 cancer deaths
0,05-Jan-20,2498,849
1,12-Jan-20,2511,899
2,19-Jan-20,2501,912
3,26-Jan-20,2597,931
4,02-Feb-20,2510,830
...,...,...,...
56,31-Jan-21,2527,894
57,07-Feb-21,2650,926
58,14-Feb-21,2534,914
59,21-Feb-21,2512,907


In [27]:
cancer_data_2020_21['Percentage of Total Deaths'] = (cancer_data_2020_21['2020-21 cancer deaths'] / cancer_data_2020_21['2020-21 total deaths']) * 100
cancer_data_2020_21

Unnamed: 0,date,2020-21 total deaths,2020-21 cancer deaths,Percentage of Total Deaths
0,05-Jan-20,2498,849,33.9872
1,12-Jan-20,2511,899,35.8025
2,19-Jan-20,2501,912,36.4654
3,26-Jan-20,2597,931,35.8491
4,02-Feb-20,2510,830,33.0677
...,...,...,...,...
56,31-Jan-21,2527,894,35.3779
57,07-Feb-21,2650,926,34.9434
58,14-Feb-21,2534,914,36.0695
59,21-Feb-21,2512,907,36.1067


In [28]:
data = [new_total_data['date'], new_total_data['2015-19 avg total deaths'], cerebro_data['2015-19 cerebrovascular disease deaths']]
cerebro_data_2015_19 = pd.DataFrame(data)
cerebro_data_2015_19 = cerebro_data_2015_19.T
cerebro_data_2015_19

Unnamed: 0,date,2015-19 avg total deaths,2015-19 cerebrovascular disease deaths
0,05-Jan-20,2498,182
1,12-Jan-20,2490,178
2,19-Jan-20,2465,167
3,26-Jan-20,2446,176
4,02-Feb-20,2451,168
...,...,...,...
56,31-Jan-21,2446,176
57,07-Feb-21,2451,168
58,14-Feb-21,2456,165
59,21-Feb-21,2463,170


In [29]:
cerebro_data_2015_19['Percentage of Total Deaths'] = (cerebro_data_2015_19['2015-19 cerebrovascular disease deaths'] / cerebro_data_2015_19['2015-19 avg total deaths']) * 100
cerebro_data_2015_19

Unnamed: 0,date,2015-19 avg total deaths,2015-19 cerebrovascular disease deaths,Percentage of Total Deaths
0,05-Jan-20,2498,182,7.28583
1,12-Jan-20,2490,178,7.14859
2,19-Jan-20,2465,167,6.77485
3,26-Jan-20,2446,176,7.19542
4,02-Feb-20,2451,168,6.85435
...,...,...,...,...
56,31-Jan-21,2446,176,7.19542
57,07-Feb-21,2451,168,6.85435
58,14-Feb-21,2456,165,6.71824
59,21-Feb-21,2463,170,6.90215


In [30]:
data = [new_total_data['date'], new_total_data['2020-21 total deaths'], cerebro_data['2020-21 cerebrovascular disease deaths']]
cerebro_data_2020_21 = pd.DataFrame(data)
cerebro_data_2020_21 = cerebro_data_2020_21.T
cerebro_data_2020_21

Unnamed: 0,date,2020-21 total deaths,2020-21 cerebrovascular disease deaths
0,05-Jan-20,2498,139
1,12-Jan-20,2511,166
2,19-Jan-20,2501,141
3,26-Jan-20,2597,159
4,02-Feb-20,2510,162
...,...,...,...
56,31-Jan-21,2527,156
57,07-Feb-21,2650,165
58,14-Feb-21,2534,159
59,21-Feb-21,2512,174


In [31]:
cerebro_data_2020_21['Percentage of Total Deaths'] = (cerebro_data_2020_21['2020-21 cerebrovascular disease deaths'] / cerebro_data_2020_21['2020-21 total deaths']) * 100
cerebro_data_2020_21

Unnamed: 0,date,2020-21 total deaths,2020-21 cerebrovascular disease deaths,Percentage of Total Deaths
0,05-Jan-20,2498,139,5.56445
1,12-Jan-20,2511,166,6.61091
2,19-Jan-20,2501,141,5.63774
3,26-Jan-20,2597,159,6.12245
4,02-Feb-20,2510,162,6.45418
...,...,...,...,...
56,31-Jan-21,2527,156,6.17333
57,07-Feb-21,2650,165,6.22642
58,14-Feb-21,2534,159,6.27466
59,21-Feb-21,2512,174,6.92675


In [32]:
data = [new_total_data['date'], new_total_data['2015-19 avg total deaths'], clrd_data['2015-19 avg chronic lower respiratory disease deaths']]
clrd_data_2015_19 = pd.DataFrame(data)
clrd_data_2015_19 = clrd_data_2015_19.T
clrd_data_2015_19

Unnamed: 0,date,2015-19 avg total deaths,2015-19 avg chronic lower respiratory disease deaths
0,05-Jan-20,2498,133
1,12-Jan-20,2490,124
2,19-Jan-20,2465,118
3,26-Jan-20,2446,126
4,02-Feb-20,2451,125
...,...,...,...
56,31-Jan-21,2446,126
57,07-Feb-21,2451,125
58,14-Feb-21,2456,119
59,21-Feb-21,2463,118


In [33]:
clrd_data_2015_19['Percentage of Total Deaths'] = (clrd_data_2015_19['2015-19 avg chronic lower respiratory disease deaths'] / clrd_data_2015_19['2015-19 avg total deaths']) * 100
clrd_data_2015_19

Unnamed: 0,date,2015-19 avg total deaths,2015-19 avg chronic lower respiratory disease deaths,Percentage of Total Deaths
0,05-Jan-20,2498,133,5.32426
1,12-Jan-20,2490,124,4.97992
2,19-Jan-20,2465,118,4.78702
3,26-Jan-20,2446,126,5.15127
4,02-Feb-20,2451,125,5.09996
...,...,...,...,...
56,31-Jan-21,2446,126,5.15127
57,07-Feb-21,2451,125,5.09996
58,14-Feb-21,2456,119,4.84528
59,21-Feb-21,2463,118,4.79091


In [34]:
data = [new_total_data['date'], new_total_data['2020-21 total deaths'], clrd_data['2020-21 chronic lower respiratory disease deaths']]
clrd_data_2020_21 = pd.DataFrame(data)
clrd_data_2020_21 = clrd_data_2020_21.T
clrd_data_2020_21

Unnamed: 0,date,2020-21 total deaths,2020-21 chronic lower respiratory disease deaths
0,05-Jan-20,2498,127
1,12-Jan-20,2511,145
2,19-Jan-20,2501,120
3,26-Jan-20,2597,132
4,02-Feb-20,2510,134
...,...,...,...
56,31-Jan-21,2527,113
57,07-Feb-21,2650,127
58,14-Feb-21,2534,107
59,21-Feb-21,2512,110


In [35]:
clrd_data_2020_21['Percentage of Total Deaths'] = (clrd_data_2020_21['2020-21 chronic lower respiratory disease deaths'] / clrd_data_2020_21['2020-21 total deaths']) * 100
clrd_data_2020_21

Unnamed: 0,date,2020-21 total deaths,2020-21 chronic lower respiratory disease deaths,Percentage of Total Deaths
0,05-Jan-20,2498,127,5.08407
1,12-Jan-20,2511,145,5.77459
2,19-Jan-20,2501,120,4.79808
3,26-Jan-20,2597,132,5.08279
4,02-Feb-20,2510,134,5.33865
...,...,...,...,...
56,31-Jan-21,2527,113,4.47171
57,07-Feb-21,2650,127,4.79245
58,14-Feb-21,2534,107,4.22257
59,21-Feb-21,2512,110,4.37898


In [36]:
data = [new_total_data['date'], new_total_data['2015-19 avg total deaths'], dementia_data['2015-19 avg dementia deaths']]
dementia_data_2015_19 = pd.DataFrame(data)
dementia_data_2015_19 = dementia_data_2015_19.T
dementia_data_2015_19

Unnamed: 0,date,2015-19 avg total deaths,2015-19 avg dementia deaths
0,05-Jan-20,2498,232
1,12-Jan-20,2490,224
2,19-Jan-20,2465,220
3,26-Jan-20,2446,218
4,02-Feb-20,2451,220
...,...,...,...
56,31-Jan-21,2446,218
57,07-Feb-21,2451,220
58,14-Feb-21,2456,224
59,21-Feb-21,2463,226


In [37]:
dementia_data_2015_19['Percentage of Total Deaths'] = (dementia_data_2015_19['2015-19 avg dementia deaths'] / dementia_data_2015_19['2015-19 avg total deaths']) * 100
dementia_data_2015_19

Unnamed: 0,date,2015-19 avg total deaths,2015-19 avg dementia deaths,Percentage of Total Deaths
0,05-Jan-20,2498,232,9.28743
1,12-Jan-20,2490,224,8.99598
2,19-Jan-20,2465,220,8.92495
3,26-Jan-20,2446,218,8.91251
4,02-Feb-20,2451,220,8.97593
...,...,...,...,...
56,31-Jan-21,2446,218,8.91251
57,07-Feb-21,2451,220,8.97593
58,14-Feb-21,2456,224,9.12052
59,21-Feb-21,2463,226,9.1758


In [38]:
data = [new_total_data['date'], new_total_data['2020-21 total deaths'], dementia_data['2020-21 dementia deaths']]
dementia_data_2020_21 = pd.DataFrame(data)
dementia_data_2020_21 = dementia_data_2020_21.T
dementia_data_2020_21

Unnamed: 0,date,2020-21 total deaths,2020-21 dementia deaths
0,05-Jan-20,2498,255
1,12-Jan-20,2511,265
2,19-Jan-20,2501,257
3,26-Jan-20,2597,248
4,02-Feb-20,2510,276
...,...,...,...
56,31-Jan-21,2527,289
57,07-Feb-21,2650,261
58,14-Feb-21,2534,240
59,21-Feb-21,2512,257


In [39]:
dementia_data_2020_21['Percentage of Total Deaths'] = (dementia_data_2020_21['2020-21 dementia deaths'] / dementia_data_2020_21['2020-21 total deaths']) * 100
dementia_data_2020_21

Unnamed: 0,date,2020-21 total deaths,2020-21 dementia deaths,Percentage of Total Deaths
0,05-Jan-20,2498,255,10.2082
1,12-Jan-20,2511,265,10.5536
2,19-Jan-20,2501,257,10.2759
3,26-Jan-20,2597,248,9.54948
4,02-Feb-20,2510,276,10.996
...,...,...,...,...
56,31-Jan-21,2527,289,11.4365
57,07-Feb-21,2650,261,9.84906
58,14-Feb-21,2534,240,9.47119
59,21-Feb-21,2512,257,10.2309


In [41]:
data = [new_total_data['date'], new_total_data['2015-19 avg total deaths'], diabetes_data['2015-19 avg diabetes deaths']]
diabetes_data_2015_19 = pd.DataFrame(data)
diabetes_data_2015_19 = diabetes_data_2015_19.T
diabetes_data_2015_19

Unnamed: 0,date,2015-19 avg total deaths,2015-19 avg diabetes deaths
0,05-Jan-20,2498,71
1,12-Jan-20,2490,74
2,19-Jan-20,2465,83
3,26-Jan-20,2446,80
4,02-Feb-20,2451,78
...,...,...,...
56,31-Jan-21,2446,80
57,07-Feb-21,2451,78
58,14-Feb-21,2456,85
59,21-Feb-21,2463,75


In [43]:
diabetes_data_2015_19['Percentage of Total Deaths'] = (diabetes_data_2015_19['2015-19 avg diabetes deaths'] / diabetes_data_2015_19['2015-19 avg total deaths']) * 100
diabetes_data_2015_19

Unnamed: 0,date,2015-19 avg total deaths,2015-19 avg diabetes deaths,Percentage of Total Deaths
0,05-Jan-20,2498,71,2.84227
1,12-Jan-20,2490,74,2.97189
2,19-Jan-20,2465,83,3.36714
3,26-Jan-20,2446,80,3.27065
4,02-Feb-20,2451,78,3.18237
...,...,...,...,...
56,31-Jan-21,2446,80,3.27065
57,07-Feb-21,2451,78,3.18237
58,14-Feb-21,2456,85,3.46091
59,21-Feb-21,2463,75,3.04507


In [44]:
data = [new_total_data['date'], new_total_data['2020-21 total deaths'], diabetes_data['2020-21 diabetes deaths']]
diabetes_data_2020_21 = pd.DataFrame(data)
diabetes_data_2020_21 = diabetes_data_2020_21.T
diabetes_data_2020_21

Unnamed: 0,date,2020-21 total deaths,2020-21 diabetes deaths
0,05-Jan-20,2498,86
1,12-Jan-20,2511,71
2,19-Jan-20,2501,71
3,26-Jan-20,2597,77
4,02-Feb-20,2510,80
...,...,...,...
56,31-Jan-21,2527,61
57,07-Feb-21,2650,83
58,14-Feb-21,2534,78
59,21-Feb-21,2512,74


In [45]:
diabetes_data_2020_21['Percentage of Total Deaths'] = (diabetes_data_2020_21['2020-21 diabetes deaths'] / diabetes_data_2020_21['2020-21 total deaths']) * 100
diabetes_data_2020_21

Unnamed: 0,date,2020-21 total deaths,2020-21 diabetes deaths,Percentage of Total Deaths
0,05-Jan-20,2498,86,3.44275
1,12-Jan-20,2511,71,2.82756
2,19-Jan-20,2501,71,2.83886
3,26-Jan-20,2597,77,2.96496
4,02-Feb-20,2510,80,3.18725
...,...,...,...,...
56,31-Jan-21,2527,61,2.41393
57,07-Feb-21,2650,83,3.13208
58,14-Feb-21,2534,78,3.07814
59,21-Feb-21,2512,74,2.94586


In [46]:
data = [new_total_data['date'], new_total_data['2015-19 avg total deaths'], heart_data['2015-19 avg heart disease deaths']]
heart_data_2015_19 = pd.DataFrame(data)
heart_data_2015_19 = heart_data_2015_19.T
heart_data_2015_19

Unnamed: 0,date,2015-19 avg total deaths,2015-19 avg heart disease deaths
0,05-Jan-20,2498,269
1,12-Jan-20,2490,258
2,19-Jan-20,2465,272
3,26-Jan-20,2446,245
4,02-Feb-20,2451,267
...,...,...,...
56,31-Jan-21,2446,245
57,07-Feb-21,2451,267
58,14-Feb-21,2456,265
59,21-Feb-21,2463,250


In [47]:
heart_data_2015_19['Percentage of Total Deaths'] = (heart_data_2015_19['2015-19 avg heart disease deaths'] / heart_data_2015_19['2015-19 avg total deaths']) * 100
heart_data_2015_19

Unnamed: 0,date,2015-19 avg total deaths,2015-19 avg heart disease deaths,Percentage of Total Deaths
0,05-Jan-20,2498,269,10.7686
1,12-Jan-20,2490,258,10.3614
2,19-Jan-20,2465,272,11.0345
3,26-Jan-20,2446,245,10.0164
4,02-Feb-20,2451,267,10.8935
...,...,...,...,...
56,31-Jan-21,2446,245,10.0164
57,07-Feb-21,2451,267,10.8935
58,14-Feb-21,2456,265,10.7899
59,21-Feb-21,2463,250,10.1502


In [48]:
data = [new_total_data['date'], new_total_data['2020-21 total deaths'], heart_data['2020-21 heart disease deaths']]
heart_data_2020_21 = pd.DataFrame(data)
heart_data_2020_21 = heart_data_2020_21.T
heart_data_2020_21

Unnamed: 0,date,2020-21 total deaths,2020-21 heart disease deaths
0,05-Jan-20,2498,215
1,12-Jan-20,2511,218
2,19-Jan-20,2501,234
3,26-Jan-20,2597,244
4,02-Feb-20,2510,235
...,...,...,...
56,31-Jan-21,2527,221
57,07-Feb-21,2650,249
58,14-Feb-21,2534,250
59,21-Feb-21,2512,208


In [49]:
heart_data_2020_21['Percentage of Total Deaths'] = (heart_data_2020_21['2020-21 heart disease deaths'] / heart_data_2020_21['2020-21 total deaths']) * 100
heart_data_2020_21

Unnamed: 0,date,2020-21 total deaths,2020-21 heart disease deaths,Percentage of Total Deaths
0,05-Jan-20,2498,215,8.60689
1,12-Jan-20,2511,218,8.6818
2,19-Jan-20,2501,234,9.35626
3,26-Jan-20,2597,244,9.39546
4,02-Feb-20,2510,235,9.36255
...,...,...,...,...
56,31-Jan-21,2527,221,8.74555
57,07-Feb-21,2650,249,9.39623
58,14-Feb-21,2534,250,9.86582
59,21-Feb-21,2512,208,8.28025


In [51]:
data = [new_total_data['date'], new_total_data['2015-19 avg total deaths'], pneumonia_data['2015-19 avg pneumonia deaths']]
pneumonia_data_2015_19 = pd.DataFrame(data)
pneumonia_data_2015_19 = pneumonia_data_2015_19.T
pneumonia_data_2015_19

Unnamed: 0,date,2015-19 avg total deaths,2015-19 avg pneumonia deaths
0,05-Jan-20,2498,45
1,12-Jan-20,2490,42
2,19-Jan-20,2465,37
3,26-Jan-20,2446,35
4,02-Feb-20,2451,37
...,...,...,...
56,31-Jan-21,2446,35
57,07-Feb-21,2451,37
58,14-Feb-21,2456,35
59,21-Feb-21,2463,43


In [52]:
pneumonia_data_2015_19['Percentage of Total Deaths'] = (pneumonia_data_2015_19['2015-19 avg pneumonia deaths'] / pneumonia_data_2015_19['2015-19 avg total deaths']) * 100
pneumonia_data_2015_19

Unnamed: 0,date,2015-19 avg total deaths,2015-19 avg pneumonia deaths,Percentage of Total Deaths
0,05-Jan-20,2498,45,1.80144
1,12-Jan-20,2490,42,1.68675
2,19-Jan-20,2465,37,1.50101
3,26-Jan-20,2446,35,1.43091
4,02-Feb-20,2451,37,1.50959
...,...,...,...,...
56,31-Jan-21,2446,35,1.43091
57,07-Feb-21,2451,37,1.50959
58,14-Feb-21,2456,35,1.42508
59,21-Feb-21,2463,43,1.74584


In [53]:
data = [new_total_data['date'], new_total_data['2020-21 total deaths'], pneumonia_data['2020-21 pneumonia deaths']]
pneumonia_data_2020_21 = pd.DataFrame(data)
pneumonia_data_2020_21 = pneumonia_data_2020_21.T
pneumonia_data_2020_21

Unnamed: 0,date,2020-21 total deaths,2020-21 pneumonia deaths
0,05-Jan-20,2498,42
1,12-Jan-20,2511,40
2,19-Jan-20,2501,37
3,26-Jan-20,2597,44
4,02-Feb-20,2510,31
...,...,...,...
56,31-Jan-21,2527,26
57,07-Feb-21,2650,37
58,14-Feb-21,2534,27
59,21-Feb-21,2512,37


In [54]:
pneumonia_data_2020_21['Percentage of Total Deaths'] = (pneumonia_data_2020_21['2020-21 pneumonia deaths'] / pneumonia_data_2020_21['2020-21 total deaths']) * 100
pneumonia_data_2020_21

Unnamed: 0,date,2020-21 total deaths,2020-21 pneumonia deaths,Percentage of Total Deaths
0,05-Jan-20,2498,42,1.68135
1,12-Jan-20,2511,40,1.59299
2,19-Jan-20,2501,37,1.47941
3,26-Jan-20,2597,44,1.69426
4,02-Feb-20,2510,31,1.23506
...,...,...,...,...
56,31-Jan-21,2527,26,1.02889
57,07-Feb-21,2650,37,1.39623
58,14-Feb-21,2534,27,1.06551
59,21-Feb-21,2512,37,1.47293


In [55]:
data = [new_total_data['date'], new_total_data['2015-19 avg total deaths'], respiratory_data['2015-19 avg respiratory deaths']]
respiratory_data_2015_19 = pd.DataFrame(data)
respiratory_data_2015_19 = respiratory_data_2015_19.T
respiratory_data_2015_19

Unnamed: 0,date,2015-19 avg total deaths,2015-19 avg respiratory deaths
0,05-Jan-20,2498,233
1,12-Jan-20,2490,220
2,19-Jan-20,2465,206
3,26-Jan-20,2446,218
4,02-Feb-20,2451,219
...,...,...,...
56,31-Jan-21,2446,218
57,07-Feb-21,2451,219
58,14-Feb-21,2456,212
59,21-Feb-21,2463,216


In [56]:
respiratory_data_2015_19['Percentage of Total Deaths'] = (respiratory_data_2015_19['2015-19 avg respiratory deaths'] / respiratory_data_2015_19['2015-19 avg total deaths']) * 100
respiratory_data_2015_19

Unnamed: 0,date,2015-19 avg total deaths,2015-19 avg respiratory deaths,Percentage of Total Deaths
0,05-Jan-20,2498,233,9.32746
1,12-Jan-20,2490,220,8.83534
2,19-Jan-20,2465,206,8.357
3,26-Jan-20,2446,218,8.91251
4,02-Feb-20,2451,219,8.93513
...,...,...,...,...
56,31-Jan-21,2446,218,8.91251
57,07-Feb-21,2451,219,8.93513
58,14-Feb-21,2456,212,8.63192
59,21-Feb-21,2463,216,8.76979


In [57]:
data = [new_total_data['date'], new_total_data['2020-21 total deaths'], respiratory_data['2020-21 respiratory disease deaths']]
respiratory_data_2020_21 = pd.DataFrame(data)
respiratory_data_2020_21 = respiratory_data_2020_21.T
respiratory_data_2020_21

Unnamed: 0,date,2020-21 total deaths,2020-21 respiratory disease deaths
0,05-Jan-20,2498,240
1,12-Jan-20,2511,240
2,19-Jan-20,2501,222
3,26-Jan-20,2597,242
4,02-Feb-20,2510,226
...,...,...,...
56,31-Jan-21,2527,211
57,07-Feb-21,2650,231
58,14-Feb-21,2534,199
59,21-Feb-21,2512,197


In [58]:
respiratory_data_2020_21['Percentage of Total Deaths'] = (respiratory_data_2020_21['2020-21 respiratory disease deaths'] / respiratory_data_2020_21['2020-21 total deaths']) * 100
respiratory_data_2020_21

Unnamed: 0,date,2020-21 total deaths,2020-21 respiratory disease deaths,Percentage of Total Deaths
0,05-Jan-20,2498,240,9.60769
1,12-Jan-20,2511,240,9.55795
2,19-Jan-20,2501,222,8.87645
3,26-Jan-20,2597,242,9.31844
4,02-Feb-20,2510,226,9.00398
...,...,...,...,...
56,31-Jan-21,2527,211,8.34982
57,07-Feb-21,2650,231,8.71698
58,14-Feb-21,2534,199,7.8532
59,21-Feb-21,2512,197,7.84236
