# Checking correlation between variables per country

One of the goals of Team 6 was to show the correlation between different variables in the OWID dataset. By exploring these correlations we tried to find interesting patterns.

## Correlation Heatmaps

We selected five countries that, in our opinion, differ the most from one another. The five countries we chose are:
- The Netherlands (NLD)
- India (IND)
- The United States of America (USA)
- Brazil (BRA)
- Niger (NER)

In this analysis we looked at new cases, new deaths, total cases and total deaths. We looked for correlations between each of these variables and four other variables. The four variables we picked are:
- New vaccinations
- ICU patients
- Hospital patients
- Stringency index

In [2]:
import pandas as pd
import matplotlib.pyplot as plt
import matplotlib.ticker as ticker
import seaborn as sb

# Do not truncate the column list when a DataFrame is displayed.
pd.set_option('display.max_columns', None)

# Load the OWID CSV and order the rows by the 'date' column (ascending),
# then parse the YYYY-MM-DD date strings into datetime values.
data = pd.read_csv(r"owid-covid-data.csv").sort_values('date', ascending=True)
data['date'] = pd.to_datetime(data['date'], format='%Y-%m-%d')

# One frame per country under study, selected by its ISO code.
data_NLD = data.loc[data['iso_code'] == 'NLD']
data_IND = data.loc[data['iso_code'] == 'IND']
data_USA = data.loc[data['iso_code'] == 'USA']
data_BRA = data.loc[data['iso_code'] == 'BRA']
data_NER = data.loc[data['iso_code'] == 'NER']

## New cases and total cases in correlation to new vaccinations in the Netherlands

In [14]:
# Pearson correlation of new_cases vs. new_vaccinations_smoothed (NLD rows only).
dfn = data_NLD.loc[:, ['new_cases', 'new_vaccinations_smoothed']]
corr = dfn.corr(method='pearson')
# Fixed [-1, 1] colour range keeps the shading comparable between tables.
corr.style.background_gradient(vmin=-1, vmax=1, cmap='coolwarm')

Unnamed: 0,new_cases,new_vaccinations_smoothed
new_cases,1.0,-0.410749
new_vaccinations_smoothed,-0.410749,1.0


In [15]:
# Pearson correlation of total_cases vs. new_vaccinations_smoothed (NLD rows only).
dft = data_NLD.loc[:, ['total_cases', 'new_vaccinations_smoothed']]
corr = dft.corr(method='pearson')
# Fixed [-1, 1] colour range keeps the shading comparable between tables.
corr.style.background_gradient(vmin=-1, vmax=1, cmap='coolwarm')

Unnamed: 0,total_cases,new_vaccinations_smoothed
total_cases,1.0,0.933169
new_vaccinations_smoothed,0.933169,1.0


## New cases and total cases in correlation to new vaccinations in India

In [6]:
# Pearson correlation of new_cases vs. new_vaccinations_smoothed (IND rows only).
dfn = data_IND.loc[:, ['new_cases', 'new_vaccinations_smoothed']]
corr = dfn.corr(method='pearson')
# Fixed [-1, 1] colour range keeps the shading comparable between tables.
corr.style.background_gradient(vmin=-1, vmax=1, cmap='coolwarm')

Unnamed: 0,new_cases,new_vaccinations_smoothed
new_cases,1.0,0.411153
new_vaccinations_smoothed,0.411153,1.0


In [7]:
# Pearson correlation of total_cases vs. new_vaccinations_smoothed (IND rows only).
dft = data_IND.loc[:, ['total_cases', 'new_vaccinations_smoothed']]
corr = dft.corr(method='pearson')
# Fixed [-1, 1] colour range keeps the shading comparable between tables.
corr.style.background_gradient(vmin=-1, vmax=1, cmap='coolwarm')

Unnamed: 0,total_cases,new_vaccinations_smoothed
total_cases,1.0,0.60062
new_vaccinations_smoothed,0.60062,1.0


## New cases and total cases in correlation to new vaccinations in the USA

In [8]:
# Pearson correlation of new_cases vs. new_vaccinations_smoothed (USA rows only).
dfn = data_USA.loc[:, ['new_cases', 'new_vaccinations_smoothed']]
corr = dfn.corr(method='pearson')
# Fixed [-1, 1] colour range keeps the shading comparable between tables.
corr.style.background_gradient(vmin=-1, vmax=1, cmap='coolwarm')

Unnamed: 0,new_cases,new_vaccinations_smoothed
new_cases,1.0,-0.555605
new_vaccinations_smoothed,-0.555605,1.0


In [9]:
# Pearson correlation of total_cases vs. new_vaccinations_smoothed (USA rows only).
dft = data_USA.loc[:, ['total_cases', 'new_vaccinations_smoothed']]
corr = dft.corr(method='pearson')
# Fixed [-1, 1] colour range keeps the shading comparable between tables.
corr.style.background_gradient(vmin=-1, vmax=1, cmap='coolwarm')

Unnamed: 0,total_cases,new_vaccinations_smoothed
total_cases,1.0,0.625388
new_vaccinations_smoothed,0.625388,1.0


## New cases and total cases in correlation to new vaccinations in Brazil

In [10]:
# Pearson correlation of new_cases vs. new_vaccinations_smoothed (BRA rows only).
dfn = data_BRA.loc[:, ['new_cases', 'new_vaccinations_smoothed']]
corr = dfn.corr(method='pearson')
# Fixed [-1, 1] colour range keeps the shading comparable between tables.
corr.style.background_gradient(vmin=-1, vmax=1, cmap='coolwarm')

Unnamed: 0,new_cases,new_vaccinations_smoothed
new_cases,1.0,0.235925
new_vaccinations_smoothed,0.235925,1.0


In [11]:
# Pearson correlation of total_cases vs. new_vaccinations_smoothed (BRA rows only).
dft = data_BRA.loc[:, ['total_cases', 'new_vaccinations_smoothed']]
corr = dft.corr(method='pearson')
# Fixed [-1, 1] colour range keeps the shading comparable between tables.
corr.style.background_gradient(vmin=-1, vmax=1, cmap='coolwarm')

Unnamed: 0,total_cases,new_vaccinations_smoothed
total_cases,1.0,0.873887
new_vaccinations_smoothed,0.873887,1.0


## New cases and total cases in correlation to new vaccinations in Niger

In [12]:
# Pearson correlation of new_cases vs. new_vaccinations_smoothed (NER rows only).
dfn = data_NER.loc[:, ['new_cases', 'new_vaccinations_smoothed']]
corr = dfn.corr(method='pearson')
# Fixed [-1, 1] colour range keeps the shading comparable between tables.
corr.style.background_gradient(vmin=-1, vmax=1, cmap='coolwarm')

Unnamed: 0,new_cases,new_vaccinations_smoothed
new_cases,1.0,0.016462
new_vaccinations_smoothed,0.016462,1.0


In [13]:
# Pearson correlation of total_cases vs. new_vaccinations_smoothed (NER rows only).
dft = data_NER.loc[:, ['total_cases', 'new_vaccinations_smoothed']]
corr = dft.corr(method='pearson')
# Fixed [-1, 1] colour range keeps the shading comparable between tables.
corr.style.background_gradient(vmin=-1, vmax=1, cmap='coolwarm')

Unnamed: 0,total_cases,new_vaccinations_smoothed
total_cases,1.0,0.580976
new_vaccinations_smoothed,0.580976,1.0


## New deaths and total deaths in correlation to new vaccinations in the Netherlands

In [16]:
# Pearson correlation of new_deaths vs. new_vaccinations_smoothed (NLD rows only).
dfn = data_NLD.loc[:, ['new_deaths', 'new_vaccinations_smoothed']]
corr = dfn.corr(method='pearson')
# Fixed [-1, 1] colour range keeps the shading comparable between tables.
corr.style.background_gradient(vmin=-1, vmax=1, cmap='coolwarm')

Unnamed: 0,new_deaths,new_vaccinations_smoothed
new_deaths,1.0,-0.709755
new_vaccinations_smoothed,-0.709755,1.0


In [17]:
# Pearson correlation of total_deaths vs. new_vaccinations_smoothed (NLD rows only).
dft = data_NLD.loc[:, ['total_deaths', 'new_vaccinations_smoothed']]
corr = dft.corr(method='pearson')
# Fixed [-1, 1] colour range keeps the shading comparable between tables.
corr.style.background_gradient(vmin=-1, vmax=1, cmap='coolwarm')

Unnamed: 0,total_deaths,new_vaccinations_smoothed
total_deaths,1.0,0.840545
new_vaccinations_smoothed,0.840545,1.0


## New deaths and total deaths in correlation to new vaccinations in India

In [18]:
# Pearson correlation of new_deaths vs. new_vaccinations_smoothed (IND rows only).
df = data_IND.loc[:, ['new_deaths', 'new_vaccinations_smoothed']]
corr = df.corr(method='pearson')
# Fixed [-1, 1] colour range keeps the shading comparable between tables.
corr.style.background_gradient(vmin=-1, vmax=1, cmap='coolwarm')

Unnamed: 0,new_deaths,new_vaccinations_smoothed
new_deaths,1.0,0.43799
new_vaccinations_smoothed,0.43799,1.0


In [19]:
# Pearson correlation of total_deaths vs. new_vaccinations_smoothed (IND rows only).
df = data_IND.loc[:, ['total_deaths', 'new_vaccinations_smoothed']]
corr = df.corr(method='pearson')
# Fixed [-1, 1] colour range keeps the shading comparable between tables.
corr.style.background_gradient(vmin=-1, vmax=1, cmap='coolwarm')

Unnamed: 0,total_deaths,new_vaccinations_smoothed
total_deaths,1.0,0.587832
new_vaccinations_smoothed,0.587832,1.0


## New deaths and total deaths in correlation to new vaccinations in the USA

In [20]:
# Pearson correlation of new_deaths vs. new_vaccinations_smoothed (USA rows only).
df = data_USA.loc[:, ['new_deaths', 'new_vaccinations_smoothed']]
corr = df.corr(method='pearson')
# Fixed [-1, 1] colour range keeps the shading comparable between tables.
corr.style.background_gradient(vmin=-1, vmax=1, cmap='coolwarm')

Unnamed: 0,new_deaths,new_vaccinations_smoothed
new_deaths,1.0,-0.513012
new_vaccinations_smoothed,-0.513012,1.0


In [21]:
# Pearson correlation of total_deaths vs. new_vaccinations_smoothed (USA rows only).
df = data_USA.loc[:, ['total_deaths', 'new_vaccinations_smoothed']]
corr = df.corr(method='pearson')
# Fixed [-1, 1] colour range keeps the shading comparable between tables.
corr.style.background_gradient(vmin=-1, vmax=1, cmap='coolwarm')

Unnamed: 0,total_deaths,new_vaccinations_smoothed
total_deaths,1.0,0.652194
new_vaccinations_smoothed,0.652194,1.0


## New deaths and total deaths in correlation to new vaccinations in Brazil

In [22]:
# Pearson correlation of new_deaths vs. new_vaccinations_smoothed (BRA rows only).
df = data_BRA.loc[:, ['new_deaths', 'new_vaccinations_smoothed']]
corr = df.corr(method='pearson')
# Fixed [-1, 1] colour range keeps the shading comparable between tables.
corr.style.background_gradient(vmin=-1, vmax=1, cmap='coolwarm')

Unnamed: 0,new_deaths,new_vaccinations_smoothed
new_deaths,1.0,0.365747
new_vaccinations_smoothed,0.365747,1.0


In [23]:
# Pearson correlation of total_deaths vs. new_vaccinations_smoothed (BRA rows only).
df = data_BRA.loc[:, ['total_deaths', 'new_vaccinations_smoothed']]
corr = df.corr(method='pearson')
# Fixed [-1, 1] colour range keeps the shading comparable between tables.
corr.style.background_gradient(vmin=-1, vmax=1, cmap='coolwarm')

Unnamed: 0,total_deaths,new_vaccinations_smoothed
total_deaths,1.0,0.872504
new_vaccinations_smoothed,0.872504,1.0


## New deaths and total deaths in correlation to new vaccinations in Niger

In [24]:
# Pearson correlation of new_deaths vs. new_vaccinations_smoothed (NER rows only).
df = data_NER.loc[:, ['new_deaths', 'new_vaccinations_smoothed']]
corr = df.corr(method='pearson')
# Fixed [-1, 1] colour range keeps the shading comparable between tables.
corr.style.background_gradient(vmin=-1, vmax=1, cmap='coolwarm')

Unnamed: 0,new_deaths,new_vaccinations_smoothed
new_deaths,1.0,-0.268573
new_vaccinations_smoothed,-0.268573,1.0


In [25]:
# Pearson correlation of total_deaths vs. new_vaccinations_smoothed (NER rows only).
df = data_NER.loc[:, ['total_deaths', 'new_vaccinations_smoothed']]
corr = df.corr(method='pearson')
# Fixed [-1, 1] colour range keeps the shading comparable between tables.
corr.style.background_gradient(vmin=-1, vmax=1, cmap='coolwarm')

Unnamed: 0,total_deaths,new_vaccinations_smoothed
total_deaths,1.0,0.661186
new_vaccinations_smoothed,0.661186,1.0


## New cases and total cases in correlation to ICU-patients in the Netherlands

In [26]:
# Pearson correlation of new_cases vs. icu_patients (NLD rows only).
df = data_NLD.loc[:, ['new_cases', 'icu_patients']]
corr = df.corr(method='pearson')
# Fixed [-1, 1] colour range keeps the shading comparable between tables.
corr.style.background_gradient(vmin=-1, vmax=1, cmap='coolwarm')

Unnamed: 0,new_cases,icu_patients
new_cases,1.0,0.433373
icu_patients,0.433373,1.0


In [27]:
# Pearson correlation of total_cases vs. icu_patients (NLD rows only).
df = data_NLD.loc[:, ['total_cases', 'icu_patients']]
corr = df.corr(method='pearson')
# Fixed [-1, 1] colour range keeps the shading comparable between tables.
corr.style.background_gradient(vmin=-1, vmax=1, cmap='coolwarm')

Unnamed: 0,total_cases,icu_patients
total_cases,1.0,0.3839
icu_patients,0.3839,1.0


## New cases and total cases in correlation to ICU-patients in the USA

In [28]:
# Pearson correlation of new_cases vs. icu_patients (USA rows only).
df = data_USA.loc[:, ['new_cases', 'icu_patients']]
corr = df.corr(method='pearson')
# Fixed [-1, 1] colour range keeps the shading comparable between tables.
corr.style.background_gradient(vmin=-1, vmax=1, cmap='coolwarm')

Unnamed: 0,new_cases,icu_patients
new_cases,1.0,0.921275
icu_patients,0.921275,1.0


In [29]:
# Pearson correlation of total_cases vs. icu_patients (USA rows only).
df = data_USA.loc[:, ['total_cases', 'icu_patients']]
corr = df.corr(method='pearson')
# Fixed [-1, 1] colour range keeps the shading comparable between tables.
corr.style.background_gradient(vmin=-1, vmax=1, cmap='coolwarm')

Unnamed: 0,total_cases,icu_patients
total_cases,1.0,-0.110769
icu_patients,-0.110769,1.0


## New deaths and total deaths in correlation to ICU-patients in the Netherlands

In [30]:
# Pearson correlation of new_deaths vs. icu_patients (NLD rows only).
df = data_NLD.loc[:, ['new_deaths', 'icu_patients']]
corr = df.corr(method='pearson')
# Fixed [-1, 1] colour range keeps the shading comparable between tables.
corr.style.background_gradient(vmin=-1, vmax=1, cmap='coolwarm')

Unnamed: 0,new_deaths,icu_patients
new_deaths,1.0,0.733445
icu_patients,0.733445,1.0


In [31]:
# Pearson correlation of total_deaths vs. icu_patients (NLD rows only).
df = data_NLD.loc[:, ['total_deaths', 'icu_patients']]
corr = df.corr(method='pearson')
# Fixed [-1, 1] colour range keeps the shading comparable between tables.
corr.style.background_gradient(vmin=-1, vmax=1, cmap='coolwarm')

Unnamed: 0,total_deaths,icu_patients
total_deaths,1.0,0.261334
icu_patients,0.261334,1.0


## New deaths and total deaths in correlation to ICU-patients in the USA

In [32]:
# Pearson correlation of new_deaths vs. icu_patients (USA rows only).
df = data_USA.loc[:, ['new_deaths', 'icu_patients']]
corr = df.corr(method='pearson')
# Fixed [-1, 1] colour range keeps the shading comparable between tables.
corr.style.background_gradient(vmin=-1, vmax=1, cmap='coolwarm')

Unnamed: 0,new_deaths,icu_patients
new_deaths,1.0,0.814095
icu_patients,0.814095,1.0


In [33]:
# Pearson correlation of total_deaths vs. icu_patients (USA rows only).
df = data_USA.loc[:, ['total_deaths', 'icu_patients']]
corr = df.corr(method='pearson')
# Fixed [-1, 1] colour range keeps the shading comparable between tables.
corr.style.background_gradient(vmin=-1, vmax=1, cmap='coolwarm')

Unnamed: 0,total_deaths,icu_patients
total_deaths,1.0,-0.210298
icu_patients,-0.210298,1.0


## New cases and total cases in correlation to stringency-index in the Netherlands

In [243]:
# Pearson correlation of new_cases vs. stringency_index (NLD rows only).
df = data_NLD.loc[:, ['new_cases', 'stringency_index']]
corr = df.corr(method='pearson')
# Fixed [-1, 1] colour range keeps the shading comparable between tables.
corr.style.background_gradient(vmin=-1, vmax=1, cmap='coolwarm')

Unnamed: 0,new_cases,stringency_index
new_cases,1.0,0.410543
stringency_index,0.410543,1.0


In [244]:
# Pearson correlation of total_cases vs. stringency_index (NLD rows only).
df = data_NLD.loc[:, ['total_cases', 'stringency_index']]
corr = df.corr(method='pearson')
# Fixed [-1, 1] colour range keeps the shading comparable between tables.
corr.style.background_gradient(vmin=-1, vmax=1, cmap='coolwarm')

Unnamed: 0,total_cases,stringency_index
total_cases,1.0,0.457943
stringency_index,0.457943,1.0


## New cases and total cases in correlation to stringency-index in India

In [246]:
# Pearson correlation of new_cases vs. stringency_index (IND rows only).
df = data_IND.loc[:, ['new_cases', 'stringency_index']]
corr = df.corr(method='pearson')
# Fixed [-1, 1] colour range keeps the shading comparable between tables.
corr.style.background_gradient(vmin=-1, vmax=1, cmap='coolwarm')

Unnamed: 0,new_cases,stringency_index
new_cases,1.0,0.159435
stringency_index,0.159435,1.0


In [247]:
# Pearson correlation of total_cases vs. stringency_index (IND rows only).
df = data_IND.loc[:, ['total_cases', 'stringency_index']]
corr = df.corr(method='pearson')
# Fixed [-1, 1] colour range keeps the shading comparable between tables.
corr.style.background_gradient(vmin=-1, vmax=1, cmap='coolwarm')

Unnamed: 0,total_cases,stringency_index
total_cases,1.0,0.054831
stringency_index,0.054831,1.0


## New cases and total cases in correlation to stringency-index in the USA

In [125]:
# Pearson correlation of new_cases vs. stringency_index (USA rows only).
df = data_USA.loc[:, ['new_cases', 'stringency_index']]
corr = df.corr(method='pearson')
# Fixed [-1, 1] colour range keeps the shading comparable between tables.
corr.style.background_gradient(vmin=-1, vmax=1, cmap='coolwarm')

Unnamed: 0,new_cases,stringency_index
new_cases,1.0,0.437947
stringency_index,0.437947,1.0


In [249]:
# Pearson correlation of total_cases vs. stringency_index (USA rows only).
df = data_USA.loc[:, ['total_cases', 'stringency_index']]
corr = df.corr(method='pearson')
# Fixed [-1, 1] colour range keeps the shading comparable between tables.
corr.style.background_gradient(vmin=-1, vmax=1, cmap='coolwarm')

Unnamed: 0,total_cases,stringency_index
total_cases,1.0,0.132569
stringency_index,0.132569,1.0


## New cases and total cases in correlation to stringency-index in Brazil

In [126]:
# Pearson correlation of new_cases vs. stringency_index (BRA rows only).
df = data_BRA.loc[:, ['new_cases', 'stringency_index']]
corr = df.corr(method='pearson')
# Fixed [-1, 1] colour range keeps the shading comparable between tables.
corr.style.background_gradient(vmin=-1, vmax=1, cmap='coolwarm')

Unnamed: 0,new_cases,stringency_index
new_cases,1.0,0.106676
stringency_index,0.106676,1.0


In [251]:
# Pearson correlation of total_cases vs. stringency_index (BRA rows only).
df = data_BRA.loc[:, ['total_cases', 'stringency_index']]
corr = df.corr(method='pearson')
# Fixed [-1, 1] colour range keeps the shading comparable between tables.
corr.style.background_gradient(vmin=-1, vmax=1, cmap='coolwarm')

Unnamed: 0,total_cases,stringency_index
total_cases,1.0,-0.118439
stringency_index,-0.118439,1.0


## New cases and total cases in correlation to stringency-index in Niger

In [127]:
# Pearson correlation of new_cases vs. stringency_index (NER rows only).
df = data_NER.loc[:, ['new_cases', 'stringency_index']]
corr = df.corr(method='pearson')
# Fixed [-1, 1] colour range keeps the shading comparable between tables.
corr.style.background_gradient(vmin=-1, vmax=1, cmap='coolwarm')

Unnamed: 0,new_cases,stringency_index
new_cases,1.0,0.185808
stringency_index,0.185808,1.0


In [253]:
# Pearson correlation of total_cases vs. stringency_index (NER rows only).
df = data_NER.loc[:, ['total_cases', 'stringency_index']]
corr = df.corr(method='pearson')
# Fixed [-1, 1] colour range keeps the shading comparable between tables.
corr.style.background_gradient(vmin=-1, vmax=1, cmap='coolwarm')

Unnamed: 0,total_cases,stringency_index
total_cases,1.0,-0.09231
stringency_index,-0.09231,1.0


## New deaths and total deaths in correlation to stringency-index in the Netherlands

In [128]:
# Pearson correlation of new_deaths vs. stringency_index (NLD rows only).
df = data_NLD.loc[:, ['new_deaths', 'stringency_index']]
corr = df.corr(method='pearson')
# Fixed [-1, 1] colour range keeps the shading comparable between tables.
corr.style.background_gradient(vmin=-1, vmax=1, cmap='coolwarm')

Unnamed: 0,new_deaths,stringency_index
new_deaths,1.0,0.565288
stringency_index,0.565288,1.0


In [255]:
# Pearson correlation of total_deaths vs. stringency_index (NLD rows only).
df = data_NLD.loc[:, ['total_deaths', 'stringency_index']]
corr = df.corr(method='pearson')
# Fixed [-1, 1] colour range keeps the shading comparable between tables.
corr.style.background_gradient(vmin=-1, vmax=1, cmap='coolwarm')

Unnamed: 0,total_deaths,stringency_index
total_deaths,1.0,0.428466
stringency_index,0.428466,1.0


## New deaths and total deaths in correlation to stringency-index in India

In [129]:
# Pearson correlation of new_deaths vs. stringency_index (IND rows only).
df = data_IND.loc[:, ['new_deaths', 'stringency_index']]
corr = df.corr(method='pearson')
# Fixed [-1, 1] colour range keeps the shading comparable between tables.
corr.style.background_gradient(vmin=-1, vmax=1, cmap='coolwarm')

Unnamed: 0,new_deaths,stringency_index
new_deaths,1.0,0.12373
stringency_index,0.12373,1.0


In [256]:
# Pearson correlation of total_deaths vs. stringency_index (IND rows only).
df = data_IND.loc[:, ['total_deaths', 'stringency_index']]
corr = df.corr(method='pearson')
# Fixed [-1, 1] colour range keeps the shading comparable between tables.
corr.style.background_gradient(vmin=-1, vmax=1, cmap='coolwarm')

Unnamed: 0,total_deaths,stringency_index
total_deaths,1.0,-0.382255
stringency_index,-0.382255,1.0


## New deaths and total deaths in correlation to stringency-index in the USA

In [130]:
# Pearson correlation of new_deaths vs. stringency_index (USA rows only).
df = data_USA.loc[:, ['new_deaths', 'stringency_index']]
corr = df.corr(method='pearson')
# Fixed [-1, 1] colour range keeps the shading comparable between tables.
corr.style.background_gradient(vmin=-1, vmax=1, cmap='coolwarm')

Unnamed: 0,new_deaths,stringency_index
new_deaths,1.0,0.481009
stringency_index,0.481009,1.0


In [257]:
# Pearson correlation of total_deaths vs. stringency_index (USA rows only).
df = data_USA.loc[:, ['total_deaths', 'stringency_index']]
corr = df.corr(method='pearson')
# Fixed [-1, 1] colour range keeps the shading comparable between tables.
corr.style.background_gradient(vmin=-1, vmax=1, cmap='coolwarm')

Unnamed: 0,total_deaths,stringency_index
total_deaths,1.0,-0.193791
stringency_index,-0.193791,1.0


## New deaths and total deaths in correlation to stringency-index in Brazil

In [131]:
# Pearson correlation of new_deaths vs. stringency_index (BRA rows only).
df = data_BRA.loc[:, ['new_deaths', 'stringency_index']]
corr = df.corr(method='pearson')
# Fixed [-1, 1] colour range keeps the shading comparable between tables.
corr.style.background_gradient(vmin=-1, vmax=1, cmap='coolwarm')

Unnamed: 0,new_deaths,stringency_index
new_deaths,1.0,-0.109759
stringency_index,-0.109759,1.0


In [258]:
# Pearson correlation of total_deaths vs. stringency_index (BRA rows only).
df = data_BRA.loc[:, ['total_deaths', 'stringency_index']]
corr = df.corr(method='pearson')
# Fixed [-1, 1] colour range keeps the shading comparable between tables.
corr.style.background_gradient(vmin=-1, vmax=1, cmap='coolwarm')

Unnamed: 0,total_deaths,stringency_index
total_deaths,1.0,-0.592783
stringency_index,-0.592783,1.0


## New deaths and total deaths in correlation to stringency-index in Niger

In [132]:
# Pearson correlation of new_deaths vs. stringency_index (NER rows only).
df = data_NER.loc[:, ['new_deaths', 'stringency_index']]
corr = df.corr(method='pearson')
# Fixed [-1, 1] colour range keeps the shading comparable between tables.
corr.style.background_gradient(vmin=-1, vmax=1, cmap='coolwarm')

Unnamed: 0,new_deaths,stringency_index
new_deaths,1.0,0.299162
stringency_index,0.299162,1.0


In [259]:
# Pearson correlation of total_deaths vs. stringency_index (NER rows only).
df = data_NER.loc[:, ['total_deaths', 'stringency_index']]
corr = df.corr(method='pearson')
# Fixed [-1, 1] colour range keeps the shading comparable between tables.
corr.style.background_gradient(vmin=-1, vmax=1, cmap='coolwarm')

Unnamed: 0,total_deaths,stringency_index
total_deaths,1.0,-0.187062
stringency_index,-0.187062,1.0


## New cases and total cases in correlation to hospital patients in the Netherlands

In [133]:
# Pearson correlation of new_cases vs. hosp_patients (NLD rows only).
df = data_NLD.loc[:, ['new_cases', 'hosp_patients']]
corr = df.corr(method='pearson')
# Fixed [-1, 1] colour range keeps the shading comparable between tables.
corr.style.background_gradient(vmin=-1, vmax=1, cmap='coolwarm')

Unnamed: 0,new_cases,hosp_patients
new_cases,1.0,0.534663
hosp_patients,0.534663,1.0


In [260]:
# Pearson correlation of total_cases vs. hosp_patients (NLD rows only).
df = data_NLD.loc[:, ['total_cases', 'hosp_patients']]
corr = df.corr(method='pearson')
# Fixed [-1, 1] colour range keeps the shading comparable between tables.
corr.style.background_gradient(vmin=-1, vmax=1, cmap='coolwarm')

Unnamed: 0,total_cases,hosp_patients
total_cases,1.0,0.335063
hosp_patients,0.335063,1.0


## New cases and total cases in correlation to hospital patients in the USA

In [135]:
# Pearson correlation of new_cases vs. hosp_patients (USA rows only).
df = data_USA.loc[:, ['new_cases', 'hosp_patients']]
corr = df.corr(method='pearson')
# Fixed [-1, 1] colour range keeps the shading comparable between tables.
corr.style.background_gradient(vmin=-1, vmax=1, cmap='coolwarm')

Unnamed: 0,new_cases,hosp_patients
new_cases,1.0,0.938287
hosp_patients,0.938287,1.0


In [261]:
# Pearson correlation of total_cases vs. hosp_patients (USA rows only).
df = data_USA.loc[:, ['total_cases', 'hosp_patients']]
corr = df.corr(method='pearson')
# Fixed [-1, 1] colour range keeps the shading comparable between tables.
corr.style.background_gradient(vmin=-1, vmax=1, cmap='coolwarm')

Unnamed: 0,total_cases,hosp_patients
total_cases,1.0,-0.036164
hosp_patients,-0.036164,1.0


## New deaths and total deaths in correlation to hospital patients in the Netherlands

In [34]:
# Pearson correlation of new_deaths vs. hosp_patients (NLD rows only).
df = data_NLD.loc[:, ['new_deaths', 'hosp_patients']]
corr = df.corr(method='pearson')
# Fixed [-1, 1] colour range keeps the shading comparable between tables.
corr.style.background_gradient(vmin=-1, vmax=1, cmap='coolwarm')

Unnamed: 0,new_deaths,hosp_patients
new_deaths,1.0,0.751637
hosp_patients,0.751637,1.0


In [35]:
# Pearson correlation of total_deaths vs. hosp_patients (NLD rows only).
df = data_NLD.loc[:, ['total_deaths', 'hosp_patients']]
corr = df.corr(method='pearson')
# Fixed [-1, 1] colour range keeps the shading comparable between tables.
corr.style.background_gradient(vmin=-1, vmax=1, cmap='coolwarm')

Unnamed: 0,total_deaths,hosp_patients
total_deaths,1.0,0.206025
hosp_patients,0.206025,1.0


## New deaths and total deaths in correlation to hospital patients in the USA

In [36]:
# Pearson correlation of new_deaths vs. hosp_patients (USA rows only).
df = data_USA.loc[:, ['new_deaths', 'hosp_patients']]
corr = df.corr(method='pearson')
# Fixed [-1, 1] colour range keeps the shading comparable between tables.
corr.style.background_gradient(vmin=-1, vmax=1, cmap='coolwarm')

Unnamed: 0,new_deaths,hosp_patients
new_deaths,1.0,0.81647
hosp_patients,0.81647,1.0


In [37]:
# Pearson correlation of total_deaths vs. hosp_patients (USA rows only).
df = data_USA.loc[:, ['total_deaths', 'hosp_patients']]
corr = df.corr(method='pearson')
# Fixed [-1, 1] colour range keeps the shading comparable between tables.
corr.style.background_gradient(vmin=-1, vmax=1, cmap='coolwarm')

Unnamed: 0,total_deaths,hosp_patients
total_deaths,1.0,-0.135868
hosp_patients,-0.135868,1.0
