# R-Initialization

### R-Package Download

In [18]:
library(ggplot2) # For Plot Visualizations
library(car) # For Variance Inflation Factor function -- vif()
library(corrplot) # For Correlation Visualizations
library(data.table) # For Complex Data Frame Joins

# Data Initialization

### Data Download

In [23]:
# All four data sets are CSV files published in the "Our World in Data"
# covid-19-data repository; only the path below this base URL differs.
owid_data_url <- "https://raw.githubusercontent.com/owid/covid-19-data/master/public/data"

# Downloading Vaccination Data
vaccinations <- read.csv(
  file.path(owid_data_url, "vaccinations", "vaccinations.csv")
)

# Downloading Testing Data
testing <- read.csv(
  file.path(owid_data_url, "testing", "covid-testing-all-observations.csv")
)

# Downloading Hospitalization Data
hospitalization <- read.csv(
  file.path(owid_data_url, "hospitalizations", "covid-hospitalizations.csv")
)

# Downloading Cases and Deaths Data (JHU)
deaths <- read.csv(
  file.path(owid_data_url, "jhu", "full_data.csv")
)



In [24]:
# Preview the first six rows of each downloaded data set to check its
# columns and layout.
head(vaccinations, n = 6L)
head(testing, n = 6L)
head(hospitalization, n = 6L)
head(deaths, n = 6L)

location,iso_code,date,total_vaccinations,people_vaccinated,people_fully_vaccinated,total_boosters,daily_vaccinations_raw,daily_vaccinations,total_vaccinations_per_hundred,people_vaccinated_per_hundred,people_fully_vaccinated_per_hundred,total_boosters_per_hundred,daily_vaccinations_per_million,daily_people_vaccinated,daily_people_vaccinated_per_hundred
Afghanistan,AFG,2021-02-22,0.0,0.0,,,,,0.0,0.0,,,,,
Afghanistan,AFG,2021-02-23,,,,,,1367.0,,,,,33.0,1367.0,0.003
Afghanistan,AFG,2021-02-24,,,,,,1367.0,,,,,33.0,1367.0,0.003
Afghanistan,AFG,2021-02-25,,,,,,1367.0,,,,,33.0,1367.0,0.003
Afghanistan,AFG,2021-02-26,,,,,,1367.0,,,,,33.0,1367.0,0.003
Afghanistan,AFG,2021-02-27,,,,,,1367.0,,,,,33.0,1367.0,0.003


Entity,ISO.code,Date,Source.URL,Source.label,Notes,Cumulative.total,Daily.change.in.cumulative.total,Cumulative.total.per.thousand,Daily.change.in.cumulative.total.per.thousand,X7.day.smoothed.daily.change,X7.day.smoothed.daily.change.per.thousand,Short.term.positive.rate,Short.term.tests.per.case
Afghanistan - tests performed,AFG,2022-01-29,http://www.emro.who.int/images/stories/coronavirus/covid-sitrep-28.pdf,WHO Regional Office for the Eastern Mediterranean,,853003.0,,21.272,,,,,
Afghanistan - tests performed,AFG,2022-01-30,,,,,,,,,,,
Afghanistan - tests performed,AFG,2022-01-31,,,,,,,,,,,
Afghanistan - tests performed,AFG,2022-02-01,,,,,,,,,,,
Afghanistan - tests performed,AFG,2022-02-02,,,,,,,,,,,
Afghanistan - tests performed,AFG,2022-02-03,,,,,,,,,,,


entity,iso_code,date,indicator,value
Algeria,DZA,2020-07-17,Daily ICU occupancy,62.0
Algeria,DZA,2020-07-17,Daily ICU occupancy per million,1.381
Algeria,DZA,2020-07-18,Daily ICU occupancy,67.0
Algeria,DZA,2020-07-18,Daily ICU occupancy per million,1.492
Algeria,DZA,2020-07-20,Daily ICU occupancy,64.0
Algeria,DZA,2020-07-20,Daily ICU occupancy per million,1.425


date,location,new_cases,new_deaths,total_cases,total_deaths,weekly_cases,weekly_deaths,biweekly_cases,biweekly_deaths
2020-02-24,Afghanistan,5,,5,,,,,
2020-02-25,Afghanistan,0,,5,,,,,
2020-02-26,Afghanistan,0,,5,,,,,
2020-02-27,Afghanistan,0,,5,,,,,
2020-02-28,Afghanistan,0,,5,,,,,
2020-02-29,Afghanistan,0,,5,,5.0,,,


### Data Cleanup

In [26]:
# Derive a `location` column from `Entity` by removing the " - <description>"
# suffix (e.g. "Afghanistan - tests performed" -> "Afghanistan").
# The pattern anchors on the " - " separator rather than on the first space,
# so a multi-word name such as "United States" is kept whole instead of
# being truncated to its first word.
testing <- transform(testing, location = sub(" - .*", "", Entity))

head(testing)

Entity,ISO.code,Date,Source.URL,Source.label,Notes,Cumulative.total,Daily.change.in.cumulative.total,Cumulative.total.per.thousand,Daily.change.in.cumulative.total.per.thousand,X7.day.smoothed.daily.change,X7.day.smoothed.daily.change.per.thousand,Short.term.positive.rate,Short.term.tests.per.case,location
Afghanistan - tests performed,AFG,2022-01-29,http://www.emro.who.int/images/stories/coronavirus/covid-sitrep-28.pdf,WHO Regional Office for the Eastern Mediterranean,,853003.0,,21.272,,,,,,Afghanistan
Afghanistan - tests performed,AFG,2022-01-30,,,,,,,,,,,,Afghanistan
Afghanistan - tests performed,AFG,2022-01-31,,,,,,,,,,,,Afghanistan
Afghanistan - tests performed,AFG,2022-02-01,,,,,,,,,,,,Afghanistan
Afghanistan - tests performed,AFG,2022-02-02,,,,,,,,,,,,Afghanistan
Afghanistan - tests performed,AFG,2022-02-03,,,,,,,,,,,,Afghanistan


# Data Analyses

### Method 1:

We are looking purely at deaths as a function of everything else: `Date`, `Location`, `Daily Testing`, and `Daily ICU Occupancy`. We look at each of these as a density, to allow for better comparison between countries of different population magnitudes. We merge our data into a single set:

In [13]:
# Build the Method 1 data set.
# Both data frames are converted to data.tables by reference, then each
# vaccinations row is matched to the deaths row with the same location and
# date; vaccinations rows without a match are kept with NA death columns.
setDT(deaths)
setDT(vaccinations)
data.method1 <- deaths[vaccinations, on = c("location", "date")]
head(data.method1, n = 6L)

date,location,new_cases,new_deaths,total_cases,total_deaths,weekly_cases,weekly_deaths,biweekly_cases,biweekly_deaths,...,total_boosters,daily_vaccinations_raw,daily_vaccinations,total_vaccinations_per_hundred,people_vaccinated_per_hundred,people_fully_vaccinated_per_hundred,total_boosters_per_hundred,daily_vaccinations_per_million,daily_people_vaccinated,daily_people_vaccinated_per_hundred
2021-02-22,Afghanistan,13,1,55617,2433,103,6,258,20,...,,,,0.0,0.0,,,,,
2021-02-23,Afghanistan,29,2,55646,2435,128,7,262,21,...,,,1367.0,,,,,33.0,1367.0,0.003
2021-02-24,Afghanistan,18,1,55664,2436,124,8,262,18,...,,,1367.0,,,,,33.0,1367.0,0.003
2021-02-25,Afghanistan,16,2,55680,2438,123,8,260,19,...,,,1367.0,,,,,33.0,1367.0,0.003
2021-02-26,Afghanistan,16,4,55696,2442,121,12,251,18,...,,,1367.0,,,,,33.0,1367.0,0.003
2021-02-27,Afghanistan,11,1,55707,2443,127,13,234,16,...,,,1367.0,,,,,33.0,1367.0,0.003


In [19]:
# Quick check of the pattern " .*": it matches from the first space to the
# end of the string, so only the first word ("howdy") remains.
sub(pattern = " .*", replacement = "", x = "howdy partner")