In [1]:
import numpy as np
import pandas as pd

# 1. Data

### 1.1. OxCGRT Data

In [2]:
# Load the full Covid-19 policy/case table; the first CSV column becomes the index.
data = pd.read_csv(
    '../Data/Covid19_All_20210710.csv',
    index_col=0,
    low_memory=False,
)

### 1.2. Continent Data

In [3]:
# Load the continent lookup table and keep only the continent name and the
# three-letter country code, renamed so the code column is called
# 'CountryCode' (the key the merge with the main table joins on).
continent = pd.read_csv('../Data/continent_data.csv', low_memory=False, index_col=0)
continent = continent[['Continent_Name', 'Three_Letter_Country_Code']].rename(
    columns={'Continent_Name': 'ContinentName',
             'Three_Letter_Country_Code': 'CountryCode'})

# add Kosovo
# NOTE(review): presumably code 'RKS' is missing from the continent file - confirm.
# DataFrame.append was deprecated in pandas 1.4 and removed in 2.0; pd.concat
# with ignore_index=True appends the row and renumbers the index the same way.
continent = pd.concat(
    [continent, pd.DataFrame([{'ContinentName': 'Europe', 'CountryCode': 'RKS'}])],
    ignore_index=True,
)

# 2. Merge

In [4]:
# Attach a ContinentName to every row of the main table via its CountryCode.
# A left join keeps rows whose code has no match (ContinentName is NaN there).
# NOTE(review): if `continent` lists a CountryCode more than once, the matching
# rows of `data` are repeated in the result - confirm the lookup is unique per code.
data_merged = pd.merge(data, continent, on='CountryCode', how='left')

# 3. Filtering

In [5]:
# Columns kept for the per-continent extracts, grouped by indicator family.
cols = (
    # identifiers
    ['CountryName', 'ContinentName', 'RegionName', 'Date']
    # C* indicators
    + [
        'C1_School closing',
        'C2_Workplace closing',
        'C3_Cancel public events',
        'C4_Restrictions on gatherings',
        'C5_Close public transport',
        'C6_Stay at home requirements',
        'C7_Restrictions on internal movement',
        'C8_International travel controls',
    ]
    # E* indicators
    + [
        'E1_Income support',
        'E2_Debt/contract relief',
        'E3_Fiscal measures',
        'E4_International support',
    ]
    # H* indicators
    + [
        'H1_Public information campaigns',
        'H2_Testing policy',
        'H3_Contact tracing',
        'H4_Emergency investment in healthcare',
        'H5_Investment in vaccines',
        'H6_Facial Coverings',
        'H7_Vaccination policy',
        'H8_Protection of elderly people',
    ]
    # outcome counts
    + ['ConfirmedCases', 'ConfirmedDeaths']
)

### Asia

In [6]:
# Rows whose ContinentName is 'Asia', restricted to the columns listed in `cols`.
asia = data_merged.loc[data_merged['ContinentName'].eq('Asia'), cols]

In [11]:
# Preview five randomly drawn rows (no seed is set, so the rows differ per run).
asia.sample(n=5)

Unnamed: 0,CountryName,ContinentName,RegionName,Date,C1_School closing,C2_Workplace closing,C3_Cancel public events,C4_Restrictions on gatherings,C5_Close public transport,C6_Stay at home requirements,...,H1_Public information campaigns,H2_Testing policy,H3_Contact tracing,H4_Emergency investment in healthcare,H5_Investment in vaccines,H6_Facial Coverings,H7_Vaccination policy,H8_Protection of elderly people,ConfirmedCases,ConfirmedDeaths
89164,Israel,Asia,,2020-02-14,0.0,0.0,0.0,0.0,0.0,0.0,...,2.0,1.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0
90909,Jordan,Asia,,2020-04-28,3.0,2.0,2.0,4.0,2.0,2.0,...,2.0,2.0,1.0,0.0,0.0,0.0,0.0,2.0,449.0,8.0
49316,China,Asia,Jiangsu,2020-10-27,0.0,1.0,1.0,1.0,1.0,1.0,...,2.0,2.0,2.0,0.0,0.0,3.0,0.0,2.0,670.0,0.0
137358,Timor-Leste,Asia,,2020-12-02,1.0,0.0,0.0,0.0,0.0,2.0,...,2.0,3.0,2.0,0.0,0.0,3.0,0.0,0.0,31.0,0.0
48399,China,Asia,Hunan,2021-05-12,1.0,1.0,1.0,0.0,0.0,0.0,...,2.0,3.0,2.0,0.0,0.0,2.0,4.0,1.0,1046.0,4.0


In [13]:
# Save the Asia extract (index included) to a CSV in the working directory.
asia.to_csv(path_or_buf='Asia_covid19_20210710.csv')

### Europe

In [7]:
# Rows whose ContinentName is 'Europe', restricted to the columns listed in `cols`.
europe = data_merged.loc[data_merged['ContinentName'].eq('Europe'), cols]

In [12]:
# Preview five randomly drawn rows (no seed is set, so the rows differ per run).
europe.sample(n=5)

Unnamed: 0,CountryName,ContinentName,RegionName,Date,C1_School closing,C2_Workplace closing,C3_Cancel public events,C4_Restrictions on gatherings,C5_Close public transport,C6_Stay at home requirements,...,H1_Public information campaigns,H2_Testing policy,H3_Contact tracing,H4_Emergency investment in healthcare,H5_Investment in vaccines,H6_Facial Coverings,H7_Vaccination policy,H8_Protection of elderly people,ConfirmedCases,ConfirmedDeaths
106145,Malta,Europe,,2020-11-11,1.0,2.0,2.0,4.0,0.0,0.0,...,2.0,3.0,2.0,,,4.0,0.0,2.0,7537.0,88.0
4783,Austria,Europe,,2020-11-23,3.0,3.0,2.0,4.0,1.0,2.0,...,2.0,3.0,2.0,0.0,0.0,3.0,0.0,3.0,250333.0,2459.0
89109,Iceland,Europe,,2021-06-30,2.0,0.0,0.0,0.0,0.0,0.0,...,2.0,3.0,2.0,0.0,0.0,0.0,5.0,0.0,6555.0,29.0
77803,Georgia,Europe,,2020-07-09,3.0,2.0,2.0,4.0,0.0,1.0,...,2.0,2.0,2.0,0.0,0.0,2.0,0.0,1.0,968.0,15.0
132251,Sweden,Europe,,2020-08-30,1.0,1.0,2.0,3.0,1.0,1.0,...,2.0,2.0,1.0,0.0,0.0,0.0,0.0,3.0,83958.0,5821.0


In [14]:
# Save the Europe extract (index included) to a CSV in the working directory.
europe.to_csv(path_or_buf='Europe_covid19_20210710.csv')

### USA

In [11]:
# Rows whose CountryName is 'United States'. Unlike the continent extracts,
# no column subset is applied here, so every column of data_merged is kept.
usa = data_merged.loc[data_merged['CountryName'].eq('United States')]

In [18]:
# Preview five randomly drawn rows (no seed is set, so the rows differ per run).
usa.sample(n=5)

Unnamed: 0,CountryName,CountryCode,RegionName,RegionCode,Jurisdiction,Date,C1_School closing,C1_Flag,C2_Workplace closing,C2_Flag,...,StringencyIndexForDisplay,StringencyLegacyIndex,StringencyLegacyIndexForDisplay,GovernmentResponseIndex,GovernmentResponseIndexForDisplay,ContainmentHealthIndex,ContainmentHealthIndexForDisplay,EconomicSupportIndex,EconomicSupportIndexForDisplay,ContinentName
151961,United States,USA,Illinois,US_IL,STATE_TOTAL,2021-04-02,2.0,0.0,1.0,1.0,...,51.85,58.33,58.33,60.78,60.78,60.54,60.54,62.5,62.5,North America
153714,United States,USA,Kentucky,US_KY,STATE_TOTAL,2021-06-23,,,1.0,1.0,...,34.26,51.19,51.19,,,39.88,39.88,,,North America
163562,United States,USA,Ohio,US_OH,STATE_TOTAL,2020-12-27,2.0,0.0,1.0,1.0,...,58.33,64.29,64.29,61.35,61.35,64.76,64.76,37.5,37.5,North America
157800,United States,USA,Mississippi,US_MS,STATE_TOTAL,2020-06-18,3.0,1.0,1.0,1.0,...,62.96,76.9,76.9,57.55,57.55,56.85,56.85,62.5,62.5,North America
153849,United States,USA,Louisiana,US_LA,STATE_TOTAL,2020-04-27,3.0,1.0,2.0,1.0,...,75.93,79.76,79.76,65.89,65.89,62.8,62.8,87.5,87.5,North America


In [19]:
# Save the United States extract (index included) alongside the input data files.
usa.to_csv(path_or_buf='../Data/Covid19_USA.csv')