In [None]:
import pandas as pd

# Show every column when rendering wide DataFrames (None removes the column limit)
pd.options.display.max_columns = None

In [None]:
# Directory containing the input data files. File names are appended with
# plain string concatenation, so the trailing slash must be kept.
DATA_PATH = "./data/"

# Interventions

This dataset contains a series of important dates associated with the pandemic for different countries.

We augment the dataset by adding two columns: how long it took for the first measure to be imposed after the first case, and how long the period of abnormal mobility lasted. These values indicate how quickly governments responded and for how long their measures remained in effect.

In [None]:
interventions = (
    pd.read_csv(DATA_PATH + "interventions.csv", index_col="lang")
    # Convert all columns to datetime
    .apply(pd.to_datetime)
    .assign(
        **{
            # Delay between the date of the 1st case and the earliest of the
            # imposed measures (school closure, public events ban, lockdown)
            "Response time": lambda dates: (
                dates[["School closure", "Public events banned", "Lockdown"]].min(axis=1)
                - dates["1st case"]
            ),
            # Length of the abnormal mobility period
            "Reduced mobility": lambda dates: dates["Normalcy"] - dates["Mobility"],
        }
    )
)

interventions

# Google Mobility Data

In [None]:
# Load the gzip-compressed Google mobility report, parsing "date" as datetime.
# low_memory=False makes pandas read the file in one pass rather than in chunks.
mobility_data = pd.read_csv(
    filepath_or_buffer=DATA_PATH + "Global_Mobility_Report.csv.gz",
    parse_dates=["date"],
    low_memory=False,
)

# Preview the first rows
mobility_data.head()

# Apple Mobility Data

In [None]:
# Load the Apple mobility trends file, indexed by (region, transportation_type)
transport_data = pd.read_csv(
    filepath_or_buffer=DATA_PATH + "applemobilitytrends-2020-04-20.csv.gz",
    index_col=["region", "transportation_type"],
)

# Preview the first rows
transport_data.head()

# Wikipedia Page Topics

In [None]:
# Load the xz-compressed topics table, using its "index" column as the row index
topics_linked = pd.read_csv(
    filepath_or_buffer=DATA_PATH + "topics_linked.csv.xz",
    index_col="index",
)

# Preview the first rows
topics_linked.head()

# Aggregated Time Series of Wikipedia Pageviews

In [None]:
# Load the gzip-compressed JSON file of aggregated pageview time series
pageviews = pd.read_json(
    path_or_buf=DATA_PATH + "aggregated_timeseries.json.gz",
)

pageviews