In [1]:
import pandas as pd
import datetime

from data_helpers import load_data, clean_data, export_data
from stats_helpers import growth_factor_for_region, cfr_for_region, lin_reg_for_time_series, new_cases_per_region

# URL template for the global time-series CSVs in the CSSEGISandData/COVID-19
# GitHub repository. The `{}` placeholder is presumably filled in by load_data
# with the series name (e.g. 'confirmed', 'deaths', 'recovered') -- TODO confirm
# against data_helpers.
DATA_BASE_URL = 'https://raw.githubusercontent.com/CSSEGISandData/COVID-19/master/csse_covid_19_data/csse_covid_19_time_series/time_series_covid19_{}_global.csv'

In [2]:
# Load the raw series from the upstream URL template, then pass each one
# through clean_data while keeping the keys that load_data returned.
raw_data = load_data(DATA_BASE_URL)
data = {
    series_name: clean_data(series_frame)
    for series_name, series_frame in raw_data.items()
}

In [3]:
def compile_set_for_region(data, region):
    """Assemble the export record for a single region.

    Args:
        data: Mapping that provides at least the 'confirmed', 'deaths' and
            'recovered' entries, each of which is indexed by ``region``. It
            is also handed unchanged to the stats helpers.
        region: Label used to select the region from each entry.

    Returns:
        dict with the keys 'confirmed', 'new', 'deaths', 'recovered',
        'growth_rate', 'cfr' and 'cfr_lin_reg' (in that order).
    """
    record = {}

    # Raw series and the helper-derived new-case figures.
    record['confirmed'] = data['confirmed'][region]
    record['new'] = new_cases_per_region(data, region)
    record['deaths'] = data['deaths'][region]
    record['recovered'] = data['recovered'][region]

    # Derived statistics computed by stats_helpers.
    record['growth_rate'] = growth_factor_for_region(data, region)
    record['cfr'] = cfr_for_region(data, region)

    # The regression is fitted on the CFR series computed with t=7, not on
    # the default-parameter CFR stored under 'cfr'.
    cfr_t7 = cfr_for_region(data, region, t=7)
    record['cfr_lin_reg'] = lin_reg_for_time_series(cfr_t7)

    return record

In [4]:
# Region labels are taken from the index of the transposed 'confirmed' table;
# one export record is compiled per label.
regions = data['confirmed'].T.index
out = {
    region_name: compile_set_for_region(data, region_name)
    for region_name in regions
}

In [5]:
# Build a date-stamped file name (today's local date as YYYYMMDD).
today = datetime.date.today()
ts = today.strftime('%Y%m%d')
filename = '{}_covid19_data.json'.format(ts)

# Wrap the per-region dict in a Series so pandas performs the JSON export.
export_series = pd.Series(out)
export_series.to_json(filename, orient='columns')

print('Exported all aggregated data [ {} ].'.format(filename))

Exported all aggregated data [ 20200809_covid19_data.json ].
