# Setup

In [1]:
# Notebook-wide switch passed as `log=` to the per-country plots below;
# set to True to draw their y-axis on a logarithmic scale.
LOG_PLOT = False

In [2]:
%matplotlib notebook
from matplotlib import pyplot as plt
plt.style.use('seaborn-darkgrid')
import os
from helper import *
df = ecdc()
df_at = at()
def country_name(geoId):
    """Return the display name for the country identified by ``geoId``.

    Takes the first row of the module-level ``df`` whose ``geoId`` column
    equals the argument and returns its ``countriesAndTerritories`` value
    with underscores replaced by spaces. An unknown ``geoId`` yields no
    rows, so the positional lookup raises ``IndexError``.
    """
    matching_rows = df[df.geoId == geoId]
    raw_name = matching_rows.iloc[0].countriesAndTerritories
    return raw_name.replace('_', ' ')

# List the columns of the ECDC frame for reference when reading the cells below.
print(df.columns)

Index(['dateRep', 'day', 'month', 'year', 'cases', 'deaths',
       'countriesAndTerritories', 'geoId', 'countryterritoryCode',
       'popData2019', 'continentExp',
       'Cumulative_number_for_14_days_of_COVID-19_cases_per_100000'],
      dtype='object')


## ECDC Data

In [3]:


def plot_selection(selection, roll_days=7, log=False):
    """Plot recorded daily cases and their rolling mean for one country.

    Parameters
    ----------
    selection : DataFrame
        Rows to plot, in plotting order. Must provide the ``dateRep``,
        ``cases`` and ``countriesAndTerritories`` columns; the title is
        taken from the first row.
    roll_days : int, default 7
        Window length of the rolling mean drawn over the bars.
    log : bool, default False
        Use a logarithmic y-axis.

    Returns
    -------
    matplotlib.figure.Figure
        The newly created figure.

    Raises
    ------
    ValueError
        If ``selection`` has no rows.
    """
    # Check up front so an empty selection does not leave a blank figure behind.
    if selection.empty:
        raise ValueError('selection is empty; nothing to plot')

    f, ax = plt.subplots()
    ax.plot(selection.dateRep, selection['cases'].rolling(roll_days).mean(),
            label=f'{roll_days} day average', marker='o', markersize=4,
            linestyle='--')
    ax.xaxis.set_major_locator(plt.MaxNLocator(20))
    # Explicit Axes calls: the result no longer depends on which figure pyplot
    # currently considers active.
    ax.tick_params(axis='x', labelrotation=45)
    ax.bar(selection.dateRep, selection['cases'], label='recorded',
           alpha=0.6, color='C1')
    ax.legend(loc='best')
    if log:
        ax.set_yscale('log')

    ax.set_title(selection.iloc[0].countriesAndTerritories.replace('_', ' '))
    f.tight_layout()

    return f

def plot_comparison(geoIds, roll_days=1,
                    field='Cumulative_number_for_14_days_of_COVID-19_cases_per_100000',
                    log=False, ndays=30):
    """Plot one line per country for ``field`` on a shared axis.

    Parameters
    ----------
    geoIds : iterable of str
        ``geoId`` codes of the countries to compare.
    roll_days : int, default 1
        When greater than 1, each series is smoothed with a rolling mean of
        this window; the first ``roll_days - 1`` points of each line are then
        undefined. With the default the raw values are plotted.
    field : str
        Column of the ECDC frame to plot. The title is this name with
        underscores replaced by spaces.
    log : bool, default False
        Use a logarithmic y-axis.
    ndays : int, default 30
        Passed to ``select_country``: number of most recent rows per country
        (0 selects all rows).

    Returns
    -------
    None
        The figure is shown through the active matplotlib backend.
    """
    f, ax = plt.subplots(figsize=(9, 6))
    for geoId in geoIds:
        selection = select_country(geoId, ndays)
        values = selection[field]
        # `roll_days` used to be accepted but ignored; smooth only on request
        # so the default output is unchanged.
        if roll_days and roll_days > 1:
            values = values.rolling(roll_days).mean()
        ax.plot(selection.dateRep, values, label=country_name(geoId))

    ax.xaxis.set_major_locator(plt.MaxNLocator(25))
    ax.yaxis.set_major_locator(plt.MaxNLocator(10))

    ax.tick_params(axis='x', labelrotation=45)
    if log:
        ax.set_yscale('log')

    ax.legend(loc='best')
    # Derived from `field` so the title stays correct for non-default columns;
    # for the default column this is the same text as before.
    ax.set_title(field.replace('_', ' '))
    f.tight_layout()

def select_country(geoId, ndays=0):
    """Return the rows of the module-level ``df`` for one country, oldest first.

    Rows are filtered on the ``geoId`` column and sorted ascending by
    ``year``, ``month`` and ``day``. A truthy ``ndays`` keeps only the last
    ``ndays`` rows of that ordering; a falsy value (the default ``0``)
    returns all of them.
    """
    country_rows = df[df.geoId == geoId]
    chronological = country_rows.sort_values(by=['year', 'month', 'day'], ascending=True)
    return chronological.tail(ndays) if ndays else chronological

def plot_country(geoId, **kwargs):
    """Plot every available row for the country ``geoId``.

    Selects the country's full history with ``select_country`` and forwards
    it, together with any keyword arguments, to ``plot_selection``; returns
    whatever ``plot_selection`` returns.
    """
    full_history = select_country(geoId)
    return plot_selection(full_history, **kwargs)
    


## Austria - from Gesundheitsministerium

In [4]:

def plot_Austria(roll_days=7, log=False):
    """Plot the Austrian 'tägliche Erkrankungen' series with its rolling mean.

    Loads a fresh frame via ``at()``, draws the recorded daily values as bars
    and a ``roll_days``-window rolling mean as a dashed line against the
    ``time`` column, optionally on a logarithmic y-axis, and returns the
    figure.
    """
    column = 'tägliche Erkrankungen'
    # Named distinctly so the module-level ECDC frame `df` is not shadowed.
    austria = at()
    daily = austria[column]

    fig, axis = plt.subplots()
    axis.plot(austria.time, daily.rolling(roll_days).mean(),
              label=f'{roll_days} day average', marker='o', markersize=4,
              linestyle='--')
    axis.xaxis.set_major_locator(plt.MaxNLocator(20))
    plt.xticks(rotation=45)
    axis.bar(austria.time, daily, label='recorded', alpha=0.6, color='C1')
    plt.legend(loc='best')
    plt.title('Positive COVID tests')
    if log:
        plt.yscale('log')
    plt.tight_layout()
    return fig


## DF Subsets

In [5]:
# Continent-level subsets of the ECDC frame, selected on `continentExp`.
EU = df.loc[df.continentExp == 'Europe']
AMERICA = df.loc[df.continentExp == 'America']


# Overview

## Austria, USA, India, ...

In [15]:
# Wider alternative selection, kept for reference:
# countries = ['AT', 'IN', 'US', 'UK', 'DE', 'NL', 'FR',  'IT', 'ES','EL' ]
countries = ('AT', 'IN', 'US', 'UK', 'NL', 'DE')
SELECTION =  df[df.geoId.isin(countries)]

# ndays=500 keeps at most the last 500 rows per country.
plot_comparison(countries, log=False, ndays=500)
# `overview` is not defined in this notebook (presumably from `helper`);
# compact=False yields the wider table with the 14-day incidence columns.
overview(SELECTION, compact=False)

<IPython.core.display.Javascript object>

Unnamed: 0_level_0,cases,cases,cases,deaths,deaths,deaths,deaths,deaths,Cumulative_number_for_14_days_of_COVID-19_cases_per_100000,Cumulative_number_for_14_days_of_COVID-19_cases_per_100000
Unnamed: 0_level_1,rolling_avg,last_5_days,max,sum,last_7_days_sum,rolling_avg,last_5_days,max,latest,max
countriesAndTerritories,Unnamed: 1_level_2,Unnamed: 2_level_2,Unnamed: 3_level_2,Unnamed: 4_level_2,Unnamed: 5_level_2,Unnamed: 6_level_2,Unnamed: 7_level_2,Unnamed: 8_level_2,Unnamed: 9_level_2,Unnamed: 10_level_2
India,70960,"78524, 70496, 73272, 74383, 66732",97894,109150,6465,924,"971, 964, 926, 918, 816",2003,76.538525,94.173835
United_States_of_America,49243,"48182, 56800, 58082, 54271, 43597",78427,214771,4977,711,"892, 972, 1014, 590, 394",4928,196.769077,282.723242
United_Kingdom,14391,"14162, 17540, 13864, 15165, 12872",22961,42825,475,68,"70, 77, 87, 81, 65",1224,253.194767,253.194767
Netherlands,5529,"4979, 5813, 5959, 6493, 6368",6493,6575,130,19,"36, 13, 13, 23, 17",234,364.190524,364.190524
Germany,3178,"4058, 4516, 4721, 3483, 0",6294,9615,81,12,"16, 11, 15, 11, 0",315,45.208812,86.358323
Austria,1052,"947, 1221, 1181, 901, 1298",1298,864,51,7,"4, 9, 4, 1, 6",31,141.294931,141.294931


## Sweden and the world

In [7]:
# Rebinds `countries` from the previous section; cells that use it depend on run order.
countries = ('SE', 'ES','FR','UK','DE','AT','IT','NO','DK','FI')
# Returns None, so nothing besides the figure is displayed for this cell.
plot_comparison(countries, log=False, ndays=500)


<IPython.core.display.Javascript object>

## Most cases in the last 7 days

### Europe

In [16]:
# First five rows of the Europe overview. Row order is decided inside overview()
# - presumably descending by recent cases; confirm in helper.
overview(EU, compact=True).head(5)

Unnamed: 0_level_0,cases,cases,cases,deaths,deaths,deaths,deaths,deaths
Unnamed: 0_level_1,rolling_avg,latest,max,sum,last_7_days_sum,rolling_avg,latest,max
countriesAndTerritories,Unnamed: 1_level_2,Unnamed: 2_level_2,Unnamed: 3_level_2,Unnamed: 4_level_2,Unnamed: 5_level_2,Unnamed: 6_level_2,Unnamed: 7_level_2,Unnamed: 8_level_2
France,16543,16101,26896,32730,500,71,46,2004
United_Kingdom,14391,12872,22961,42825,475,68,65,1224
Russia,11960,13634,13634,22597,1239,177,143,312
Spain,10169,0,31785,32929,843,120,0,1179
Netherlands,5529,6368,6493,6575,130,19,17,234


### America

In [17]:
# First five rows of the America overview (overview()'s default layout).
overview(AMERICA).head(5)

Unnamed: 0_level_0,cases,cases,cases,deaths,deaths,deaths,deaths,deaths
Unnamed: 0_level_1,rolling_avg,latest,max,sum,last_7_days_sum,rolling_avg,latest,max
countriesAndTerritories,Unnamed: 1_level_2,Unnamed: 2_level_2,Unnamed: 3_level_2,Unnamed: 4_level_2,Unnamed: 5_level_2,Unnamed: 6_level_2,Unnamed: 7_level_2,Unnamed: 8_level_2
United_States_of_America,49243,43597,78427,214771,4977,711,394,4928
Brazil,25670,12345,69074,150488,4136,591,290,1595
Argentina,13674,10310,17213,23868,2850,407,287,3351
Colombia,8038,8569,13056,27834,1122,160,174,400
Mexico,7523,0,30468,83642,4554,651,0,3013


### World

In [18]:
# First five rows of the overview over all countries in the ECDC frame.
overview(df).head(5)

Unnamed: 0_level_0,cases,cases,cases,deaths,deaths,deaths,deaths,deaths
Unnamed: 0_level_1,rolling_avg,latest,max,sum,last_7_days_sum,rolling_avg,latest,max
countriesAndTerritories,Unnamed: 1_level_2,Unnamed: 2_level_2,Unnamed: 3_level_2,Unnamed: 4_level_2,Unnamed: 5_level_2,Unnamed: 6_level_2,Unnamed: 7_level_2,Unnamed: 8_level_2
India,70960,66732,97894,109150,6465,924,816,2003
United_States_of_America,49243,43597,78427,214771,4977,711,394,4928
Brazil,25670,12345,69074,150488,4136,591,290,1595
France,16543,16101,26896,32730,500,71,46,2004
United_Kingdom,14391,12872,22961,42825,475,68,65,1224


## Lowest number of new cases in the last 7 days

### Europe*

\*among countries with population of at least 10 million

In [19]:
# 1*10**7 = 10 million inhabitants; the comparison is strict, so a country with
# exactly 10 million is excluded. tail(5) takes the last five rows of the overview.
overview(EU[EU.popData2019>1*10**7], compact=False).tail(5)

Unnamed: 0_level_0,cases,cases,cases,deaths,deaths,deaths,deaths,deaths,Cumulative_number_for_14_days_of_COVID-19_cases_per_100000,Cumulative_number_for_14_days_of_COVID-19_cases_per_100000
Unnamed: 0_level_1,rolling_avg,last_5_days,max,sum,last_7_days_sum,rolling_avg,last_5_days,max,latest,max
countriesAndTerritories,Unnamed: 1_level_2,Unnamed: 2_level_2,Unnamed: 3_level_2,Unnamed: 4_level_2,Unnamed: 5_level_2,Unnamed: 6_level_2,Unnamed: 7_level_2,Unnamed: 8_level_2,Unnamed: 9_level_2,Unnamed: 10_level_2
Romania,3031,"2958, 3130, 3186, 3517, 2880",3517,5411,464,66,"82, 44, 52, 59, 53",101,167.967604,167.967604
Portugal,1202,"944, 1278, 1394, 1646, 1090",1646,2080,85,12,"8, 10, 12, 5, 13",60,127.084623,127.084623
Sweden,378,"831, 657, 0, 0, 0",1698,5894,3,0,"0, 0, 0, 0, 0",115,72.462033,146.155715
Greece,359,"406, 434, 391, 306, 280",460,449,40,6,"4, 6, 1, 5, 13",13,45.819895,45.819895
Azerbaijan,184,"182, 191, 215, 233, 230",590,609,13,2,"2, 1, 2, 3, 1",13,19.496962,76.226256


### America*

\*among countries with population of at least 10 million

In [20]:
# Same 10-million population cut-off (strict '>') applied to the America subset;
# tail(5) takes the last five rows of the overview.
overview(AMERICA[AMERICA.popData2019>1*10**7]).tail(5)


Unnamed: 0_level_0,cases,cases,cases,deaths,deaths,deaths,deaths,deaths
Unnamed: 0_level_1,rolling_avg,latest,max,sum,last_7_days_sum,rolling_avg,latest,max
countriesAndTerritories,Unnamed: 1_level_2,Unnamed: 2_level_2,Unnamed: 3_level_2,Unnamed: 4_level_2,Unnamed: 5_level_2,Unnamed: 6_level_2,Unnamed: 7_level_2,Unnamed: 8_level_2
Dominican_Republic,571,463,2147,2173,39,6,6,39
Guatemala,536,171,4233,3384,91,13,19,74
Bolivia,244,111,2687,8308,207,30,16,1610
Cuba,24,30,93,123,1,0,0,6
Haiti,9,22,284,230,1,0,0,12


### World*
\*among countries with population of at least 10 million

In [21]:
# Same 10-million population cut-off (strict '>') applied to all countries;
# tail(5) takes the last five rows of the overview.
overview( df[df.popData2019>1*10**7]).tail(5)


Unnamed: 0_level_0,cases,cases,cases,deaths,deaths,deaths,deaths,deaths
Unnamed: 0_level_1,rolling_avg,latest,max,sum,last_7_days_sum,rolling_avg,latest,max
countriesAndTerritories,Unnamed: 1_level_2,Unnamed: 2_level_2,Unnamed: 3_level_2,Unnamed: 4_level_2,Unnamed: 5_level_2,Unnamed: 6_level_2,Unnamed: 7_level_2,Unnamed: 8_level_2
Taiwan,1,0,31,7,0,0,0,3
Yemen,1,0,116,596,5,1,1,52
Cambodia,0,0,35,0,0,0,0,0
United_Republic_of_Tanzania,0,0,174,21,0,0,0,6
Niger,0,0,69,69,0,0,0,5


# Austria
Compare ECDC data with Gesundheitsministerium data

## Plots

In [22]:
# Two figures for comparison: the Austrian data set first, then the ECDC rows for
# geoId 'AT'. The trailing ';' suppresses the returned Figure's repr.
plot_Austria();
plot_country('AT', log=LOG_PLOT);

<IPython.core.display.Javascript object>

<IPython.core.display.Javascript object>

### Weekday bias

In [34]:
# Total and median of the Austrian daily figures per weekday, on two stacked
# axes that share the x-axis.
f, ax = plt.subplots(nrows=2, sharex=True)
# Select the column before aggregating: only this series is summed/medianed,
# so other (possibly non-numeric) columns of df_at cannot make the aggregation fail.
daily_by_weekday = df_at.groupby(['weekday'])['tägliche Erkrankungen']
daily_by_weekday.sum().plot(ax=ax[0], marker='o')
ax[0].set_ylabel('Reported positive tests (Total)')
daily_by_weekday.median().plot(ax=ax[1], marker='o')
ax[1].set_ylabel('Reported positive tests (Median)')
ax[1].set_xlabel('Day of the week')
# NOTE(review): assumes `weekday` holds 0..6 and WEEKDAYS (not defined in this
# notebook, presumably from helper) lists the seven names in that order - confirm.
ax[1].set_xticks([0,1,2,3,4,5,6])
ax[1].set_xticklabels(WEEKDAYS, rotation=40)
plt.tight_layout()

<IPython.core.display.Javascript object>

# India

In [35]:
# Daily cases with 7-day rolling mean for geoId 'IN'; ';' hides the Figure repr.
plot_country('IN', log=LOG_PLOT);

<IPython.core.display.Javascript object>

# USA

In [36]:
# Daily cases with 7-day rolling mean for geoId 'US'; ';' hides the Figure repr.
plot_country('US', log=LOG_PLOT);


<IPython.core.display.Javascript object>

# Germany

In [37]:
# Daily cases with 7-day rolling mean for geoId 'DE'; ';' hides the Figure repr.
plot_country('DE', log=LOG_PLOT);

<IPython.core.display.Javascript object>

# UK

In [38]:
# Daily cases with 7-day rolling mean for geoId 'UK'; ';' hides the Figure repr.
plot_country('UK', log=LOG_PLOT);

<IPython.core.display.Javascript object>

# China

In [39]:
# Daily cases with 7-day rolling mean for geoId 'CN'; ';' hides the Figure repr.
plot_country('CN', log=LOG_PLOT);


<IPython.core.display.Javascript object>

# Commit and Push

In [62]:
%cd Documents/code/covid19/
now = datetime.now()
commit_message = "Last run on " + now.strftime('%Y-%m-%d %H:%M')
commit_message
! echo $commit_message > commit_message.txt
! git add .
! git commit -F commit_message.txt
! git push


[Errno 2] No such file or directory: 'Documents/code/covid19/'
/home/gythaogg/Documents/code/covid19/notebooks
[feature/angular 1cd82d8] Last run on 2020-10-11 23:30
 2 files changed, 1162 insertions(+), 1545 deletions(-)
Enumerating objects: 9, done.
Counting objects: 100% (9/9), done.
Delta compression using up to 16 threads
Compressing objects: 100% (5/5), done.
Writing objects: 100% (5/5), 177.21 KiB | 2.27 MiB/s, done.
Total 5 (delta 4), reused 0 (delta 0)
remote: Resolving deltas: 100% (4/4), completed with 4 local objects.[K
To github.com:gythaogg/covid19.git
   7dae54a..1cd82d8  feature/angular -> feature/angular


In [41]:
# One-off: make the local branch track origin/feature/angular so a plain `git push`
# works. The branch name is hard-coded; adjust it when working on another branch.
! git push --set-upstream origin feature/angular


Branch 'feature/angular' set up to track remote branch 'feature/angular' from 'origin'.
Everything up-to-date
