# Infection Rate vs Public Announcements and Events
> Looking at the effect of government announcements and public events on Ontario's COVID-19 case counts.

- toc: true 
- badges: true
- comments: true
- categories: [jupyter]
- image: images/events.png

In [None]:
#hide

import pandas as pd
import numpy as np

import plotly.graph_objects as go
import plotly.express as px
import altair as alt

from IPython.display import HTML, display
import pytz

import ipywidgets as widgets

from datetime import datetime, timedelta, timezone

print('Libraries successfully imported.')

Libraries successfully imported.


In [None]:
#hide
#%%time

# Ontario open-data CSV endpoints (conposcovidloc, covidtesting,
# daily_change_in_cases_by_phu).
url = 'https://data.ontario.ca/dataset/f4112442-bdc8-45d2-be3c-12efae72fb27/resource/455fd63b-603d-4608-8216-7d8647f43350/download/conposcovidloc.csv'
url_2 = 'https://data.ontario.ca/dataset/f4f86e54-872d-43f8-8a86-3892fd3cb5e6/resource/ed270bb8-340b-41f9-a7c6-e8ef587e6d11/download/covidtesting.csv'
url_3 = 'https://data.ontario.ca/dataset/f4f86e54-872d-43f8-8a86-3892fd3cb5e6/resource/8a88fe6d-d8fb-41a3-9d04-f0550a44999f/download/daily_change_in_cases_by_phu.csv'

# GeoJSON variant of the conposcovidloc data (disabled):
#geo = gpd.read_file('https://data.ontario.ca/dataset/f4112442-bdc8-45d2-be3c-12efae72fb27/resource/4f39b02b-47fe-4e66-95b6-e6da879c6910/download/conposcovidloc.geojson')


def _read_source_csv(csv_url, date_columns):
    """Read a CSV using its first column as the index, parse ``date_columns``
    as dates, then move the index back into an ordinary column."""
    indexed = pd.read_csv(csv_url, index_col=0, parse_dates=date_columns)
    return indexed.reset_index()


src_conpos = _read_source_csv(
    url,
    ['Accurate_Episode_Date', 'Case_Reported_Date', 'Test_Reported_Date', 'Specimen_Date'],
)

# The testing file carries a duplicate entry for December 5th, 2020 that
# causes an error downstream, so exact duplicate rows are dropped right away.
src_testing = _read_source_csv(url_2, ['Reported Date']).drop_duplicates()

src_daily = _read_source_csv(url_3, ['Date'])

print('Source files successfully loaded.')

Source files successfully loaded.


In [None]:
#hide

# Build the working testing frame: drop the columns this analysis does not
# use and treat every missing value as 0.
df_testing = src_testing.drop(
    columns=[
        'Confirmed Negative',
        'Presumptive Negative',
        'Presumptive Positive',
        'Total patients approved for testing as of Reporting Date',
        'Under Investigation',
    ]
).fillna(0)

# Row-over-row deltas of the cumulative counters. The frame was already
# filled with 0 above, so no further fillna is needed; the first row has no
# predecessor and therefore stays NaN.
df_testing['New Cases'] = df_testing['Total Cases'].diff()
df_testing['New Deaths'] = df_testing['Deaths'].diff()
df_testing['Completed Tests Cumulative'] = df_testing['Total tests completed in the last day'].cumsum()

# rolling averages (window sizes are counted in rows, not calendar days)
numdays = 7

df_testing['New Cases 5 Day Average'] = df_testing['New Cases'].rolling(5).mean().round()
df_testing['New Cases 7 Day Average'] = df_testing['New Cases'].rolling(numdays).mean().round()
df_testing['New Tests 7 Day Average'] = (
    df_testing['Total tests completed in the last day'].rolling(numdays).mean().round()
)

# Percent positivity = averaged cases / averaged tests. Rows whose test
# counts were missing were filled with 0 above, which would make this
# division produce inf (cases > 0) or NaN (cases == 0). Mask zero
# denominators so those rows are consistently NaN instead of inf.
tests_7d_nonzero = df_testing['New Tests 7 Day Average'].replace(0, np.nan)
df_testing['7 Day Avg Percent Positivity'] = (
    df_testing['New Cases 7 Day Average'] / tests_7d_nonzero * 100
).round(2)

df_testing

Unnamed: 0,Reported Date,Confirmed Positive,Resolved,Deaths,Total Cases,Total tests completed in the last day,Percent positive tests in last day,Number of patients hospitalized with COVID-19,Number of patients in ICU with COVID-19,Number of patients in ICU on a ventilator with COVID-19,Total Positive LTC Resident Cases,Total Positive LTC HCW Cases,Total LTC Resident Deaths,Total LTC HCW Deaths,New Cases,New Deaths,Completed Tests Cumulative,New Cases 5 Day Average,New Cases 7 Day Average,New Tests 7 Day Average,7 Day Avg Percent Positivity
0,2020-01-26,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,0.0,,,,
1,2020-01-27,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,,
2,2020-01-28,1.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,,,,
3,2020-01-30,2.0,0.0,0.0,2.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,,,,
4,2020-01-31,2.0,0.0,0.0,2.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,,
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
314,2020-12-16,17084.0,125416.0,4035.0,146535.0,49189.0,5.1,932.0,256.0,157.0,9462.0,3717.0,2513.0,8.0,2139.0,43.0,6995407.0,1981.0,1962.0,56308.0,3.48
315,2020-12-17,17484.0,127425.0,4058.0,148967.0,58178.0,4.0,919.0,263.0,172.0,9538.0,3750.0,2526.0,8.0,2432.0,23.0,7053585.0,2093.0,2026.0,55789.0,3.63
316,2020-12-18,17742.0,129417.0,4098.0,151257.0,68246.0,3.9,877.0,261.0,168.0,9625.0,3809.0,2537.0,8.0,2290.0,40.0,7121831.0,2215.0,2089.0,56531.0,3.70
317,2020-12-19,18207.0,131282.0,4125.0,153614.0,67207.0,4.2,895.0,256.0,146.0,9755.0,3840.0,2546.0,8.0,2357.0,27.0,7189038.0,2299.0,2159.0,56810.0,3.80


In [None]:
#hide

# todo: webscrape Canadian website for holidays and dates for automation

# Event tables used to annotate the case curves.
#
# Every entry is a dict with:
#   "name"      - label text for the annotation (may contain <br> line breaks)
#   "date"      - date of the event as a YYYY-MM-DD string
#   "ax", "ay"  - optional; forwarded as the annotation's ax / ay values when
#                 the annotation dicts are built

public_events = [
    {"name": "Easter Weekend", "date": "2020-04-10"},
    {"name": "Mother's Day", "date": "2020-05-10", "ay": 60},
    {"name": "Victoria Day", "date": "2020-05-18"},
    {"name": "Trinity Bellwoods<br>Park Weekend", "date": "2020-05-23", "ay": -100, "ax": 80},
    {"name": "Father's Day", "date": "2020-06-21", "ay": 40},
    {"name": "Canada Day", "date": "2020-07-01"},
    {"name": "Civic Holiday", "date": "2020-08-03"},
    {"name": "Schools reopen<br>for 2020-21", "date": "2020-09-08"},
    {"name": "Thanksgiving<br>Weekend", "date": "2020-10-12", "ax": -40, "ay": -50},
    {"name": "Halloween", "date": "2020-10-31", "ax": -20},
    {"name": "Diwali", "date": "2020-11-14", "ax": -60, "ay": -25},
    {"name": "Black Friday", "date": "2020-11-27", "ax": -20},
    {"name": "Vaccine Rollout", "date": "2020-12-15"},
    # Disabled entries:
    # {"name": "Christmas", "date": "2020-12-25"},
    # {"name": "Boxing Week<br> begins", "date": "2020-12-26"},
    # {"name": "New Year's Day", "date": "2021-01-01"},
]

government_events = [
    {"name": "Ontario Lockdown #1", "date": "2020-03-23", "ax": -20, "ay": -80},
    # {"name": "Some regions enter stage 2", "date": "2020-06-08"},
    {"name": "Ontario in Stage 2", "date": "2020-06-24", "ay": -40},
    {"name": "Ontario in Stage 3", "date": "2020-07-31", "ay": -30},
    {"name": "Schools reopen<br>for 2020-21", "date": "2020-09-08", "ax": -40, "ay": -80},
    {"name": "Second Wave confirmed", "date": "2020-09-28", "ax": -40, "ay": -80},
    {"name": "Peel/Toronto/Ottawa<br>revert to<br>modified Stage 2", "date": "2020-10-12", "ax": 30, "ay": 100},
    {"name": "Peel/Ottawa<br>in Orange Zone", "date": "2020-11-07", "ax": 25, "ay": 60},
    {"name": "Peel/Toronto<br>in Red Zone", "date": "2020-11-12", "ax": -80, "ay": -30},
    {"name": "Halton in Red Zone", "date": "2020-11-16", "ax": -50},
    {"name": "Peel/Toronto in<br>Lockdown<br>#2", "date": "2020-11-23", "ay": -80},
    {"name": "York/Windsor<br>in Lockdown<br>#2", "date": "2020-12-14", "ay": 80},
    {"name": "Vaccine Rollout", "date": "2020-12-15"},
]

other_events = [
    {"name": "GoodLife email request to lobby MPPs", "date": "2020-10-28"},
]

# Sources:
# https://www.peelschools.org/schools/reopening/Pages/default.aspx
# https://globalnews.ca/news/6859636/ontario-coronavirus-timeline/

In [None]:
#hide

# append events to an annotation dictionary

def build_event_annotations(events, frame,
                            y_column="New Cases 5 Day Average",
                            date_column="Reported Date",
                            default_ax=0, default_ay=-60):
    """Turn a list of event dicts into plotly annotation dicts.

    Each annotation points at the event's date on the x axis and at the
    value of ``y_column`` on that date on the y axis.

    Parameters
    ----------
    events : list of dict
        Entries with a "name" and a "date" key and optional "ax" / "ay"
        keys that override the default arrow offsets.
    frame : pandas.DataFrame
        Data holding ``date_column`` and ``y_column``.
    y_column, date_column : str
        Columns used for the annotation's y value and for date matching.
    default_ax, default_ay : int
        Offsets used when an event does not provide "ax" / "ay".

    Returns
    -------
    list of dict
        One annotation per event that could be placed. Events with an empty
        date, a date that has no row in ``frame``, or a NaN value in
        ``y_column`` are skipped (with a printed note for the last two)
        instead of raising IndexError or yielding an unplaceable annotation.
    """
    annotations = []
    for event in events:
        event_date = event.get("date")
        if not event_date:
            continue

        label = event.get("name", "")

        # The date series can have gaps, so a matching row is not guaranteed.
        matches = frame.loc[frame[date_column] == event_date, y_column]
        if matches.empty or pd.isna(matches.iloc[0]):
            print(f"Skipping '{label}': no '{y_column}' value for {event_date}.")
            continue

        ax = event.get("ax")
        ay = event.get("ay")
        annotations.append(dict(
            x=event_date,
            y=matches.iloc[0],
            xref="x",
            yref="y",
            text=label,
            showarrow=True,
            arrowhead=3,
            ax=default_ax if ax is None else ax,
            ay=default_ay if ay is None else ay,
        ))
    return annotations


# Annotation lists consumed by the two figures below.
public_dates_annot = build_event_annotations(public_events, df_testing)
government_dates_annot = build_event_annotations(government_events, df_testing)

# Show one annotation as a sanity check.
government_dates_annot[0]

{'arrowhead': 3,
 'ax': -20,
 'ay': -80,
 'showarrow': True,
 'text': 'Ontario Lockdown #1',
 'x': '2020-03-23',
 'xref': 'x',
 'y': 58.0,
 'yref': 'y'}

In [None]:
#hide_input

# 5-day rolling average of new cases, annotated with the public events.
fig_public = go.Figure(
    data=[
        go.Scatter(
            x=df_testing['Reported Date'],
            y=df_testing['New Cases 5 Day Average'],
            mode="lines",
            # line=dict(color="maroon", dash="dot"),
            name='5d Rolling Avg',
            showlegend=True,
        )
    ]
)

# Single layout pass: titles, theme, annotations, and a horizontal legend
# anchored by its bottom-right corner at x=1, y=1.02.
# update_layout returns the figure, so this last expression also renders it.
fig_public.update_layout(
    annotations=public_dates_annot,
    title="Infection Rate Compared to Key Public Events",
    template='ggplot2',
    width=1000,
    xaxis_title="Reported Date",
    yaxis_title="Confirmed Cases",
    legend={
        "orientation": "h",
        "yanchor": "bottom",
        "y": 1.02,
        "xanchor": "right",
        "x": 1,
    },
)

In [None]:
#hide_input

# 5-day rolling average of new cases, annotated with government announcements.
fig_gov = go.Figure()
fig_gov.add_trace(go.Scatter(x=df_testing['Reported Date'],
                             y=df_testing['New Cases 5 Day Average'],
                             mode="lines",
                             #line=dict(color="blue", dash="dot"),
                             showlegend=True,
                             name='5d Rolling Avg',
))

# Layout: annotations, titles, theme, and a horizontal legend anchored by its
# bottom-right corner at x=1, y=1.02.
# The title previously read "Governement"; the spelling is corrected here.
# update_layout returns the figure, so this last expression also renders it.
fig_gov.update_layout(annotations=government_dates_annot,
                      title="Infection Rate Compared to Government Announcements",
                      template='seaborn',
                      width=1000,
                      xaxis_title="Reported Date",
                      yaxis_title="Confirmed Cases",
                      legend=dict(
                          orientation="h",
                          yanchor="bottom",
                          y=1.02,
                          xanchor="right",
                          x=1,
                      ))