In [1]:
import sys

# Make modules under ../src importable (presumably where `covid` and
# `population` live -- confirm against the repo layout).  The membership
# check keeps the cell idempotent: re-running it does not pile up duplicate
# entries in sys.path.
if '../src' not in sys.path:
    sys.path.append('../src')

In [2]:
from covid import daily_snapshot
from pathlib import Path

import population as pop
import pandas as pd
import requests
import datetime as dt

In [3]:
# Show up to 300 rows when displaying a DataFrame.  The fully qualified
# option key is used because the abbreviated 'max_rows' is matched as a
# pattern and is ambiguous on pandas versions that define more than one
# option containing 'max_rows'.
pd.set_option('display.max_rows', 300)

In [4]:
# Work with the calendar day before today.
date = dt.date.today() - dt.timedelta(days=1)
date

datetime.date(2020, 4, 17)

In [5]:
# Preview the MM-DD-YYYY string form of `date`.
date.strftime('%m-%d-%Y')

'04-17-2020'

### Quick glance at the data

In [6]:
# daily_snapshot is given `date` formatted as an MM-DD-YYYY string;
# the first rows of the result are displayed for a quick look.
df = daily_snapshot(date.strftime('%m-%d-%Y'))
df.head()

Unnamed: 0_level_0,Unnamed: 0,Admin2,Province_State,Country_Region,Last_Update,Lat,Long_,Confirmed,Deaths,Recovered,Active,Combined_Key
FIPS,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1
45001.0,,Abbeville,South Carolina,US,2020-04-17 23:30:52,34.223334,-82.461707,10,0,0,10,"Abbeville, South Carolina, US"
22001.0,,Acadia,Louisiana,US,2020-04-17 23:30:52,30.295065,-92.414197,110,6,0,104,"Acadia, Louisiana, US"
51001.0,,Accomack,Virginia,US,2020-04-17 23:30:52,37.767072,-75.632346,28,0,0,28,"Accomack, Virginia, US"
16001.0,,Ada,Idaho,US,2020-04-17 23:30:52,43.452658,-116.241552,576,9,0,567,"Ada, Idaho, US"
19001.0,,Adair,Iowa,US,2020-04-17 23:30:52,41.330756,-94.471059,1,0,0,1,"Adair, Iowa, US"


## Most countries, the US included, are not reporting the Recovered column

In [7]:
# US rows whose Recovered value is anything other than 0.
df.loc[df['Country_Region'].eq('US') & df['Recovered'].ne(0)]

Unnamed: 0_level_0,Unnamed: 0,Admin2,Province_State,Country_Region,Last_Update,Lat,Long_,Confirmed,Deaths,Recovered,Active,Combined_Key
FIPS,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1
,,,Recovered,US,2020-04-17 23:30:52,,,0,0,58545,-58545,"Recovered, US"


## Who is using "Recovered" as a Province_State?

In [8]:
# Rows where the Province_State field holds the literal value 'Recovered'.
df.loc[df['Province_State'].eq('Recovered')]

Unnamed: 0_level_0,Unnamed: 0,Admin2,Province_State,Country_Region,Last_Update,Lat,Long_,Confirmed,Deaths,Recovered,Active,Combined_Key
FIPS,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1
,,,Recovered,Canada,2020-04-17 23:38:31,,,0,0,10545,-10545,"Recovered, Canada"
,,,Recovered,US,2020-04-17 23:30:52,,,0,0,58545,-58545,"Recovered, US"


## Which countries report Recovered as a separate "Recovered" row (sorted by country)?

In [9]:
# Same 'Recovered' pseudo-province rows, ordered by country.
df.loc[df['Province_State'].eq('Recovered')].sort_values(by="Country_Region")

Unnamed: 0_level_0,Unnamed: 0,Admin2,Province_State,Country_Region,Last_Update,Lat,Long_,Confirmed,Deaths,Recovered,Active,Combined_Key
FIPS,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1
,,,Recovered,Canada,2020-04-17 23:38:31,,,0,0,10545,-10545,"Recovered, Canada"
,,,Recovered,US,2020-04-17 23:30:52,,,0,0,58545,-58545,"Recovered, US"


## Only Australia and China are reporting Recovered by actual province or state

In [10]:
# Rows with a non-zero Recovered value whose Province_State is present and
# is not the 'Recovered' pseudo-province, ordered by country.
(
    df.loc[
        df['Recovered'].ne(0)
        & df['Province_State'].ne('Recovered')
        & df['Province_State'].notna()
    ]
    .sort_values(by='Country_Region')
)

Unnamed: 0_level_0,Unnamed: 0,Admin2,Province_State,Country_Region,Last_Update,Lat,Long_,Confirmed,Deaths,Recovered,Active,Combined_Key
FIPS,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1
,,,Western Australia,Australia,2020-04-17 23:38:48,-31.9505,115.8605,541,7,340,194,"Western Australia, Australia"
,,,Australian Capital Territory,Australia,2020-04-17 23:38:48,-35.4735,149.0124,103,3,81,19,"Australian Capital Territory, Australia"
,,,Victoria,Australia,2020-04-17 23:38:48,-37.8136,144.9631,1302,14,1159,129,"Victoria, Australia"
,,,Tasmania,Australia,2020-04-17 23:38:48,-42.8821,147.3272,180,7,67,106,"Tasmania, Australia"
,,,South Australia,Australia,2020-04-17 23:38:48,-34.9285,138.6007,435,4,331,100,"South Australia, Australia"
,,,New South Wales,Australia,2020-04-17 23:38:48,-33.8688,151.2093,2926,26,1379,1521,"New South Wales, Australia"
,,,Queensland,Australia,2020-04-17 23:38:48,-27.4698,153.0251,1007,5,442,560,"Queensland, Australia"
,,,Northern Territory,Australia,2020-04-17 23:38:48,-12.4634,130.8456,28,0,9,19,"Northern Territory, Australia"
,,,Jiangsu,China,2020-04-17 01:05:09,32.9711,119.455,653,0,643,10,"Jiangsu, China"
,,,Inner Mongolia,China,2020-04-17 02:03:55,44.0935,113.9448,193,1,103,89,"Inner Mongolia, China"
