# Basic stats on the evolution of COVID-19 hospitalizations in departments

In [1]:
%load_ext lab_black
%matplotlib inline

In [2]:
import matplotlib.pyplot as plt
from datetime import timedelta, date
import pandas as pd
import warnings

# Silence every Python warning for the rest of the session.
# NOTE(review): this blanket filter also hides pandas diagnostics (dtype or
# chained-assignment notices) that may point at real data problems; consider
# narrowing it to the specific warning categories that are known to be noise.
warnings.filterwarnings("ignore")
# Register pandas' date/time converters with matplotlib.
pd.plotting.register_matplotlib_converters()

In [3]:
# Download URL (data.gouv.fr) of the COVID-19 table loaded below.
covid_url = (
    "https://www.data.gouv.fr/fr/datasets/r/63352e38-d353-4b54-bfd1-f1b3ee1cabd7"
)
# Department codes that are EXCLUDED when loading the data, so that only
# metropolitan France remains in the analysis.
filter_dep = ["971", "972", "973", "974", "976"]
# Not referenced by the cells visible here; presumably a default size for
# matplotlib figures further down — TODO confirm.
figsize = (15, 10)

#### <br> Load table with COVID-19 data (figures by dates)

In [4]:
# Load the per-department daily figures, indexed by the date column (position 2,
# named "jour" in the file).
#
# `dep` is forced to text: department codes are compared against string codes
# below (`filter_dep`) and in later queries (e.g. "dep=='75'"). Left to type
# inference, the column could come back as integers (or a mix of integers and
# strings), and those comparisons would then silently match nothing.
#
# The pipeline is written as one chain instead of successive `inplace=True`
# calls, so re-running the cell always rebuilds `df` from the raw download.
df = (
    pd.read_csv(
        covid_url,
        sep=";",
        index_col=2,
        parse_dates=True,
        dtype={"dep": str},
    )
    .query("sexe == 0")  # keep the rows where male/female are summed
    .drop(columns=["sexe"])
    .query("dep not in @filter_dep")  # drop the departments listed in filter_dep
    .sort_index()
)
df.head(2)

Unnamed: 0_level_0,dep,hosp,rea,rad,dc
jour,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1
2020-03-18,1,2,0,1,0
2020-03-18,2,41,10,18,11


In [5]:
# Pick the two most recent dates that actually exist in the data.
# Subtracting one calendar day from the latest date assumes the dataset has no
# publication gap; when the previous calendar day is missing, the lookup in the
# next cell fails with a KeyError. Using the dates present in the index keeps
# the comparison on "the two latest days" regardless of gaps.
report_days = df.index.dropna().unique().sort_values()
if len(report_days) < 2:
    raise ValueError("need at least two reporting days to compute an evolution")
previous_day, last_day = report_days[-2], report_days[-1]
print("Evolution from ", previous_day, " to ", last_day)

Evolution from  2020-04-03 00:00:00  to  2020-04-04 00:00:00


#### <br> Build a new dataframe with data from two latest days and the associated evolution

In [6]:
# Rows of the latest and of the previous day, with the date moved back to a
# regular column. A list indexer (`[[day]]`) always yields a DataFrame, and
# `reset_index()` returns a new frame, so no slice of `df` is mutated in place.
sdf = df.loc[[last_day]].reset_index()
pdf = df.loc[[previous_day]].reset_index()

# Pair the two days on the department code rather than on row position:
# positional pairing silently compares different departments as soon as the
# two days do not list the same departments in the same order.
# `validate` raises if a department appears more than once on either day.
# Departments missing on one of the two days are left out (inner join).
stats = (
    pdf[["dep", "hosp"]]
    .rename(columns={"hosp": "prev_hosp"})
    .merge(
        sdf[["dep", "hosp"]].rename(columns={"hosp": "last_hosp"}),
        on="dep",
        how="inner",
        validate="one_to_one",
    )
)

# Absolute day-over-day change.
stats["diff"] = stats["last_hosp"] - stats["prev_hosp"]
# Relative change in percent. A zero baseline has no meaningful percentage, so
# it is turned into NaN instead of +/-inf, which keeps min/mean/max finite.
baseline = stats["prev_hosp"].where(stats["prev_hosp"] != 0)
stats["percent"] = stats["diff"] / baseline * 100
stats.head()

Unnamed: 0,dep,prev_hosp,last_hosp,diff,percent
0,1,100,109,9,9.0
1,2,210,223,13,6.190476
2,3,40,44,4,10.0
3,4,29,29,0,0.0
4,5,64,60,-4,-6.25


#### <br> Departments with highest number of hospitalizations on the latest day

In [7]:
# Order departments by hospitalizations on the latest day, highest first,
# and display the first rows.
ranked_by_last_hosp = stats.sort_values(by="last_hosp", ascending=False)
ranked_by_last_hosp.head()

Unnamed: 0,dep,prev_hosp,last_hosp,diff,percent
75,75,2897,2999,102,3.520884
92,92,1848,1929,81,4.383117
94,94,1613,1651,38,2.355859
93,93,1267,1310,43,3.393844
69,69,1202,1215,13,1.081531


#### <br> Min, max, mean of evolution between the two latest days (in sum and %)

In [8]:
# Summary of the absolute day-over-day change across departments.
delta = stats["diff"]
print("Min: ", delta.min(), " Mean: ", delta.mean(), " Max: ", delta.max())

Min:  -76  Mean:  7.427083333333333  Max:  102


In [9]:
# Summary of the relative day-over-day change (in percent) across departments.
pct = stats["percent"]
print("Min %: ", pct.min(), " Mean %: ", pct.mean(), " Max %: ", pct.max())

Min %:  -11.11111111111111  Mean %:  3.881928144902444  Max %:  29.411764705882355


#### <br> List of departments with a decrease in hospitalizations (last two days)

In [10]:
# Departments whose hospitalization count went down between the two days.
decreasing = stats.query("diff < 0")
decreasing

Unnamed: 0,dep,prev_hosp,last_hosp,diff,percent
4,5,64,60,-4,-6.25
6,7,95,87,-8,-8.421053
8,9,16,15,-1,-6.25
11,12,60,58,-2,-3.333333
13,14,131,130,-1,-0.763359
15,16,18,17,-1,-5.555556
20,22,65,62,-3,-4.615385
30,30,70,66,-4,-5.714286
33,33,311,305,-6,-1.92926
34,34,264,252,-12,-4.545455


#### <br> Departments with the largest absolute increase in hospitalizations (number of patients)

In [11]:
# Order departments by absolute day-over-day change, largest increase first,
# and display the first rows.
ranked_by_diff = stats.sort_values(by="diff", ascending=False)
ranked_by_diff.head()

Unnamed: 0,dep,prev_hosp,last_hosp,diff,percent
75,75,2897,2999,102,3.520884
92,92,1848,1929,81,4.383117
91,91,831,911,80,9.626955
78,78,858,913,55,6.410256
59,59,729,773,44,6.035665


#### <br> Departments with the highest relative increase in hospitalizations (%)

In [12]:
# Order departments by relative day-over-day change (percent), largest first,
# and display the first rows.
ranked_by_percent = stats.sort_values(by="percent", ascending=False)
ranked_by_percent.head()

Unnamed: 0,dep,prev_hosp,last_hosp,diff,percent
40,40,17,22,5,29.411765
58,58,21,27,6,28.571429
9,10,110,141,31,28.181818
22,24,20,25,5,25.0
52,52,82,99,17,20.731707


#### <br> Focus on some departments

In [13]:
# Figures for department code 75 only.
dep_75 = stats.query("dep=='75'")
dep_75

Unnamed: 0,dep,prev_hosp,last_hosp,diff,percent
75,75,2897,2999,102,3.520884


In [14]:
# Figures for department code 71 only.
dep_71 = stats.query("dep=='71'")
dep_71

Unnamed: 0,dep,prev_hosp,last_hosp,diff,percent
71,71,163,162,-1,-0.613497


In [15]:
# Figures for department code 31 only.
dep_31 = stats.query("dep=='31'")
dep_31

Unnamed: 0,dep,prev_hosp,last_hosp,diff,percent
31,31,226,227,1,0.442478
