### **A comparison between:**
- the number of people who received intensive care and the number of people who passed away
  - check if there is any correlation between the two

In [1]:
import pandas as pd
import plotly_express as px

# Load the per-age-group totals sheet from the Folkhälsomyndigheten workbook
# and show the resulting frame.
df = pd.read_excel(
    io="../Data/Folkhalsomyndigheten_Covid19.xlsx",
    sheet_name="Totalt antal per åldersgrupp",
)
df

Unnamed: 0,Åldersgrupp,Totalt_antal_fall,Totalt_antal_intensivvårdade,Totalt_antal_avlidna
0,Ålder_0_9,138071,109,17
1,Ålder_10_19,355823,101,9
2,Ålder_20_29,418506,285,41
3,Ålder_30_39,493443,492,71
4,Ålder_40_49,474702,997,172
5,Ålder_50_59,378468,1932,523
6,Ålder_60_69,180079,2595,1422
7,Ålder_70_79,87096,2394,4654
8,Ålder_80_89,58170,612,8326
9,Ålder_90_plus,26677,21,5420


### Removed the row labelled "Uppgift saknas" ("information missing"), as its data was hard to interpret

In [2]:
# Remove the row at index label 10 (the "Uppgift saknas" row).
# errors="ignore" keeps this cell safe to re-run: once the row is gone, a
# second run is a no-op instead of raising KeyError. Rebinding `df` (rather
# than inplace=True) avoids mutating the frame object in place.
df = df.drop(index=10, errors="ignore")

In [3]:
# Denominator shared by both percentages: total number of cases per age group.
total_cases = df["Totalt_antal_fall"]

# Percentage of all cases in each age group that received intensive care.
icu_share = df["Totalt_antal_intensivvårdade"] / total_cases
df["Procent_intensivvårdade"] = icu_share * 100

# Percentage of all cases in each age group that passed away.
death_share = df["Totalt_antal_avlidna"] / total_cases
df["Procent_avlidna"] = death_share * 100

df

Unnamed: 0,Åldersgrupp,Totalt_antal_fall,Totalt_antal_intensivvårdade,Totalt_antal_avlidna,Procent_intensivvårdade,Procent_avlidna
0,Ålder_0_9,138071,109,17,0.078945,0.012313
1,Ålder_10_19,355823,101,9,0.028385,0.002529
2,Ålder_20_29,418506,285,41,0.068099,0.009797
3,Ålder_30_39,493443,492,71,0.099708,0.014389
4,Ålder_40_49,474702,997,172,0.210027,0.036233
5,Ålder_50_59,378468,1932,523,0.510479,0.138189
6,Ålder_60_69,180079,2595,1422,1.441034,0.789653
7,Ålder_70_79,87096,2394,4654,2.748691,5.343529
8,Ålder_80_89,58170,612,8326,1.052089,14.31322
9,Ålder_90_plus,26677,21,5420,0.078719,20.317127


In [4]:
# Bar chart: percentage of cases per age group that received intensive care.
# The y-axis is logarithmic so the differences between the groups are easier to see.
icu_bar_options = dict(
    x="Åldersgrupp",
    y="Procent_intensivvårdade",
    title="Procent av fall som behövde intensivvård",
    log_y=True,
)
px.bar(df, **icu_bar_options)


In [5]:
# Bar chart: percentage of cases per age group that passed away (log y-axis).
# The rows are sorted ascending by death percentage before plotting, so the
# bars are ordered by that value rather than by age group.
df_by_death_share = df.sort_values(by="Procent_avlidna")
px.bar(
    data_frame=df_by_death_share,
    x="Åldersgrupp",
    y="Procent_avlidna",
    title="Procent av fall som avled",
    log_y=True,
)

In [6]:
# Grouped bar chart comparing, per age group, the percentage of cases that
# received intensive care with the percentage that passed away (log y-axis).
# Each age group already has exactly one pre-computed value per column, so a
# plain bar chart is used: px.histogram would aggregate the values and label
# the y-axis as a sum, which misdescribes what is plotted.
px.bar(
    df,
    x="Åldersgrupp",
    y=["Procent_intensivvårdade", "Procent_avlidna"],
    title="Procent av fall som avled och behövde intensivvård",
    barmode="group",
    log_y=True,
)

In [7]:
# The graph above compares, per age group, the percentage of cases that received intensive care with the percentage of cases that passed away.
# As we can see, from the 70 to 79 age group onwards,
# the percentage of people that died is higher than the percentage of people that received intensive care.
# This is probably because people older than 69 are more likely to have a pre-existing condition,
# which makes them more likely to die from the virus.
# So we can conclude, to a certain extent, that the older you are, the more likely you are to die from the virus.