In [72]:
import numpy as np
import pandas as pd
import seaborn as sns
from matplotlib import pyplot as plt
import missingno as msno
from datetime import date
from sklearn.metrics import accuracy_score
from sklearn.model_selection import train_test_split
from sklearn.neighbors import LocalOutlierFactor
from sklearn.preprocessing import MinMaxScaler, LabelEncoder, StandardScaler, RobustScaler

In [73]:
# Notebook-wide pandas display settings.
pd.set_option("display.width", 500)
pd.set_option("display.max_rows", None)  # show every row, no truncation
pd.set_option("display.max_columns", None)  # show every column, no truncation
pd.set_option("display.float_format", "{:.3f}".format)  # three digits after the decimal point

In [74]:
def load(path="DATA/country_vaccination_stats.csv"):
    """Read a vaccination-statistics CSV file into a DataFrame.

    Parameters
    ----------
    path : str or path-like, optional
        Location of the CSV file. Defaults to
        ``DATA/country_vaccination_stats.csv`` so that existing ``load()``
        calls keep reading the same file.

    Returns
    -------
    pandas.DataFrame
        The file contents as parsed by ``pd.read_csv`` with default options
        (no date parsing, no index column).
    """
    return pd.read_csv(path)

In [75]:
# Read the vaccination CSV via load() into the working DataFrame.
df = load()

In [76]:
# Preview only the first rows: display.max_rows is set to None in this
# notebook, so a bare `df` would render the entire frame.
df.head(10)

Unnamed: 0,country,date,daily_vaccinations,vaccines
0,Argentina,12/29/2020,,Sputnik V
1,Argentina,12/30/2020,15656.0,Sputnik V
2,Argentina,12/31/2020,15656.0,Sputnik V
3,Argentina,1/1/2021,11070.0,Sputnik V
4,Argentina,1/2/2021,8776.0,Sputnik V
5,Argentina,1/3/2021,7400.0,Sputnik V
6,Argentina,1/4/2021,6483.0,Sputnik V
7,Argentina,1/5/2021,7984.0,Sputnik V
8,Argentina,1/6/2021,8173.0,Sputnik V
9,Argentina,1/7/2021,8363.0,Sputnik V


In [77]:
# (rows, columns) of the loaded frame.
df.shape

(1502, 4)

In [78]:
# Smallest recorded daily_vaccinations value per country, indexed by country.
minimum_vaccinations = df['daily_vaccinations'].groupby(df['country']).min()

In [79]:
# Impute missing daily_vaccinations values:
#   1. use the country's minimum recorded value (from minimum_vaccinations);
#   2. fall back to 0 when no such minimum exists.
# The second fillna matters: a country whose values are all missing is still
# a key of minimum_vaccinations, but its minimum is NaN, so a plain membership
# check would write NaN back and leave the gap unfilled.
country_minimums = df['country'].map(minimum_vaccinations)
df['daily_vaccinations'] = (
    df['daily_vaccinations']
    .fillna(country_minimums)  # aligned on df's index, row by row
    .fillna(0)
)

In [80]:
# Spot-check the first rows after imputation instead of printing the whole frame.
print(df.head(10))

                   country        date  daily_vaccinations                               vaccines
0                Argentina  12/29/2020            6483.000                              Sputnik V
1                Argentina  12/30/2020           15656.000                              Sputnik V
2                Argentina  12/31/2020           15656.000                              Sputnik V
3                Argentina    1/1/2021           11070.000                              Sputnik V
4                Argentina    1/2/2021            8776.000                              Sputnik V
5                Argentina    1/3/2021            7400.000                              Sputnik V
6                Argentina    1/4/2021            6483.000                              Sputnik V
7                Argentina    1/5/2021            7984.000                              Sputnik V
8                Argentina    1/6/2021            8173.000                              Sputnik V
9                Arg

In [81]:
# Mean daily_vaccinations per country, indexed by country.
ortalama_aşılama = df['daily_vaccinations'].groupby(df['country']).mean()

In [82]:
# Keep the three countries with the largest mean, in descending order
# (ties resolved by first occurrence).
en_yüksek_3_ülke = ortalama_aşılama.nlargest(n=3, keep='first')

In [83]:
# Print the (Turkish) heading followed by the top-3 series on the next line.
print(
    "En yüksek ortalama günlük aşılama sayısına sahip ilk 3 ülke:",
    en_yüksek_3_ülke,
    sep="\n",
)

En yüksek ortalama günlük aşılama sayısına sahip ilk 3 ülke:
country
United States   514833.703
China           327220.081
India           171920.545
Name: daily_vaccinations, dtype: float64


In [91]:
# Boolean mask selecting rows whose date string is exactly "1/6/2021".
tarih_filtresi = df['date'].eq("1/6/2021")

In [92]:
# Rows of df selected by the date mask.
tarih_üzerindeki_veri = df.loc[tarih_filtresi]

In [93]:
# Sum daily_vaccinations over the date-filtered rows.
toplam_aşılama_sayısı = tarih_üzerindeki_veri.loc[:, 'daily_vaccinations'].sum()

In [94]:
# Report the summed daily_vaccinations for the rows dated 1/6/2021.
print("1/6/2021 tarihinde yapılan toplam aşılama sayısı:", toplam_aşılama_sayısı)

1/6/2021 tarihinde yapılan toplam aşılama sayısı: 1485255.0
