In [1]:
import pandas as pd

# Load the dataset
df = pd.read_csv('/content/covid_vaccine_statewise.csv')

# Display basic description
print("Dataset Description:")
print(f"Number of rows: {df.shape[0]}")
print(f"Number of columns: {df.shape[1]}")
print("\nColumn names and data types:")
print(df.dtypes)
print("\nMissing values per column:")
print(df.isnull().sum())
print("\nBasic statistics:")
print(df.describe())

Dataset Description:
Number of rows: 7845
Number of columns: 24

Column names and data types:
Updated On                              object
State                                   object
Total Doses Administered               float64
Sessions                               float64
 Sites                                 float64
First Dose Administered                float64
Second Dose Administered               float64
Male (Doses Administered)              float64
Female (Doses Administered)            float64
Transgender (Doses Administered)       float64
 Covaxin (Doses Administered)          float64
CoviShield (Doses Administered)        float64
Sputnik V (Doses Administered)         float64
AEFI                                   float64
18-44 Years (Doses Administered)       float64
45-60 Years (Doses Administered)       float64
60+ Years (Doses Administered)         float64
18-44 Years(Individuals Vaccinated)    float64
45-60 Years(Individuals Vaccinated)    float64
60+ Years(Ind

In [2]:
# Get latest data for each state (assuming the dataset has daily cumulative numbers)
latest_data = df.sort_values('Updated On').groupby('State').last()

# Filter for first dose
first_dose = latest_data[['First Dose Administered']].sort_values('First Dose Administered', ascending=False)

print("\nState-wise first dose vaccinations:")
print(first_dose)


State-wise first dose vaccinations:
                                          First Dose Administered
State                                                            
India                                                 361264651.0
Uttar Pradesh                                          40485878.0
Maharashtra                                            33167633.0
Madhya Pradesh                                         26830212.0
Gujarat                                                25341390.0
Rajasthan                                              24972030.0
Karnataka                                              23841981.0
West Bengal                                            20837318.0
Bihar                                                  20551758.0
Tamil Nadu                                             18835602.0
Andhra Pradesh                                         16096801.0
Kerala                                                 14111255.0
Odisha                                 

In [3]:
# Filter for second dose
second_dose = latest_data[['Second Dose Administered']].sort_values('Second Dose Administered', ascending=False)

print("\nState-wise second dose vaccinations:")
print(second_dose)


State-wise second dose vaccinations:
                                          Second Dose Administered
State                                                             
India                                                  101848788.0
Maharashtra                                             11191970.0
West Bengal                                              8681380.0
Gujarat                                                  7937490.0
Uttar Pradesh                                            7790151.0
Rajasthan                                                7496590.0
Karnataka                                                6529233.0
Kerala                                                   6053845.0
Andhra Pradesh                                           5572592.0
Madhya Pradesh                                           5168997.0
Tamil Nadu                                               4200590.0
Odisha                                                   3915473.0
Bihar                   

In [4]:
# Calculate total males vaccinated (sum across all states)
total_males = latest_data['Male(Individuals Vaccinated)'].sum()

print(f"\nTotal males vaccinated: {total_males:,.0f}")


Total males vaccinated: 90,095,606


In [5]:
# Calculate total females vaccinated (sum across all states)
total_females = latest_data['Female(Individuals Vaccinated)'].sum()

print(f"\nTotal females vaccinated: {total_females:,.0f}")


Total females vaccinated: 78,271,582
