In [7]:
import pandas as pd   ## Importing required libraries

In [8]:
# Load the dataset
df = pd.read_csv("covid_vaccine_statewise.csv")

In [9]:
# Display basic information about the dataset
print("Dataset Info:")
print(df.info())

print("\nFirst few rows:")
print(df.head())

Dataset Info:
<class 'pandas.core.frame.DataFrame'>
RangeIndex: 7845 entries, 0 to 7844
Data columns (total 24 columns):
 #   Column                               Non-Null Count  Dtype  
---  ------                               --------------  -----  
 0   Updated On                           7845 non-null   object 
 1   State                                7845 non-null   object 
 2   Total Doses Administered             7621 non-null   float64
 3   Sessions                             7621 non-null   float64
 4    Sites                               7621 non-null   float64
 5   First Dose Administered              7621 non-null   float64
 6   Second Dose Administered             7621 non-null   float64
 7   Male (Doses Administered)            7461 non-null   float64
 8   Female (Doses Administered)          7461 non-null   float64
 9   Transgender (Doses Administered)     7461 non-null   float64
 10   Covaxin (Doses Administered)        7621 non-null   float64
 11  CoviShield (Dose

In [10]:
# Clean up column names (optional, for easier access)
df.columns = df.columns.str.strip()

In [13]:
# a. Describe the dataset
print("\nDataset Description:")
print(f"- Total Rows : {df.shape[0]}")
print(f"- Total Columns : {df.shape[1]}")
print(df.describe(include='all'))


Dataset Description:
- Total Rows : 7845
- Total Columns : 24
        Updated On  State  Total Doses Administered      Sessions  \
count         7845   7845              7.621000e+03  7.621000e+03   
unique         213     37                       NaN           NaN   
top     16/01/2021  Delhi                       NaN           NaN   
freq            37    213                       NaN           NaN   
mean           NaN    NaN              9.188171e+06  4.792358e+05   
std            NaN    NaN              3.746180e+07  1.911511e+06   
min            NaN    NaN              7.000000e+00  0.000000e+00   
25%            NaN    NaN              1.356570e+05  6.004000e+03   
50%            NaN    NaN              8.182020e+05  4.547000e+04   
75%            NaN    NaN              6.625243e+06  3.428690e+05   
max            NaN    NaN              5.132284e+08  3.501031e+07   

               Sites  First Dose Administered  Second Dose Administered  \
count    7621.000000             

In [14]:
# b. Number of persons state-wise vaccinated for first dose
first_dose_statewise = df.groupby('State')['First Dose Administered'].max().sort_values(ascending=False)
print("\nState-wise First Dose Vaccinations:")
print(first_dose_statewise)


State-wise First Dose Vaccinations:
State
India                                       400150406.0
Uttar Pradesh                                45932488.0
Maharashtra                                  35040812.0
Madhya Pradesh                               29723036.0
Gujarat                                      28101222.0
Rajasthan                                    27008606.0
Karnataka                                    25847691.0
Bihar                                        23350171.0
West Bengal                                  23257417.0
Tamil Nadu                                   20836674.0
Andhra Pradesh                               17628583.0
Kerala                                       15670747.0
Odisha                                       13954592.0
Telangana                                    11649268.0
Assam                                        10495293.0
Haryana                                      10086831.0
Chhattisgarh                                  9181482.0
Jhark

In [15]:
# c. Number of persons state-wise vaccinated for second dose
second_dose_statewise = df.groupby('State')['Second Dose Administered'].max().sort_values(ascending=False)
print("\nState-wise Second Dose Vaccinations:")
print(second_dose_statewise)


State-wise Second Dose Vaccinations:
State
India                                       113077994.0
Maharashtra                                  12112554.0
West Bengal                                   9132961.0
Gujarat                                       9051153.0
Uttar Pradesh                                 8515236.0
Rajasthan                                     8375056.0
Karnataka                                     7432852.0
Kerala                                        6426984.0
Andhra Pradesh                                6214312.0
Madhya Pradesh                                5733640.0
Tamil Nadu                                    4686034.0
Bihar                                         4484768.0
Odisha                                        4200094.0
Telangana                                     3965624.0
Delhi                                         3000536.0
Haryana                                       2923550.0
Chhattisgarh                                  2587695.0
Punj

In [16]:
# d. Total number of males vaccinated
total_males_vaccinated = df.groupby('State')['Male(Individuals Vaccinated)'].max().sum()
print("\nTotal number of males vaccinated in India:", total_males_vaccinated)


Total number of males vaccinated in India: 134941971.0


In [17]:
# e. Total number of females vaccinated
total_females_vaccinated = df.groupby('State')['Female(Individuals Vaccinated)'].max().sum()
print("Total number of females vaccinated in India:", total_females_vaccinated)

Total number of females vaccinated in India: 115668447.0
