In [1]:
!pip install pandas
!pip install numpy
!pip install sklearn

Collecting sklearn
  Downloading sklearn-0.0.post10.tar.gz (3.6 kB)
  Preparing metadata (setup.py) ... done
Building wheels for collected packages: sklearn
  Building wheel for sklearn (setup.py) ... done
  Created wheel for sklearn: filename=sklearn-0.0.post10-py3-none-any.whl size=2959 sha256=912d84ab9dbb2285acacbda673cb76fd5042457c78bc64a06d2738b0e123c55a
  Stored in directory: /root/.cache/pip/wheels/5b/f6/92/0173054cc528db7ffe7b0c7652a96c3102aab156a6da960387
Successfully built sklearn
Installing collected packages: sklearn
Successfully installed sklearn-0.0.post10


In [4]:
import pandas as pd
from sklearn.linear_model import LinearRegression
from datetime import datetime

# ---------------------------------------------------------------------------
# Linear-trend forecast of confirmed / active / death counts.
#
# Pipeline: load CSV -> parse dates -> keep the training window -> sum the
# counts per date -> fit one straight line per target against "days since
# start_date" -> evaluate each line at the forecast date.
#
# NOTE(review): a straight line fitted through this window is a very rough
# extrapolation; treat the numbers as illustrative and confirm the modelling
# choice before relying on them.
# ---------------------------------------------------------------------------

# --- Configuration ---------------------------------------------------------
DATA_PATH = 'covid_19_india.csv'
FEATURE_COLUMN = 'Numerical_Date'
COUNT_COLUMNS = ['Confirmed', 'Cured', 'Deaths']

# Training window (March 2020 to August 2021), both ends inclusive.
start_date = datetime(2020, 3, 1)
end_date = datetime(2021, 8, 31)

# Point in time the forecast is evaluated at (first day of December 2021).
december_2021_date = datetime(2021, 12, 1)


def fit_linear_trend(features, target):
    """Return a ``LinearRegression`` fitted to map ``features`` onto ``target``.

    Parameters
    ----------
    features : pandas.DataFrame
        Feature matrix; its column names are remembered by the fitted model.
    target : pandas.Series
        Values to regress on ``features``.

    Returns
    -------
    sklearn.linear_model.LinearRegression
        The fitted estimator.
    """
    return LinearRegression().fit(features, target)


# --- Load ------------------------------------------------------------------
# Keep the raw frame under its own name so the filtered frame below does not
# overwrite it.
data_raw = pd.read_csv(DATA_PATH)

# --- Clean / filter --------------------------------------------------------
# Parse 'Date' (expected as day-month-year, e.g. 31-08-2021) and keep only the
# rows inside the training window. `between` is inclusive on both ends.
data = data_raw.assign(Date=pd.to_datetime(data_raw['Date'], format='%d-%m-%Y'))
data = data[data['Date'].between(start_date, end_date)]

if data.empty:
    # Fail with a clear message instead of an opaque error from the regressor.
    raise ValueError(
        f"No rows in {DATA_PATH!r} fall between {start_date:%Y-%m-%d} "
        f"and {end_date:%Y-%m-%d}"
    )

# --- Aggregate -------------------------------------------------------------
# Sum the counts over all rows that share a date.
# (presumably one row per state/region per day — verify against the CSV)
data_grouped = data.groupby('Date', as_index=False)[COUNT_COLUMNS].sum()

# Numeric feature for the regression: whole days elapsed since start_date.
data_grouped[FEATURE_COLUMN] = (data_grouped['Date'] - start_date).dt.days

# --- Features and targets --------------------------------------------------
X = data_grouped[[FEATURE_COLUMN]]
y_total_cases = data_grouped['Confirmed']
# Active = confirmed minus those no longer active (cured or deceased).
y_active_cases = data_grouped['Confirmed'] - data_grouped['Cured'] - data_grouped['Deaths']
y_deaths = data_grouped['Deaths']

# --- Fit one linear model per target ---------------------------------------
model_total_cases = fit_linear_trend(X, y_total_cases)
model_active_cases = fit_linear_trend(X, y_active_cases)
model_deaths = fit_linear_trend(X, y_deaths)

# --- Predict ---------------------------------------------------------------
numerical_date_december_2021 = (december_2021_date - start_date).days

# Query with a DataFrame carrying the same column name the models were fitted
# on; passing a bare nested list makes scikit-learn warn that X has no valid
# feature names.
X_december_2021 = pd.DataFrame({FEATURE_COLUMN: [numerical_date_december_2021]})

predicted_total_cases = model_total_cases.predict(X_december_2021)[0]
predicted_active_cases = model_active_cases.predict(X_december_2021)[0]
predicted_deaths = model_deaths.predict(X_december_2021)[0]

# int() truncates the fractional part of each prediction before printing.
print("Predicted Total Cases in December 2021:", int(predicted_total_cases))
print("Predicted Active Cases in December 2021:", int(predicted_active_cases))
print("Predicted Deaths in December 2021:", int(predicted_deaths))


Predicted Total Cases in December 2021: 33611948
Predicted Active Cases in December 2021: 1550284
Predicted Deaths in December 2021: 430994


