# <span style="color: #b0f542">Task 1: COVID-19 Risk Classification </span>

### **Objective**
Predict whether an individual is likely to contract COVID-19 using the provided dataset.

### **Requirements**
- Use **Random Forest Classifier** and **Gradient Boosted Classifier** to build predictive models.
- Evaluate the models and provide **comparative insights** into their performance.
- Analyze **feature importance** and discuss the **practical implications** of the models.


In [108]:
import pandas as pd

from notebooks.assignment_2 import X_test

In [109]:
covid_ds = pd.read_csv(filepath_or_buffer="datasets/coronavirusdataset.csv")

In [110]:
covid_ds.head(5)

Unnamed: 0,batch_date,test_name,swab_type,covid19_test_results,age,high_risk_exposure_occupation,high_risk_interactions,diabetes,chd,htn,...,headache,loss_of_smell,loss_of_taste,runny_nose,muscle_sore,sore_throat,cxr_findings,cxr_impression,cxr_label,cxr_link
0,2020-10-20,"SARS-CoV-2, NAA",Nasal,Negative,39,False,,False,False,False,...,False,False,False,False,False,False,,,,
1,2020-10-20,COVID-19 PCR External Result,Nasal,Negative,56,False,,False,False,False,...,False,False,False,False,False,False,,,,
2,2020-10-20,Rapid COVID-19 PCR Test,Nasal,Negative,35,False,,False,False,False,...,False,False,False,False,False,False,,,,
3,2020-10-20,Rapid COVID-19 PCR Test,Nasal,Negative,37,False,,False,False,False,...,False,False,False,False,False,False,,,,
4,2020-10-20,Rapid COVID-19 PCR Test,Nasal,Negative,42,False,,False,False,False,...,False,False,False,False,False,False,,,,


In [111]:
covid_ds

Unnamed: 0,batch_date,test_name,swab_type,covid19_test_results,age,high_risk_exposure_occupation,high_risk_interactions,diabetes,chd,htn,...,headache,loss_of_smell,loss_of_taste,runny_nose,muscle_sore,sore_throat,cxr_findings,cxr_impression,cxr_label,cxr_link
0,2020-10-20,"SARS-CoV-2, NAA",Nasal,Negative,39,False,,False,False,False,...,False,False,False,False,False,False,,,,
1,2020-10-20,COVID-19 PCR External Result,Nasal,Negative,56,False,,False,False,False,...,False,False,False,False,False,False,,,,
2,2020-10-20,Rapid COVID-19 PCR Test,Nasal,Negative,35,False,,False,False,False,...,False,False,False,False,False,False,,,,
3,2020-10-20,Rapid COVID-19 PCR Test,Nasal,Negative,37,False,,False,False,False,...,False,False,False,False,False,False,,,,
4,2020-10-20,Rapid COVID-19 PCR Test,Nasal,Negative,42,False,,False,False,False,...,False,False,False,False,False,False,,,,
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
7289,2020-10-20,COVID-19 PCR External Result,Nasal,Negative,26,False,,False,False,False,...,False,False,False,False,False,False,,,,
7290,2020-10-20,"SARS-CoV-2, NAA",Nasal,Negative,29,False,False,False,False,False,...,False,False,False,False,False,False,,,,
7291,2020-10-20,"SARS-CoV-2, NAA",Nasal,Negative,33,False,,False,False,False,...,False,False,False,False,False,False,,,,
7292,2020-10-20,Rapid COVID-19 PCR Test,Nasal,Negative,46,False,False,False,False,False,...,False,False,False,False,False,False,,,,


In [112]:
covid_ds.columns

Index(['batch_date', 'test_name', 'swab_type', 'covid19_test_results', 'age',
       'high_risk_exposure_occupation', 'high_risk_interactions', 'diabetes',
       'chd', 'htn', 'cancer', 'asthma', 'copd', 'autoimmune_dis', 'smoker',
       'temperature', 'pulse', 'sys', 'dia', 'rr', 'sats', 'rapid_flu_results',
       'rapid_strep_results', 'ctab', 'labored_respiration', 'rhonchi',
       'wheezes', 'days_since_symptom_onset', 'cough', 'cough_severity',
       'fever', 'sob', 'sob_severity', 'diarrhea', 'fatigue', 'headache',
       'loss_of_smell', 'loss_of_taste', 'runny_nose', 'muscle_sore',
       'sore_throat', 'cxr_findings', 'cxr_impression', 'cxr_label',
       'cxr_link'],
      dtype='object')

## <span style="color:#b0f542">1.1 Feature Engineering</span>
Removing the batch date column since each datapoint is 2020-10-20

In [113]:
covid_ds = covid_ds.drop('batch_date', axis=1)

In [114]:
covid_ds.tail(4)

Unnamed: 0,test_name,swab_type,covid19_test_results,age,high_risk_exposure_occupation,high_risk_interactions,diabetes,chd,htn,cancer,...,headache,loss_of_smell,loss_of_taste,runny_nose,muscle_sore,sore_throat,cxr_findings,cxr_impression,cxr_label,cxr_link
7290,"SARS-CoV-2, NAA",Nasal,Negative,29,False,False,False,False,False,False,...,False,False,False,False,False,False,,,,
7291,"SARS-CoV-2, NAA",Nasal,Negative,33,False,,False,False,False,False,...,False,False,False,False,False,False,,,,
7292,Rapid COVID-19 PCR Test,Nasal,Negative,46,False,False,False,False,False,False,...,False,False,False,False,False,False,,,,
7293,Rapid COVID-19 PCR Test,Nasal,Negative,53,False,,False,False,True,False,...,False,False,False,False,False,False,,,,


imputing the high_risk_exposure_occupation missing values with the modal value i.e "False"

In [115]:
covid_ds['high_risk_exposure_occupation'] = covid_ds['high_risk_exposure_occupation'].apply(lambda x: False if pd.isna(x) else x)

In [116]:
covid_ds.sample(5)

Unnamed: 0,test_name,swab_type,covid19_test_results,age,high_risk_exposure_occupation,high_risk_interactions,diabetes,chd,htn,cancer,...,headache,loss_of_smell,loss_of_taste,runny_nose,muscle_sore,sore_throat,cxr_findings,cxr_impression,cxr_label,cxr_link
2648,Rapid COVID-19 PCR Test,Nasal,Negative,56,False,,False,False,False,False,...,False,False,False,False,False,False,,,,
6673,Rapid COVID-19 PCR Test,Nasal,Negative,56,False,,False,False,False,False,...,False,False,False,False,False,False,,,,
252,"SARS-CoV-2, NAA",Nasal,Negative,31,False,False,False,False,False,False,...,False,False,False,False,False,False,,,,
3993,"SARS-CoV-2, NAA",Nasal,Negative,35,False,True,False,False,False,False,...,False,False,False,False,False,False,,,,
42,Rapid COVID-19 PCR Test,Nasal,Negative,64,False,,False,False,False,False,...,False,False,False,False,False,False,,,,


below we impute the columns 'sats',
    'temperature',
     missing values with their respective mode

In [117]:
cols = [
    'sats',
    'temperature',
]

for c in cols:
    covid_ds[c] = covid_ds[c].fillna(covid_ds[c].mean())


In [118]:
covid_ds.sample(5)

Unnamed: 0,test_name,swab_type,covid19_test_results,age,high_risk_exposure_occupation,high_risk_interactions,diabetes,chd,htn,cancer,...,headache,loss_of_smell,loss_of_taste,runny_nose,muscle_sore,sore_throat,cxr_findings,cxr_impression,cxr_label,cxr_link
6780,Rapid COVID-19 PCR Test,Nasal,Negative,37,False,,False,False,False,False,...,False,False,False,False,False,False,,,,
4743,Rapid COVID-19 PCR Test,Nasal,Negative,18,False,,False,False,False,False,...,False,False,False,False,False,False,,,,
2525,Rapid COVID-19 PCR Test,Nasal,Negative,25,False,,False,False,False,False,...,False,False,False,False,False,False,,,,
5925,COVID-19 PCR External Result,Nasal,Negative,58,False,,False,False,False,False,...,False,False,False,False,False,False,,,,
2412,COVID-19 PCR External Result,Nasal,Negative,56,False,,False,False,False,False,...,False,False,False,False,False,False,,,,


removing 'cough_severity',
    'sob_severity',
    'days_since_symptom_onset' columns due to too few data points despite their relative importance

In [119]:
covid_ds = covid_ds.drop(['cough_severity',
    'sob_severity',
    'days_since_symptom_onset'], axis=1)
covid_ds

Unnamed: 0,test_name,swab_type,covid19_test_results,age,high_risk_exposure_occupation,high_risk_interactions,diabetes,chd,htn,cancer,...,headache,loss_of_smell,loss_of_taste,runny_nose,muscle_sore,sore_throat,cxr_findings,cxr_impression,cxr_label,cxr_link
0,"SARS-CoV-2, NAA",Nasal,Negative,39,False,,False,False,False,False,...,False,False,False,False,False,False,,,,
1,COVID-19 PCR External Result,Nasal,Negative,56,False,,False,False,False,False,...,False,False,False,False,False,False,,,,
2,Rapid COVID-19 PCR Test,Nasal,Negative,35,False,,False,False,False,False,...,False,False,False,False,False,False,,,,
3,Rapid COVID-19 PCR Test,Nasal,Negative,37,False,,False,False,False,False,...,False,False,False,False,False,False,,,,
4,Rapid COVID-19 PCR Test,Nasal,Negative,42,False,,False,False,False,False,...,False,False,False,False,False,False,,,,
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
7289,COVID-19 PCR External Result,Nasal,Negative,26,False,,False,False,False,False,...,False,False,False,False,False,False,,,,
7290,"SARS-CoV-2, NAA",Nasal,Negative,29,False,False,False,False,False,False,...,False,False,False,False,False,False,,,,
7291,"SARS-CoV-2, NAA",Nasal,Negative,33,False,,False,False,False,False,...,False,False,False,False,False,False,,,,
7292,Rapid COVID-19 PCR Test,Nasal,Negative,46,False,False,False,False,False,False,...,False,False,False,False,False,False,,,,


In [120]:
covid_ds.columns

Index(['test_name', 'swab_type', 'covid19_test_results', 'age',
       'high_risk_exposure_occupation', 'high_risk_interactions', 'diabetes',
       'chd', 'htn', 'cancer', 'asthma', 'copd', 'autoimmune_dis', 'smoker',
       'temperature', 'pulse', 'sys', 'dia', 'rr', 'sats', 'rapid_flu_results',
       'rapid_strep_results', 'ctab', 'labored_respiration', 'rhonchi',
       'wheezes', 'cough', 'fever', 'sob', 'diarrhea', 'fatigue', 'headache',
       'loss_of_smell', 'loss_of_taste', 'runny_nose', 'muscle_sore',
       'sore_throat', 'cxr_findings', 'cxr_impression', 'cxr_label',
       'cxr_link'],
      dtype='object')

removing the following columns due to too few datapoints relative to their importance in making a covid diagnosis:
'rapid_flu_results','rapid_strep_results', 'cxr_link''rapid_flu_results', 'rapid_strep_results', 'ctab', 'rr', 'sys', 'dia',  'cxr_findings', 'cxr_impression', 'cxr_label','wheezes'

In [121]:
covid_ds= covid_ds.drop(['rapid_flu_results','rapid_strep_results', 'cxr_link','rapid_flu_results', 'rapid_strep_results', 'ctab', 'rr', 'sys', 'dia',  'cxr_findings', 'cxr_impression', 'cxr_label','wheezes'], axis= 1)

In [122]:
covid_ds = covid_ds.drop(['rhonchi', 'labored_respiration'], axis=1)

In [123]:
covid_ds.columns

Index(['test_name', 'swab_type', 'covid19_test_results', 'age',
       'high_risk_exposure_occupation', 'high_risk_interactions', 'diabetes',
       'chd', 'htn', 'cancer', 'asthma', 'copd', 'autoimmune_dis', 'smoker',
       'temperature', 'pulse', 'sats', 'cough', 'fever', 'sob', 'diarrhea',
       'fatigue', 'headache', 'loss_of_smell', 'loss_of_taste', 'runny_nose',
       'muscle_sore', 'sore_throat'],
      dtype='object')

In [124]:
covid_ds

Unnamed: 0,test_name,swab_type,covid19_test_results,age,high_risk_exposure_occupation,high_risk_interactions,diabetes,chd,htn,cancer,...,fever,sob,diarrhea,fatigue,headache,loss_of_smell,loss_of_taste,runny_nose,muscle_sore,sore_throat
0,"SARS-CoV-2, NAA",Nasal,Negative,39,False,,False,False,False,False,...,,False,False,False,False,False,False,False,False,False
1,COVID-19 PCR External Result,Nasal,Negative,56,False,,False,False,False,False,...,,False,False,False,False,False,False,False,False,False
2,Rapid COVID-19 PCR Test,Nasal,Negative,35,False,,False,False,False,False,...,,False,False,False,False,False,False,False,False,False
3,Rapid COVID-19 PCR Test,Nasal,Negative,37,False,,False,False,False,False,...,,False,False,False,False,False,False,False,False,False
4,Rapid COVID-19 PCR Test,Nasal,Negative,42,False,,False,False,False,False,...,,False,False,False,False,False,False,False,False,False
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
7289,COVID-19 PCR External Result,Nasal,Negative,26,False,,False,False,False,False,...,,False,False,False,False,False,False,False,False,False
7290,"SARS-CoV-2, NAA",Nasal,Negative,29,False,False,False,False,False,False,...,False,False,False,False,False,False,False,False,False,False
7291,"SARS-CoV-2, NAA",Nasal,Negative,33,False,,False,False,False,False,...,,False,False,False,False,False,False,False,False,False
7292,Rapid COVID-19 PCR Test,Nasal,Negative,46,False,False,False,False,False,False,...,False,False,False,False,False,False,False,False,False,False


removing fever since temperature is already covered

In [125]:
covid_ds = covid_ds.drop('fever', axis=1)

In [126]:
covid_ds

Unnamed: 0,test_name,swab_type,covid19_test_results,age,high_risk_exposure_occupation,high_risk_interactions,diabetes,chd,htn,cancer,...,cough,sob,diarrhea,fatigue,headache,loss_of_smell,loss_of_taste,runny_nose,muscle_sore,sore_throat
0,"SARS-CoV-2, NAA",Nasal,Negative,39,False,,False,False,False,False,...,False,False,False,False,False,False,False,False,False,False
1,COVID-19 PCR External Result,Nasal,Negative,56,False,,False,False,False,False,...,False,False,False,False,False,False,False,False,False,False
2,Rapid COVID-19 PCR Test,Nasal,Negative,35,False,,False,False,False,False,...,False,False,False,False,False,False,False,False,False,False
3,Rapid COVID-19 PCR Test,Nasal,Negative,37,False,,False,False,False,False,...,False,False,False,False,False,False,False,False,False,False
4,Rapid COVID-19 PCR Test,Nasal,Negative,42,False,,False,False,False,False,...,False,False,False,False,False,False,False,False,False,False
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
7289,COVID-19 PCR External Result,Nasal,Negative,26,False,,False,False,False,False,...,False,False,False,False,False,False,False,False,False,False
7290,"SARS-CoV-2, NAA",Nasal,Negative,29,False,False,False,False,False,False,...,False,False,False,False,False,False,False,False,False,False
7291,"SARS-CoV-2, NAA",Nasal,Negative,33,False,,False,False,False,False,...,False,False,False,False,False,False,False,False,False,False
7292,Rapid COVID-19 PCR Test,Nasal,Negative,46,False,False,False,False,False,False,...,False,False,False,False,False,False,False,False,False,False


imputing missing pulse values with the average due to its relative importance

In [127]:
covid_ds['pulse'] = covid_ds['pulse'].fillna(covid_ds['pulse'].mean())
covid_ds

Unnamed: 0,test_name,swab_type,covid19_test_results,age,high_risk_exposure_occupation,high_risk_interactions,diabetes,chd,htn,cancer,...,cough,sob,diarrhea,fatigue,headache,loss_of_smell,loss_of_taste,runny_nose,muscle_sore,sore_throat
0,"SARS-CoV-2, NAA",Nasal,Negative,39,False,,False,False,False,False,...,False,False,False,False,False,False,False,False,False,False
1,COVID-19 PCR External Result,Nasal,Negative,56,False,,False,False,False,False,...,False,False,False,False,False,False,False,False,False,False
2,Rapid COVID-19 PCR Test,Nasal,Negative,35,False,,False,False,False,False,...,False,False,False,False,False,False,False,False,False,False
3,Rapid COVID-19 PCR Test,Nasal,Negative,37,False,,False,False,False,False,...,False,False,False,False,False,False,False,False,False,False
4,Rapid COVID-19 PCR Test,Nasal,Negative,42,False,,False,False,False,False,...,False,False,False,False,False,False,False,False,False,False
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
7289,COVID-19 PCR External Result,Nasal,Negative,26,False,,False,False,False,False,...,False,False,False,False,False,False,False,False,False,False
7290,"SARS-CoV-2, NAA",Nasal,Negative,29,False,False,False,False,False,False,...,False,False,False,False,False,False,False,False,False,False
7291,"SARS-CoV-2, NAA",Nasal,Negative,33,False,,False,False,False,False,...,False,False,False,False,False,False,False,False,False,False
7292,Rapid COVID-19 PCR Test,Nasal,Negative,46,False,False,False,False,False,False,...,False,False,False,False,False,False,False,False,False,False


imputing missing values in the high_risk_interactions columns with the mode

In [128]:
covid_ds['high_risk_interactions'] = covid_ds['high_risk_interactions'].fillna(False)
covid_ds

  covid_ds['high_risk_interactions'] = covid_ds['high_risk_interactions'].fillna(False)


Unnamed: 0,test_name,swab_type,covid19_test_results,age,high_risk_exposure_occupation,high_risk_interactions,diabetes,chd,htn,cancer,...,cough,sob,diarrhea,fatigue,headache,loss_of_smell,loss_of_taste,runny_nose,muscle_sore,sore_throat
0,"SARS-CoV-2, NAA",Nasal,Negative,39,False,False,False,False,False,False,...,False,False,False,False,False,False,False,False,False,False
1,COVID-19 PCR External Result,Nasal,Negative,56,False,False,False,False,False,False,...,False,False,False,False,False,False,False,False,False,False
2,Rapid COVID-19 PCR Test,Nasal,Negative,35,False,False,False,False,False,False,...,False,False,False,False,False,False,False,False,False,False
3,Rapid COVID-19 PCR Test,Nasal,Negative,37,False,False,False,False,False,False,...,False,False,False,False,False,False,False,False,False,False
4,Rapid COVID-19 PCR Test,Nasal,Negative,42,False,False,False,False,False,False,...,False,False,False,False,False,False,False,False,False,False
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
7289,COVID-19 PCR External Result,Nasal,Negative,26,False,False,False,False,False,False,...,False,False,False,False,False,False,False,False,False,False
7290,"SARS-CoV-2, NAA",Nasal,Negative,29,False,False,False,False,False,False,...,False,False,False,False,False,False,False,False,False,False
7291,"SARS-CoV-2, NAA",Nasal,Negative,33,False,False,False,False,False,False,...,False,False,False,False,False,False,False,False,False,False
7292,Rapid COVID-19 PCR Test,Nasal,Negative,46,False,False,False,False,False,False,...,False,False,False,False,False,False,False,False,False,False


## <span style="color:#b0f542;">1.2 Feature Encoding</span>

test_name encoding

In [129]:
from sklearn import preprocessing
encoder = preprocessing.LabelEncoder()

In [130]:
covid_ds['test_name'] = encoder.fit_transform(covid_ds['test_name'])

In [131]:
covid_ds

Unnamed: 0,test_name,swab_type,covid19_test_results,age,high_risk_exposure_occupation,high_risk_interactions,diabetes,chd,htn,cancer,...,cough,sob,diarrhea,fatigue,headache,loss_of_smell,loss_of_taste,runny_nose,muscle_sore,sore_throat
0,5,Nasal,Negative,39,False,False,False,False,False,False,...,False,False,False,False,False,False,False,False,False,False
1,0,Nasal,Negative,56,False,False,False,False,False,False,...,False,False,False,False,False,False,False,False,False,False
2,2,Nasal,Negative,35,False,False,False,False,False,False,...,False,False,False,False,False,False,False,False,False,False
3,2,Nasal,Negative,37,False,False,False,False,False,False,...,False,False,False,False,False,False,False,False,False,False
4,2,Nasal,Negative,42,False,False,False,False,False,False,...,False,False,False,False,False,False,False,False,False,False
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
7289,0,Nasal,Negative,26,False,False,False,False,False,False,...,False,False,False,False,False,False,False,False,False,False
7290,5,Nasal,Negative,29,False,False,False,False,False,False,...,False,False,False,False,False,False,False,False,False,False
7291,5,Nasal,Negative,33,False,False,False,False,False,False,...,False,False,False,False,False,False,False,False,False,False
7292,2,Nasal,Negative,46,False,False,False,False,False,False,...,False,False,False,False,False,False,False,False,False,False


swab_type encoding

In [132]:
covid_ds['swab_type'] = encoder.fit_transform(covid_ds['swab_type'])

In [133]:
covid_ds

Unnamed: 0,test_name,swab_type,covid19_test_results,age,high_risk_exposure_occupation,high_risk_interactions,diabetes,chd,htn,cancer,...,cough,sob,diarrhea,fatigue,headache,loss_of_smell,loss_of_taste,runny_nose,muscle_sore,sore_throat
0,5,1,Negative,39,False,False,False,False,False,False,...,False,False,False,False,False,False,False,False,False,False
1,0,1,Negative,56,False,False,False,False,False,False,...,False,False,False,False,False,False,False,False,False,False
2,2,1,Negative,35,False,False,False,False,False,False,...,False,False,False,False,False,False,False,False,False,False
3,2,1,Negative,37,False,False,False,False,False,False,...,False,False,False,False,False,False,False,False,False,False
4,2,1,Negative,42,False,False,False,False,False,False,...,False,False,False,False,False,False,False,False,False,False
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
7289,0,1,Negative,26,False,False,False,False,False,False,...,False,False,False,False,False,False,False,False,False,False
7290,5,1,Negative,29,False,False,False,False,False,False,...,False,False,False,False,False,False,False,False,False,False
7291,5,1,Negative,33,False,False,False,False,False,False,...,False,False,False,False,False,False,False,False,False,False
7292,2,1,Negative,46,False,False,False,False,False,False,...,False,False,False,False,False,False,False,False,False,False


## <span style="color:#b0f542;">2. Model Training</span>

In [135]:
from sklearn.model_selection import train_test_split
X = covid_ds.drop('covid19_test_results', axis=1)
y = covid_ds['covid19_test_results']

In [136]:
X_train, X_test, y_train, y_test = train_test_split(X, y, random_state=42)

In [137]:
X_train

Unnamed: 0,test_name,swab_type,age,high_risk_exposure_occupation,high_risk_interactions,diabetes,chd,htn,cancer,asthma,...,cough,sob,diarrhea,fatigue,headache,loss_of_smell,loss_of_taste,runny_nose,muscle_sore,sore_throat
5317,2,1,45,False,False,False,False,False,False,False,...,False,False,False,False,False,False,False,False,False,False
5866,0,1,35,False,False,False,False,False,False,False,...,False,False,False,False,False,False,False,False,False,False
4447,0,1,70,False,False,False,False,False,False,False,...,False,False,False,False,False,False,False,False,False,False
3208,0,1,57,False,False,False,False,False,False,False,...,False,False,False,False,False,False,False,False,False,False
6171,2,1,36,False,False,False,False,False,False,False,...,False,False,False,False,False,False,False,False,False,False
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
5191,5,1,47,False,False,False,False,False,False,False,...,False,False,False,False,False,False,False,False,False,False
5226,5,1,42,False,True,False,False,False,False,False,...,False,False,False,False,False,False,False,False,False,False
5390,0,0,72,False,False,False,False,False,False,False,...,False,False,False,False,False,False,False,False,False,False
860,5,1,40,False,False,False,False,False,False,False,...,False,False,False,False,False,False,False,False,False,False


In [138]:
y

0       Negative
1       Negative
2       Negative
3       Negative
4       Negative
          ...   
7289    Negative
7290    Negative
7291    Negative
7292    Negative
7293    Negative
Name: covid19_test_results, Length: 7294, dtype: object