In [1]:
import pandas as pd
from lazypredict.Supervised import LazyClassifier
from sklearn.model_selection import train_test_split

# Configuration: input paths and split parameters, gathered in one place so
# they can be tuned without hunting through the cell.
FEATURES_PATH = "data/training_set_features.csv"
LABELS_PATH = "data/training_set_labels.csv"
TEST_SIZE = 0.2
RANDOM_STATE = 42


def evaluate_lazy_classifiers(features, target, test_size=TEST_SIZE, random_state=RANDOM_STATE):
    """Split ``features``/``target`` and fit a LazyClassifier on the split.

    This replaces the two copy-pasted split-and-fit sections (one per vaccine
    target) with a single parameterised routine.

    Parameters
    ----------
    features : pandas.DataFrame
        Feature matrix passed unchanged to ``train_test_split``.
    target : pandas.Series
        Label column; must be row-aligned with ``features``.
    test_size : float, optional
        Fraction of rows held out for evaluation (defaults to ``TEST_SIZE``).
    random_state : int, optional
        Seed for the shuffle performed by ``train_test_split`` (defaults to
        ``RANDOM_STATE``).

    Returns
    -------
    tuple
        ``(X_train, X_test, y_train, y_test, clf, models, predictions)`` where
        ``clf`` is the LazyClassifier instance and ``models``/``predictions``
        are the two objects returned by ``clf.fit``.
    """
    X_train, X_test, y_train, y_test = train_test_split(
        features, target, test_size=test_size, random_state=random_state
    )
    clf = LazyClassifier(verbose=0, ignore_warnings=True, custom_metric=None)
    models, predictions = clf.fit(X_train, X_test, y_train, y_test)
    return X_train, X_test, y_train, y_test, clf, models, predictions


# Load the datasets
features_df = pd.read_csv(FEATURES_PATH, index_col="respondent_id")
labels_df = pd.read_csv(LABELS_PATH, index_col="respondent_id")

# train_test_split pairs rows of X and y by position, not by index label, so a
# reordered or partial labels file would silently attach the wrong label to
# each respondent. Fail loudly instead.
assert features_df.index.equals(labels_df.index), (
    "features and labels must contain the same respondent_id values in the same order"
)

# Verify the loaded data
print("Features DataFrame:")
print(features_df.head())
print("\nLabels DataFrame:")
print(labels_df.head())

# Features and targets
features = features_df
target_h1n1 = labels_df['h1n1_vaccine']
target_seasonal = labels_df['seasonal_vaccine']

# Split + fit for h1n1_vaccine (same names as before so later cells keep working)
(
    X_train_h1n1,
    X_test_h1n1,
    y_train_h1n1,
    y_test_h1n1,
    clf_h1n1,
    models_h1n1,
    predictions_h1n1,
) = evaluate_lazy_classifiers(features, target_h1n1)

print("H1N1 Vaccine Models:")
print(models_h1n1)

# Split + fit for seasonal_vaccine
(
    X_train_seasonal,
    X_test_seasonal,
    y_train_seasonal,
    y_test_seasonal,
    clf_seasonal,
    models_seasonal,
    predictions_seasonal,
) = evaluate_lazy_classifiers(features, target_seasonal)

print("Seasonal Vaccine Models:")
print(models_seasonal)


  0%|          | 0/29 [00:00<?, ?it/s]

Features DataFrame:
               h1n1_concern  h1n1_knowledge  behavioral_antiviral_meds  \
respondent_id                                                            
0                      1.00            0.00                       0.00   
1                      3.00            2.00                       0.00   
2                      1.00            1.00                       0.00   
3                      1.00            1.00                       0.00   
4                      2.00            1.00                       0.00   

               behavioral_avoidance  behavioral_face_mask  \
respondent_id                                               
0                              0.00                  0.00   
1                              1.00                  0.00   
2                              1.00                  0.00   
3                              1.00                  0.00   
4                              1.00                  0.00   

               behavioral_wash_ha

100%|██████████| 29/29 [02:53<00:00,  5.97s/it]
  0%|          | 0/29 [00:00<?, ?it/s]

H1N1 Vaccine Models:
                               Accuracy  Balanced Accuracy  ROC AUC  F1 Score  \
Model                                                                           
LGBMClassifier                     0.86               0.73     0.73      0.85   
XGBClassifier                      0.85               0.73     0.73      0.84   
AdaBoostClassifier                 0.85               0.72     0.72      0.84   
GaussianNB                         0.75               0.71     0.71      0.77   
BernoulliNB                        0.80               0.71     0.71      0.80   
LinearDiscriminantAnalysis         0.84               0.70     0.70      0.82   
BaggingClassifier                  0.84               0.70     0.70      0.83   
RandomForestClassifier             0.85               0.69     0.69      0.83   
CalibratedClassifierCV             0.84               0.69     0.69      0.82   
ExtraTreesClassifier               0.85               0.68     0.68      0.83   
RidgeCl

100%|██████████| 29/29 [03:35<00:00,  7.44s/it]

Seasonal Vaccine Models:
                               Accuracy  Balanced Accuracy  ROC AUC  F1 Score  \
Model                                                                           
LGBMClassifier                     0.79               0.79     0.79      0.79   
SVC                                0.79               0.79     0.79      0.79   
AdaBoostClassifier                 0.79               0.78     0.78      0.79   
NuSVC                              0.78               0.78     0.78      0.78   
RandomForestClassifier             0.78               0.78     0.78      0.78   
RidgeClassifierCV                  0.78               0.78     0.78      0.78   
LinearDiscriminantAnalysis         0.78               0.78     0.78      0.78   
RidgeClassifier                    0.78               0.78     0.78      0.78   
CalibratedClassifierCV             0.78               0.78     0.78      0.78   
ExtraTreesClassifier               0.78               0.78     0.78      0.78   
XGB


