In [None]:
import numpy as np 
import pandas as pd
from dateutil.parser import parse
from typing import List
import matplotlib.pyplot as plt
import seaborn as sns

# Introduction

I wanted to try a LightGBM model with PyCaret and see what could be done with it. This notebook is a quick rundown of that attempt rather than a tutorial, but I am sharing it in the hope that it helps someone trying something similar or saves someone some time.

In [None]:
# Read the competition training set and preview its first rows.
train_csv_path = "../input/tabular-playground-series-feb-2022/train.csv"
df = pd.read_csv(train_csv_path)
df.head()

# Use PyCaret to Find the Best Model

In [None]:
!pip install pycaret

In [None]:
# PyCaret is imported in this cell rather than in the top import cell because
# it is only installed by the pip cell that runs just before this one.
# Explicit names replace the star import so it is clear where every function
# used in the rest of the notebook comes from.
from pycaret.classification import (
    create_model,
    finalize_model,
    plot_model,
    predict_model,
    setup,
)

# Configure the PyCaret experiment:
#   - `row_id` is dropped before training (presumably a row identifier, not a
#     feature); DataFrame.drop returns a new frame, so `df` itself is untouched.
#   - missing numeric values are imputed with the column mean,
#   - features are normalized and class imbalance is corrected,
#   - `session_id` fixes the random seed for reproducibility,
#   - `silent=True` skips the interactive confirmation prompt.
# The trailing semicolon keeps the cell from echoing setup's return value.
setup(
    data=df.drop(columns="row_id"),
    target="target",
    numeric_imputation="mean",
    silent=True,
    normalize=True,
    session_id=42,
    fix_imbalance=True,
);

In [None]:
# Build a LightGBM classifier inside the experiment configured by setup().
model = create_model("lightgbm")

# Use the Best Model

In [None]:
# Echo the object returned by create_model so its repr is shown as the cell output.
model

In [None]:
# Call predict_model without an explicit `data` argument (PyCaret then scores
# its own hold-out split — see the predict_model docs). The trailing semicolon
# suppresses the echo of the returned value.
predict_model(model);

# Look at Model Metrics

In [None]:
# Class prediction error plot for the trained model.
plot_model(model, plot="error")

In [None]:
# Decision boundary plot for the trained model.
plot_model(model, plot="boundary")

In [None]:
# Feature importance plot for the trained model.
plot_model(model, plot="feature")

# Train Model on Full Dataset

In [None]:
# Produce the final estimator from `model` via finalize_model (per this
# section's heading, trained on the full dataset); `final_model` is what the
# submission cells below use for prediction.
final_model = finalize_model(model)

In [None]:
# Score the finalized model. The original cell passed `model`, which only
# repeated the earlier pre-finalize check and never exercised `final_model`.
# NOTE: per the PyCaret docs, finalize_model refits on the full dataset
# including the hold-out split, so these hold-out metrics are optimistic and
# serve as a sanity check rather than an unbiased estimate.
predict_model(final_model);

# Create Submission

In [None]:
# Load the competition test set without its `row_id` column, then run the
# finalized model over it and preview the resulting predictions.
test_csv_path = "../input/tabular-playground-series-feb-2022/test.csv"
test_data = pd.read_csv(test_csv_path).drop(columns="row_id")
predictions = predict_model(final_model, data=test_data)
predictions.head()

In [None]:
# Start from the sample submission file and overwrite its `target` column with
# the labels predicted for the test set, then preview the result.
sample_submission_path = "../input/tabular-playground-series-feb-2022/sample_submission.csv"
submissiondf = pd.read_csv(sample_submission_path)
submissiondf["target"] = predictions["Label"]
submissiondf.head()

In [None]:
# Write the submission to the working directory; index=False keeps the
# DataFrame index out of the CSV.
submissiondf.to_csv("submission.csv", index=False)