## PyCaret

In [None]:
# check installed version
# NOTE: this import fails if PyCaret is not installed yet; in that case run
# the pip install cell that follows first, then re-run this cell.
import pycaret
pycaret.__version__

In [None]:
!pip install pycaret[models]

In [None]:
# re-check the PyCaret version after the install step
# NOTE: if pycaret was already imported in this session, restart the kernel
# so that a newly installed version is the one that gets loaded.
import pycaret
pycaret.__version__

In [None]:
# loading sample dataset from pycaret dataset module
# `data` is the object passed to every setup() call in this notebook
from pycaret.datasets import get_data
data = get_data('diabetes')

## Setup
This function initializes the training environment and creates the transformation pipeline. The setup function must be called before executing any other function in PyCaret. It has only two required parameters: data and target. All the other parameters are optional.

In [None]:
# import pycaret classification and init setup (functional API)
# The wildcard import is what makes setup(), compare_models(), plot_model(),
# predict_model(), save_model(), load_model() and get_config() available
# unqualified in the cells below.
from pycaret.classification import *
# 'Class variable' is the target column; session_id = 123 is reused by every
# setup() call in this notebook (presumably a seed for reproducibility --
# confirm against the PyCaret setup documentation).
s = setup(data, target = 'Class variable', session_id = 123)

In [None]:
# import ClassificationExperiment and init the class (OOP API)
# `exp` is the experiment object used by the exp.setup() and
# exp.compare_models() cells below.
from pycaret.classification import ClassificationExperiment
exp = ClassificationExperiment()

In [None]:
# check the type of exp (it was constructed as a ClassificationExperiment)
type(exp)

In [None]:
# init setup on exp, with the same data, target and session_id as the
# functional setup() call; the return value is not stored, only displayed
exp.setup(data, target = 'Class variable', session_id = 123)

## Compare Models
This function trains and evaluates the performance of all the estimators available in the model library using cross-validation. The output of this function is a scoring grid with average cross-validated scores. Metrics evaluated during CV can be accessed using the get_metrics function. Custom metrics can be added or removed using the add_metric and remove_metric functions.

In [None]:
# compare baseline models
# the result is kept in `best`, which the plot_model, predict_model and
# save_model cells below operate on
best = compare_models()


In [None]:
# compare models using OOP (same step, run on the `exp` object)
# the return value is not assigned here, so it is only shown as cell output
exp.compare_models()

## Analyze Model
You can use the plot_model function to analyze the performance of a trained model on the test set. It may require re-training the model in certain cases.

In [None]:
# plot confusion matrix for `best` (the model returned by compare_models)
plot_model(best, plot = 'confusion_matrix')

In [None]:
# plot AUC for `best` (the model returned by compare_models)
plot_model(best, plot = 'auc')

In [None]:
# plot feature importance for `best` (the model returned by compare_models)
plot_model(best, plot = 'feature')

## Prediction
The predict_model function returns prediction_label and prediction_score (the probability of the predicted class) as new columns in the dataframe. When data is None (the default), it uses the test set (created during the setup function) for scoring.

In [None]:
# predict on test set
# no `data` argument is passed, so predict_model scores the test set that
# was created during setup()
holdout_pred = predict_model(best)

In [None]:
# show the first rows of the predictions dataframe, including the
# prediction_label and prediction_score columns added by predict_model
holdout_pred.head()

## Save Model
Finally, you can save the entire pipeline on disk for later use, using pycaret's save_model function.

In [None]:
# save pipeline: persist `best` to disk under the name 'my_first_pipeline'
# (the load_model cell below uses the same name)
save_model(best, 'my_first_pipeline')

In [None]:
# load pipeline back from disk using the name it was saved under
loaded_best_pipeline = load_model('my_first_pipeline')
# bare expression as the last line so the notebook displays the loaded object
loaded_best_pipeline

## Setup
This function initializes the experiment in PyCaret and creates the transformation pipeline based on all the parameters passed in the function. The setup function must be called before executing any other function. It takes two required parameters: data and target. All the other parameters are optional and are used for configuring the data preprocessing pipeline.

In [None]:
# init setup function
# re-runs the functional setup() with the same arguments as the first
# setup() call in this notebook; the get_config() cells below read from it
s = setup(data, target = 'Class variable', session_id = 123)

In [None]:
# check all available config (get_config called with no argument)
get_config()

In [None]:
# let's access X_train_transformed
get_config('X_train_transformed')

In [None]:
# let's check X_train_transformed to see the effect of the params passed to
# setup(): histogram of the 'Number of times pregnant' column
get_config('X_train_transformed')['Number of times pregnant'].hist()

In [None]:
# same column taken from X_train (rather than X_train_transformed), to
# compare against the histogram of the transformed data
get_config('X_train')['Number of times pregnant'].hist()