In [1]:
import pandas as pd
import numpy as np
from preprocessy.pipelines import StandardPipeline, BasePipeline
from sklearn.tree import DecisionTreeClassifier
from sklearn import metrics
import random
import time
import tracemalloc
from sklearn.pipeline import Pipeline
from sklearn.base import BaseEstimator, TransformerMixin
from sklearn.impute import SimpleImputer
from sklearn.preprocessing import StandardScaler
from sklearn.preprocessing import OneHotEncoder
from sklearn.model_selection import train_test_split
from sklearn.compose import ColumnTransformer
from sklearn.neighbors import LocalOutlierFactor
from sklearn.metrics import mean_squared_error  

In [3]:
# Load the census CSV (path is relative to the notebook's working directory)
# into a DataFrame.
df = pd.read_csv('census.csv')

In [4]:
# Display the (rows, columns) dimensions of the loaded DataFrame.
df.shape

(199523, 42)

## Preprocessy

In [5]:
def test_preprocessy_pipeline(random_state):
    """Run the Preprocessy StandardPipeline on census.csv and score a decision tree.

    The pipeline is configured with target column ``F42``, a shuffled
    train/test split with ``test_size=0.1`` and outlier removal disabled.
    After ``process()`` the train/test splits are read back from the same
    ``params`` dict that was handed to the pipeline, the original categorical
    columns are dropped, and a ``DecisionTreeClassifier`` is fit on what
    remains.

    Parameters
    ----------
    random_state : int
        Seed forwarded to the pipeline (``params['random_state']``) and to
        the decision tree, so a given seed yields a repeatable score.

    Returns
    -------
    float
        Classification accuracy of the tree on the held-out split
        (``sklearn.metrics.accuracy_score``). Note this is an accuracy,
        not an error measure.
    """
    # Continuous features of the dataset; every other feature column
    # F1..F41 is treated as categorical (F42 is the target).
    cont_cols = ['F1', 'F6', 'F17', 'F18', 'F19', 'F25']
    cat_cols = [
        name
        for name in ('F' + str(idx) for idx in range(1, 42))
        if name not in cont_cols
    ]

    params = {
        'target_label': "F42",
        # Pass a copy so the list used for the column drop below cannot be
        # altered by the pipeline.
        'cat_cols': cat_cols.copy(),
        'remove_outliers': False,
        # The original literal listed 'test_size' twice (0.2, then 0.1);
        # Python keeps the last value, so 0.1 is the setting that was
        # actually in effect.
        'test_size': 0.1,
        'shuffle': True,
        'random_state': random_state,
        'n_splits': 2,
    }

    pipeline = StandardPipeline(train_df_path="census.csv", params=params)
    pipeline.process()

    # The splits are read from `params`, which the pipeline is expected to
    # have populated in place during process().
    X_train = params['X_train'].drop(columns=cat_cols)
    X_test = params['X_test'].drop(columns=cat_cols)
    y_train = params['y_train']
    y_test = params['y_test']

    # Seed the tree as well: an unseeded tree breaks ties between equally
    # good splits randomly, making the score vary between identical runs.
    clf = DecisionTreeClassifier(random_state=random_state)
    clf.fit(X_train, y_train)
    y_pred = clf.predict(X_test)
    return metrics.accuracy_score(y_test, y_pred)

In [6]:
# Benchmark the Preprocessy pipeline over 100 seeds, recording for each run
# the elapsed time, the peak traced Python memory, and the returned score.
# NOTE: despite their names these lists hold per-run samples (not averages),
# and `average_mse` holds the accuracy returned by test_preprocessy_pipeline.
# The names are kept so later cells that read them keep working.
average_time = []
average_mem = []
average_mse = []
for i in range(100):
    tracemalloc.start()
    try:
        # perf_counter is a monotonic, high-resolution clock intended for
        # measuring intervals; time.time() can jump if the system clock
        # is adjusted mid-run.
        begin = time.perf_counter()
        mse = test_preprocessy_pipeline(i)
        end = time.perf_counter()
        # get_traced_memory() returns (current, peak); only the peak is kept.
        peak = tracemalloc.get_traced_memory()[1]
    finally:
        # stop() also discards collected traces, so each iteration starts
        # from a clean slate, and tracing is never left enabled if the
        # pipeline raises.
        tracemalloc.stop()
    average_time.append(end - begin)
    average_mem.append(peak)
    average_mse.append(mse)


Pipeline Class: StandardPipeline

+-----------------------+---------------------------------------------------------------------------------------+
| Pipeline Property     | Value                                                                                 |
+-----------------------+---------------------------------------------------------------------------------------+
| Train Dataframe Path  | ../datasets/classification/census.csv                                                 |
| Test Dataframe Path   | None                                                                                  |
| Config File Path      | None                                                                                  |
| Pipeline Stages       | Read file, Parse dataset, Execute, Encode, Handle outliers, Execute, Train test split |
| Total Pipeline Stages | 7                                                                                     |
| Total Params          | 9                          



==> Completed Stage: Execute
==> Completed Stage: Train test split
Pipeline Stages |████████████████████████████████████████| 7/7 [100%] in 4.9s (1.42/s)

Pipeline Completed Successfully


Pipeline Class: StandardPipeline

+-----------------------+---------------------------------------------------------------------------------------+
| Pipeline Property     | Value                                                                                 |
+-----------------------+---------------------------------------------------------------------------------------+
| Train Dataframe Path  | ../datasets/classification/census.csv                                                 |
| Test Dataframe Path   | None                                                                                  |
| Config File Path      | None                                                                                  |
| Pipeline Stages       | Read file, Parse dataset, Execute, Encode, Handle outliers, Execute



==> Completed Stage: Execute
==> Completed Stage: Train test split
Pipeline Stages |████████████████████████████████████████| 7/7 [100%] in 5.1s (1.38/s)

Pipeline Completed Successfully


Pipeline Class: StandardPipeline

+-----------------------+---------------------------------------------------------------------------------------+
| Pipeline Property     | Value                                                                                 |
+-----------------------+---------------------------------------------------------------------------------------+
| Train Dataframe Path  | ../datasets/classification/census.csv                                                 |
| Test Dataframe Path   | None                                                                                  |
| Config File Path      | None                                                                                  |
| Pipeline Stages       | Read file, Parse dataset, Execute, Encode, Handle outliers, Execute



==> Completed Stage: Execute
==> Completed Stage: Train test split
Pipeline Stages |████████████████████████████████████████| 7/7 [100%] in 5.0s (1.41/s)

Pipeline Completed Successfully


Pipeline Class: StandardPipeline

+-----------------------+---------------------------------------------------------------------------------------+
| Pipeline Property     | Value                                                                                 |
+-----------------------+---------------------------------------------------------------------------------------+
| Train Dataframe Path  | ../datasets/classification/census.csv                                                 |
| Test Dataframe Path   | None                                                                                  |
| Config File Path      | None                                                                                  |
| Pipeline Stages       | Read file, Parse dataset, Execute, Encode, Handle outliers, Execute



==> Completed Stage: Execute
==> Completed Stage: Train test split
Pipeline Stages |████████████████████████████████████████| 7/7 [100%] in 5.2s (1.34/s)

Pipeline Completed Successfully


Pipeline Class: StandardPipeline

+-----------------------+---------------------------------------------------------------------------------------+
| Pipeline Property     | Value                                                                                 |
+-----------------------+---------------------------------------------------------------------------------------+
| Train Dataframe Path  | ../datasets/classification/census.csv                                                 |
| Test Dataframe Path   | None                                                                                  |
| Config File Path      | None                                                                                  |
| Pipeline Stages       | Read file, Parse dataset, Execute, Encode, Handle outliers, Execute



==> Completed Stage: Execute
==> Completed Stage: Train test split
Pipeline Stages |████████████████████████████████████████| 7/7 [100%] in 5.2s (1.35/s)

Pipeline Completed Successfully


Pipeline Class: StandardPipeline

+-----------------------+---------------------------------------------------------------------------------------+
| Pipeline Property     | Value                                                                                 |
+-----------------------+---------------------------------------------------------------------------------------+
| Train Dataframe Path  | ../datasets/classification/census.csv                                                 |
| Test Dataframe Path   | None                                                                                  |
| Config File Path      | None                                                                                  |
| Pipeline Stages       | Read file, Parse dataset, Execute, Encode, Handle outliers, Execute



==> Completed Stage: Execute
==> Completed Stage: Train test split
Pipeline Stages |████████████████████████████████████████| 7/7 [100%] in 5.0s (1.40/s)

Pipeline Completed Successfully


Pipeline Class: StandardPipeline

+-----------------------+---------------------------------------------------------------------------------------+
| Pipeline Property     | Value                                                                                 |
+-----------------------+---------------------------------------------------------------------------------------+
| Train Dataframe Path  | ../datasets/classification/census.csv                                                 |
| Test Dataframe Path   | None                                                                                  |
| Config File Path      | None                                                                                  |
| Pipeline Stages       | Read file, Parse dataset, Execute, Encode, Handle outliers, Execute



==> Completed Stage: Execute
==> Completed Stage: Train test split
Pipeline Stages |████████████████████████████████████████| 7/7 [100%] in 5.0s (1.40/s)

Pipeline Completed Successfully


Pipeline Class: StandardPipeline

+-----------------------+---------------------------------------------------------------------------------------+
| Pipeline Property     | Value                                                                                 |
+-----------------------+---------------------------------------------------------------------------------------+
| Train Dataframe Path  | ../datasets/classification/census.csv                                                 |
| Test Dataframe Path   | None                                                                                  |
| Config File Path      | None                                                                                  |
| Pipeline Stages       | Read file, Parse dataset, Execute, Encode, Handle outliers, Execute



==> Completed Stage: Execute
==> Completed Stage: Train test split
Pipeline Stages |████████████████████████████████████████| 7/7 [100%] in 5.0s (1.40/s)

Pipeline Completed Successfully


Pipeline Class: StandardPipeline

+-----------------------+---------------------------------------------------------------------------------------+
| Pipeline Property     | Value                                                                                 |
+-----------------------+---------------------------------------------------------------------------------------+
| Train Dataframe Path  | ../datasets/classification/census.csv                                                 |
| Test Dataframe Path   | None                                                                                  |
| Config File Path      | None                                                                                  |
| Pipeline Stages       | Read file, Parse dataset, Execute, Encode, Handle outliers, Execute



==> Completed Stage: Execute
==> Completed Stage: Train test split
Pipeline Stages |████████████████████████████████████████| 7/7 [100%] in 5.0s (1.40/s)

Pipeline Completed Successfully


Pipeline Class: StandardPipeline

+-----------------------+---------------------------------------------------------------------------------------+
| Pipeline Property     | Value                                                                                 |
+-----------------------+---------------------------------------------------------------------------------------+
| Train Dataframe Path  | ../datasets/classification/census.csv                                                 |
| Test Dataframe Path   | None                                                                                  |
| Config File Path      | None                                                                                  |
| Pipeline Stages       | Read file, Parse dataset, Execute, Encode, Handle outliers, Execute



==> Completed Stage: Execute
==> Completed Stage: Train test split
Pipeline Stages |████████████████████████████████████████| 7/7 [100%] in 5.0s (1.40/s)

Pipeline Completed Successfully


Pipeline Class: StandardPipeline

+-----------------------+---------------------------------------------------------------------------------------+
| Pipeline Property     | Value                                                                                 |
+-----------------------+---------------------------------------------------------------------------------------+
| Train Dataframe Path  | ../datasets/classification/census.csv                                                 |
| Test Dataframe Path   | None                                                                                  |
| Config File Path      | None                                                                                  |
| Pipeline Stages       | Read file, Parse dataset, Execute, Encode, Handle outliers, Execute



==> Completed Stage: Execute
==> Completed Stage: Train test split
Pipeline Stages |████████████████████████████████████████| 7/7 [100%] in 5.0s (1.41/s)

Pipeline Completed Successfully


Pipeline Class: StandardPipeline

+-----------------------+---------------------------------------------------------------------------------------+
| Pipeline Property     | Value                                                                                 |
+-----------------------+---------------------------------------------------------------------------------------+
| Train Dataframe Path  | ../datasets/classification/census.csv                                                 |
| Test Dataframe Path   | None                                                                                  |
| Config File Path      | None                                                                                  |
| Pipeline Stages       | Read file, Parse dataset, Execute, Encode, Handle outliers, Execute



==> Completed Stage: Execute
==> Completed Stage: Train test split
Pipeline Stages |████████████████████████████████████████| 7/7 [100%] in 4.4s (1.60/s)

Pipeline Completed Successfully


Pipeline Class: StandardPipeline

+-----------------------+---------------------------------------------------------------------------------------+
| Pipeline Property     | Value                                                                                 |
+-----------------------+---------------------------------------------------------------------------------------+
| Train Dataframe Path  | ../datasets/classification/census.csv                                                 |
| Test Dataframe Path   | None                                                                                  |
| Config File Path      | None                                                                                  |
| Pipeline Stages       | Read file, Parse dataset, Execute, Encode, Handle outliers, Execute



==> Completed Stage: Execute
==> Completed Stage: Train test split
Pipeline Stages |████████████████████████████████████████| 7/7 [100%] in 4.4s (1.58/s)

Pipeline Completed Successfully


Pipeline Class: StandardPipeline

+-----------------------+---------------------------------------------------------------------------------------+
| Pipeline Property     | Value                                                                                 |
+-----------------------+---------------------------------------------------------------------------------------+
| Train Dataframe Path  | ../datasets/classification/census.csv                                                 |
| Test Dataframe Path   | None                                                                                  |
| Config File Path      | None                                                                                  |
| Pipeline Stages       | Read file, Parse dataset, Execute, Encode, Handle outliers, Execute



==> Completed Stage: Execute
==> Completed Stage: Train test split
Pipeline Stages |████████████████████████████████████████| 7/7 [100%] in 5.0s (1.40/s)

Pipeline Completed Successfully


Pipeline Class: StandardPipeline

+-----------------------+---------------------------------------------------------------------------------------+
| Pipeline Property     | Value                                                                                 |
+-----------------------+---------------------------------------------------------------------------------------+
| Train Dataframe Path  | ../datasets/classification/census.csv                                                 |
| Test Dataframe Path   | None                                                                                  |
| Config File Path      | None                                                                                  |
| Pipeline Stages       | Read file, Parse dataset, Execute, Encode, Handle outliers, Execute



==> Completed Stage: Execute
==> Completed Stage: Train test split
Pipeline Stages |████████████████████████████████████████| 7/7 [100%] in 5.0s (1.41/s)

Pipeline Completed Successfully


Pipeline Class: StandardPipeline

+-----------------------+---------------------------------------------------------------------------------------+
| Pipeline Property     | Value                                                                                 |
+-----------------------+---------------------------------------------------------------------------------------+
| Train Dataframe Path  | ../datasets/classification/census.csv                                                 |
| Test Dataframe Path   | None                                                                                  |
| Config File Path      | None                                                                                  |
| Pipeline Stages       | Read file, Parse dataset, Execute, Encode, Handle outliers, Execute



==> Completed Stage: Execute
==> Completed Stage: Train test split
Pipeline Stages |████████████████████████████████████████| 7/7 [100%] in 5.0s (1.41/s)

Pipeline Completed Successfully


Pipeline Class: StandardPipeline

+-----------------------+---------------------------------------------------------------------------------------+
| Pipeline Property     | Value                                                                                 |
+-----------------------+---------------------------------------------------------------------------------------+
| Train Dataframe Path  | ../datasets/classification/census.csv                                                 |
| Test Dataframe Path   | None                                                                                  |
| Config File Path      | None                                                                                  |
| Pipeline Stages       | Read file, Parse dataset, Execute, Encode, Handle outliers, Execute



==> Completed Stage: Execute
==> Completed Stage: Train test split
Pipeline Stages |████████████████████████████████████████| 7/7 [100%] in 5.0s (1.41/s)

Pipeline Completed Successfully


Pipeline Class: StandardPipeline

+-----------------------+---------------------------------------------------------------------------------------+
| Pipeline Property     | Value                                                                                 |
+-----------------------+---------------------------------------------------------------------------------------+
| Train Dataframe Path  | ../datasets/classification/census.csv                                                 |
| Test Dataframe Path   | None                                                                                  |
| Config File Path      | None                                                                                  |
| Pipeline Stages       | Read file, Parse dataset, Execute, Encode, Handle outliers, Execute



==> Completed Stage: Execute
==> Completed Stage: Train test split
Pipeline Stages |████████████████████████████████████████| 7/7 [100%] in 4.4s (1.59/s)

Pipeline Completed Successfully


Pipeline Class: StandardPipeline

+-----------------------+---------------------------------------------------------------------------------------+
| Pipeline Property     | Value                                                                                 |
+-----------------------+---------------------------------------------------------------------------------------+
| Train Dataframe Path  | ../datasets/classification/census.csv                                                 |
| Test Dataframe Path   | None                                                                                  |
| Config File Path      | None                                                                                  |
| Pipeline Stages       | Read file, Parse dataset, Execute, Encode, Handle outliers, Execute



==> Completed Stage: Execute
==> Completed Stage: Train test split
Pipeline Stages |████████████████████████████████████████| 7/7 [100%] in 5.0s (1.40/s)

Pipeline Completed Successfully


Pipeline Class: StandardPipeline

+-----------------------+---------------------------------------------------------------------------------------+
| Pipeline Property     | Value                                                                                 |
+-----------------------+---------------------------------------------------------------------------------------+
| Train Dataframe Path  | ../datasets/classification/census.csv                                                 |
| Test Dataframe Path   | None                                                                                  |
| Config File Path      | None                                                                                  |
| Pipeline Stages       | Read file, Parse dataset, Execute, Encode, Handle outliers, Execute



==> Completed Stage: Execute
==> Completed Stage: Train test split
Pipeline Stages |████████████████████████████████████████| 7/7 [100%] in 5.0s (1.40/s)

Pipeline Completed Successfully


Pipeline Class: StandardPipeline

+-----------------------+---------------------------------------------------------------------------------------+
| Pipeline Property     | Value                                                                                 |
+-----------------------+---------------------------------------------------------------------------------------+
| Train Dataframe Path  | ../datasets/classification/census.csv                                                 |
| Test Dataframe Path   | None                                                                                  |
| Config File Path      | None                                                                                  |
| Pipeline Stages       | Read file, Parse dataset, Execute, Encode, Handle outliers, Execute



==> Completed Stage: Execute
==> Completed Stage: Train test split
Pipeline Stages |████████████████████████████████████████| 7/7 [100%] in 5.0s (1.40/s)

Pipeline Completed Successfully


Pipeline Class: StandardPipeline

+-----------------------+---------------------------------------------------------------------------------------+
| Pipeline Property     | Value                                                                                 |
+-----------------------+---------------------------------------------------------------------------------------+
| Train Dataframe Path  | ../datasets/classification/census.csv                                                 |
| Test Dataframe Path   | None                                                                                  |
| Config File Path      | None                                                                                  |
| Pipeline Stages       | Read file, Parse dataset, Execute, Encode, Handle outliers, Execute



==> Completed Stage: Execute
==> Completed Stage: Train test split
Pipeline Stages |████████████████████████████████████████| 7/7 [100%] in 5.0s (1.40/s)

Pipeline Completed Successfully


Pipeline Class: StandardPipeline

+-----------------------+---------------------------------------------------------------------------------------+
| Pipeline Property     | Value                                                                                 |
+-----------------------+---------------------------------------------------------------------------------------+
| Train Dataframe Path  | ../datasets/classification/census.csv                                                 |
| Test Dataframe Path   | None                                                                                  |
| Config File Path      | None                                                                                  |
| Pipeline Stages       | Read file, Parse dataset, Execute, Encode, Handle outliers, Execute



==> Completed Stage: Execute
==> Completed Stage: Train test split
Pipeline Stages |████████████████████████████████████████| 7/7 [100%] in 5.0s (1.40/s)

Pipeline Completed Successfully


Pipeline Class: StandardPipeline

+-----------------------+---------------------------------------------------------------------------------------+
| Pipeline Property     | Value                                                                                 |
+-----------------------+---------------------------------------------------------------------------------------+
| Train Dataframe Path  | ../datasets/classification/census.csv                                                 |
| Test Dataframe Path   | None                                                                                  |
| Config File Path      | None                                                                                  |
| Pipeline Stages       | Read file, Parse dataset, Execute, Encode, Handle outliers, Execute



==> Completed Stage: Execute
==> Completed Stage: Train test split
Pipeline Stages |████████████████████████████████████████| 7/7 [100%] in 4.4s (1.60/s)

Pipeline Completed Successfully


Pipeline Class: StandardPipeline

+-----------------------+---------------------------------------------------------------------------------------+
| Pipeline Property     | Value                                                                                 |
+-----------------------+---------------------------------------------------------------------------------------+
| Train Dataframe Path  | ../datasets/classification/census.csv                                                 |
| Test Dataframe Path   | None                                                                                  |
| Config File Path      | None                                                                                  |
| Pipeline Stages       | Read file, Parse dataset, Execute, Encode, Handle outliers, Execute



==> Completed Stage: Execute
==> Completed Stage: Train test split
Pipeline Stages |████████████████████████████████████████| 7/7 [100%] in 4.4s (1.58/s)

Pipeline Completed Successfully


Pipeline Class: StandardPipeline

+-----------------------+---------------------------------------------------------------------------------------+
| Pipeline Property     | Value                                                                                 |
+-----------------------+---------------------------------------------------------------------------------------+
| Train Dataframe Path  | ../datasets/classification/census.csv                                                 |
| Test Dataframe Path   | None                                                                                  |
| Config File Path      | None                                                                                  |
| Pipeline Stages       | Read file, Parse dataset, Execute, Encode, Handle outliers, Execute



==> Completed Stage: Execute
==> Completed Stage: Train test split
Pipeline Stages |████████████████████████████████████████| 7/7 [100%] in 4.4s (1.59/s)

Pipeline Completed Successfully


Pipeline Class: StandardPipeline

+-----------------------+---------------------------------------------------------------------------------------+
| Pipeline Property     | Value                                                                                 |
+-----------------------+---------------------------------------------------------------------------------------+
| Train Dataframe Path  | ../datasets/classification/census.csv                                                 |
| Test Dataframe Path   | None                                                                                  |
| Config File Path      | None                                                                                  |
| Pipeline Stages       | Read file, Parse dataset, Execute, Encode, Handle outliers, Execute



==> Completed Stage: Execute
==> Completed Stage: Train test split
Pipeline Stages |████████████████████████████████████████| 7/7 [100%] in 5.0s (1.39/s)

Pipeline Completed Successfully


Pipeline Class: StandardPipeline

+-----------------------+---------------------------------------------------------------------------------------+
| Pipeline Property     | Value                                                                                 |
+-----------------------+---------------------------------------------------------------------------------------+
| Train Dataframe Path  | ../datasets/classification/census.csv                                                 |
| Test Dataframe Path   | None                                                                                  |
| Config File Path      | None                                                                                  |
| Pipeline Stages       | Read file, Parse dataset, Execute, Encode, Handle outliers, Execute



==> Completed Stage: Execute
==> Completed Stage: Train test split
Pipeline Stages |████████████████████████████████████████| 7/7 [100%] in 5.0s (1.40/s)

Pipeline Completed Successfully


Pipeline Class: StandardPipeline

+-----------------------+---------------------------------------------------------------------------------------+
| Pipeline Property     | Value                                                                                 |
+-----------------------+---------------------------------------------------------------------------------------+
| Train Dataframe Path  | ../datasets/classification/census.csv                                                 |
| Test Dataframe Path   | None                                                                                  |
| Config File Path      | None                                                                                  |
| Pipeline Stages       | Read file, Parse dataset, Execute, Encode, Handle outliers, Execute



==> Completed Stage: Execute
==> Completed Stage: Train test split
Pipeline Stages |████████████████████████████████████████| 7/7 [100%] in 5.0s (1.40/s)

Pipeline Completed Successfully


Pipeline Class: StandardPipeline

+-----------------------+---------------------------------------------------------------------------------------+
| Pipeline Property     | Value                                                                                 |
+-----------------------+---------------------------------------------------------------------------------------+
| Train Dataframe Path  | ../datasets/classification/census.csv                                                 |
| Test Dataframe Path   | None                                                                                  |
| Config File Path      | None                                                                                  |
| Pipeline Stages       | Read file, Parse dataset, Execute, Encode, Handle outliers, Execute



==> Completed Stage: Execute
==> Completed Stage: Train test split
Pipeline Stages |████████████████████████████████████████| 7/7 [100%] in 4.9s (1.41/s)

Pipeline Completed Successfully


Pipeline Class: StandardPipeline

+-----------------------+---------------------------------------------------------------------------------------+
| Pipeline Property     | Value                                                                                 |
+-----------------------+---------------------------------------------------------------------------------------+
| Train Dataframe Path  | ../datasets/classification/census.csv                                                 |
| Test Dataframe Path   | None                                                                                  |
| Config File Path      | None                                                                                  |
| Pipeline Stages       | Read file, Parse dataset, Execute, Encode, Handle outliers, Execute



==> Completed Stage: Execute
==> Completed Stage: Train test split
Pipeline Stages |████████████████████████████████████████| 7/7 [100%] in 5.0s (1.41/s)

Pipeline Completed Successfully


Pipeline Class: StandardPipeline

+-----------------------+---------------------------------------------------------------------------------------+
| Pipeline Property     | Value                                                                                 |
+-----------------------+---------------------------------------------------------------------------------------+
| Train Dataframe Path  | ../datasets/classification/census.csv                                                 |
| Test Dataframe Path   | None                                                                                  |
| Config File Path      | None                                                                                  |
| Pipeline Stages       | Read file, Parse dataset, Execute, Encode, Handle outliers, Execute



==> Completed Stage: Execute
==> Completed Stage: Train test split
Pipeline Stages |████████████████████████████████████████| 7/7 [100%] in 5.0s (1.41/s)

Pipeline Completed Successfully


Pipeline Class: StandardPipeline

+-----------------------+---------------------------------------------------------------------------------------+
| Pipeline Property     | Value                                                                                 |
+-----------------------+---------------------------------------------------------------------------------------+
| Train Dataframe Path  | ../datasets/classification/census.csv                                                 |
| Test Dataframe Path   | None                                                                                  |
| Config File Path      | None                                                                                  |
| Pipeline Stages       | Read file, Parse dataset, Execute, Encode, Handle outliers, Execute



==> Completed Stage: Execute
==> Completed Stage: Train test split
Pipeline Stages |████████████████████████████████████████| 7/7 [100%] in 5.0s (1.40/s)

Pipeline Completed Successfully


Pipeline Class: StandardPipeline

+-----------------------+---------------------------------------------------------------------------------------+
| Pipeline Property     | Value                                                                                 |
+-----------------------+---------------------------------------------------------------------------------------+
| Train Dataframe Path  | ../datasets/classification/census.csv                                                 |
| Test Dataframe Path   | None                                                                                  |
| Config File Path      | None                                                                                  |
| Pipeline Stages       | Read file, Parse dataset, Execute, Encode, Handle outliers, Execute



==> Completed Stage: Execute
==> Completed Stage: Train test split
Pipeline Stages |████████████████████████████████████████| 7/7 [100%] in 5.0s (1.40/s)

Pipeline Completed Successfully


Pipeline Class: StandardPipeline

+-----------------------+---------------------------------------------------------------------------------------+
| Pipeline Property     | Value                                                                                 |
+-----------------------+---------------------------------------------------------------------------------------+
| Train Dataframe Path  | ../datasets/classification/census.csv                                                 |
| Test Dataframe Path   | None                                                                                  |
| Config File Path      | None                                                                                  |
| Pipeline Stages       | Read file, Parse dataset, Execute, Encode, Handle outliers, Execute



==> Completed Stage: Execute
==> Completed Stage: Train test split
Pipeline Stages |████████████████████████████████████████| 7/7 [100%] in 5.0s (1.40/s)

Pipeline Completed Successfully


Pipeline Class: StandardPipeline

+-----------------------+---------------------------------------------------------------------------------------+
| Pipeline Property     | Value                                                                                 |
+-----------------------+---------------------------------------------------------------------------------------+
| Train Dataframe Path  | ../datasets/classification/census.csv                                                 |
| Test Dataframe Path   | None                                                                                  |
| Config File Path      | None                                                                                  |
| Pipeline Stages       | Read file, Parse dataset, Execute, Encode, Handle outliers, Execute



==> Completed Stage: Execute
==> Completed Stage: Train test split
Pipeline Stages |████████████████████████████████████████| 7/7 [100%] in 5.0s (1.40/s)

Pipeline Completed Successfully


Pipeline Class: StandardPipeline

+-----------------------+---------------------------------------------------------------------------------------+
| Pipeline Property     | Value                                                                                 |
+-----------------------+---------------------------------------------------------------------------------------+
| Train Dataframe Path  | ../datasets/classification/census.csv                                                 |
| Test Dataframe Path   | None                                                                                  |
| Config File Path      | None                                                                                  |
| Pipeline Stages       | Read file, Parse dataset, Execute, Encode, Handle outliers, Execute



==> Completed Stage: Execute
==> Completed Stage: Train test split
Pipeline Stages |████████████████████████████████████████| 7/7 [100%] in 5.0s (1.40/s)

Pipeline Completed Successfully


Pipeline Class: StandardPipeline

+-----------------------+---------------------------------------------------------------------------------------+
| Pipeline Property     | Value                                                                                 |
+-----------------------+---------------------------------------------------------------------------------------+
| Train Dataframe Path  | ../datasets/classification/census.csv                                                 |
| Test Dataframe Path   | None                                                                                  |
| Config File Path      | None                                                                                  |
| Pipeline Stages       | Read file, Parse dataset, Execute, Encode, Handle outliers, Execute



==> Completed Stage: Execute
==> Completed Stage: Train test split
Pipeline Stages |████████████████████████████████████████| 7/7 [100%] in 5.0s (1.41/s)

Pipeline Completed Successfully


Pipeline Class: StandardPipeline

+-----------------------+---------------------------------------------------------------------------------------+
| Pipeline Property     | Value                                                                                 |
+-----------------------+---------------------------------------------------------------------------------------+
| Train Dataframe Path  | ../datasets/classification/census.csv                                                 |
| Test Dataframe Path   | None                                                                                  |
| Config File Path      | None                                                                                  |
| Pipeline Stages       | Read file, Parse dataset, Execute, Encode, Handle outliers, Execute



==> Completed Stage: Execute
==> Completed Stage: Train test split
Pipeline Stages |████████████████████████████████████████| 7/7 [100%] in 5.0s (1.40/s)

Pipeline Completed Successfully


Pipeline Class: StandardPipeline

+-----------------------+---------------------------------------------------------------------------------------+
| Pipeline Property     | Value                                                                                 |
+-----------------------+---------------------------------------------------------------------------------------+
| Train Dataframe Path  | ../datasets/classification/census.csv                                                 |
| Test Dataframe Path   | None                                                                                  |
| Config File Path      | None                                                                                  |
| Pipeline Stages       | Read file, Parse dataset, Execute, Encode, Handle outliers, Execute



==> Completed Stage: Execute
==> Completed Stage: Train test split
Pipeline Stages |████████████████████████████████████████| 7/7 [100%] in 4.7s (1.48/s)

Pipeline Completed Successfully


Pipeline Class: StandardPipeline

+-----------------------+---------------------------------------------------------------------------------------+
| Pipeline Property     | Value                                                                                 |
+-----------------------+---------------------------------------------------------------------------------------+
| Train Dataframe Path  | ../datasets/classification/census.csv                                                 |
| Test Dataframe Path   | None                                                                                  |
| Config File Path      | None                                                                                  |
| Pipeline Stages       | Read file, Parse dataset, Execute, Encode, Handle outliers, Execute



==> Completed Stage: Execute
==> Completed Stage: Train test split
Pipeline Stages |████████████████████████████████████████| 7/7 [100%] in 5.0s (1.39/s)

Pipeline Completed Successfully


Pipeline Class: StandardPipeline

+-----------------------+---------------------------------------------------------------------------------------+
| Pipeline Property     | Value                                                                                 |
+-----------------------+---------------------------------------------------------------------------------------+
| Train Dataframe Path  | ../datasets/classification/census.csv                                                 |
| Test Dataframe Path   | None                                                                                  |
| Config File Path      | None                                                                                  |
| Pipeline Stages       | Read file, Parse dataset, Execute, Encode, Handle outliers, Execute



==> Completed Stage: Execute
==> Completed Stage: Train test split
Pipeline Stages |████████████████████████████████████████| 7/7 [100%] in 5.0s (1.40/s)

Pipeline Completed Successfully


Pipeline Class: StandardPipeline

+-----------------------+---------------------------------------------------------------------------------------+
| Pipeline Property     | Value                                                                                 |
+-----------------------+---------------------------------------------------------------------------------------+
| Train Dataframe Path  | ../datasets/classification/census.csv                                                 |
| Test Dataframe Path   | None                                                                                  |
| Config File Path      | None                                                                                  |
| Pipeline Stages       | Read file, Parse dataset, Execute, Encode, Handle outliers, Execute



==> Completed Stage: Execute
==> Completed Stage: Train test split
Pipeline Stages |████████████████████████████████████████| 7/7 [100%] in 4.8s (1.46/s)

Pipeline Completed Successfully


Pipeline Class: StandardPipeline

+-----------------------+---------------------------------------------------------------------------------------+
| Pipeline Property     | Value                                                                                 |
+-----------------------+---------------------------------------------------------------------------------------+
| Train Dataframe Path  | ../datasets/classification/census.csv                                                 |
| Test Dataframe Path   | None                                                                                  |
| Config File Path      | None                                                                                  |
| Pipeline Stages       | Read file, Parse dataset, Execute, Encode, Handle outliers, Execute



==> Completed Stage: Execute
==> Completed Stage: Train test split
Pipeline Stages |████████████████████████████████████████| 7/7 [100%] in 5.0s (1.40/s)

Pipeline Completed Successfully


Pipeline Class: StandardPipeline

+-----------------------+---------------------------------------------------------------------------------------+
| Pipeline Property     | Value                                                                                 |
+-----------------------+---------------------------------------------------------------------------------------+
| Train Dataframe Path  | ../datasets/classification/census.csv                                                 |
| Test Dataframe Path   | None                                                                                  |
| Config File Path      | None                                                                                  |
| Pipeline Stages       | Read file, Parse dataset, Execute, Encode, Handle outliers, Execute



==> Completed Stage: Execute
==> Completed Stage: Train test split
Pipeline Stages |████████████████████████████████████████| 7/7 [100%] in 4.8s (1.47/s)

Pipeline Completed Successfully


Pipeline Class: StandardPipeline

+-----------------------+---------------------------------------------------------------------------------------+
| Pipeline Property     | Value                                                                                 |
+-----------------------+---------------------------------------------------------------------------------------+
| Train Dataframe Path  | ../datasets/classification/census.csv                                                 |
| Test Dataframe Path   | None                                                                                  |
| Config File Path      | None                                                                                  |
| Pipeline Stages       | Read file, Parse dataset, Execute, Encode, Handle outliers, Execute



==> Completed Stage: Execute
==> Completed Stage: Train test split
Pipeline Stages |████████████████████████████████████████| 7/7 [100%] in 4.7s (1.47/s)

Pipeline Completed Successfully


Pipeline Class: StandardPipeline

+-----------------------+---------------------------------------------------------------------------------------+
| Pipeline Property     | Value                                                                                 |
+-----------------------+---------------------------------------------------------------------------------------+
| Train Dataframe Path  | ../datasets/classification/census.csv                                                 |
| Test Dataframe Path   | None                                                                                  |
| Config File Path      | None                                                                                  |
| Pipeline Stages       | Read file, Parse dataset, Execute, Encode, Handle outliers, Execute



==> Completed Stage: Execute
==> Completed Stage: Train test split
Pipeline Stages |████████████████████████████████████████| 7/7 [100%] in 4.8s (1.46/s)

Pipeline Completed Successfully


Pipeline Class: StandardPipeline

+-----------------------+---------------------------------------------------------------------------------------+
| Pipeline Property     | Value                                                                                 |
+-----------------------+---------------------------------------------------------------------------------------+
| Train Dataframe Path  | ../datasets/classification/census.csv                                                 |
| Test Dataframe Path   | None                                                                                  |
| Config File Path      | None                                                                                  |
| Pipeline Stages       | Read file, Parse dataset, Execute, Encode, Handle outliers, Execute



==> Completed Stage: Execute
==> Completed Stage: Train test split
Pipeline Stages |████████████████████████████████████████| 7/7 [100%] in 5.0s (1.40/s)

Pipeline Completed Successfully


Pipeline Class: StandardPipeline

+-----------------------+---------------------------------------------------------------------------------------+
| Pipeline Property     | Value                                                                                 |
+-----------------------+---------------------------------------------------------------------------------------+
| Train Dataframe Path  | ../datasets/classification/census.csv                                                 |
| Test Dataframe Path   | None                                                                                  |
| Config File Path      | None                                                                                  |
| Pipeline Stages       | Read file, Parse dataset, Execute, Encode, Handle outliers, Execute



==> Completed Stage: Execute
==> Completed Stage: Train test split
Pipeline Stages |████████████████████████████████████████| 7/7 [100%] in 4.7s (1.49/s)

Pipeline Completed Successfully


Pipeline Class: StandardPipeline

+-----------------------+---------------------------------------------------------------------------------------+
| Pipeline Property     | Value                                                                                 |
+-----------------------+---------------------------------------------------------------------------------------+
| Train Dataframe Path  | ../datasets/classification/census.csv                                                 |
| Test Dataframe Path   | None                                                                                  |
| Config File Path      | None                                                                                  |
| Pipeline Stages       | Read file, Parse dataset, Execute, Encode, Handle outliers, Execute



==> Completed Stage: Execute
==> Completed Stage: Train test split
Pipeline Stages |████████████████████████████████████████| 7/7 [100%] in 4.7s (1.49/s)

Pipeline Completed Successfully


Pipeline Class: StandardPipeline

+-----------------------+---------------------------------------------------------------------------------------+
| Pipeline Property     | Value                                                                                 |
+-----------------------+---------------------------------------------------------------------------------------+
| Train Dataframe Path  | ../datasets/classification/census.csv                                                 |
| Test Dataframe Path   | None                                                                                  |
| Config File Path      | None                                                                                  |
| Pipeline Stages       | Read file, Parse dataset, Execute, Encode, Handle outliers, Execute



==> Completed Stage: Execute
==> Completed Stage: Train test split
Pipeline Stages |████████████████████████████████████████| 7/7 [100%] in 5.0s (1.41/s)

Pipeline Completed Successfully


Pipeline Class: StandardPipeline

+-----------------------+---------------------------------------------------------------------------------------+
| Pipeline Property     | Value                                                                                 |
+-----------------------+---------------------------------------------------------------------------------------+
| Train Dataframe Path  | ../datasets/classification/census.csv                                                 |
| Test Dataframe Path   | None                                                                                  |
| Config File Path      | None                                                                                  |
| Pipeline Stages       | Read file, Parse dataset, Execute, Encode, Handle outliers, Execute



==> Completed Stage: Execute
==> Completed Stage: Train test split
Pipeline Stages |████████████████████████████████████████| 7/7 [100%] in 4.7s (1.49/s)

Pipeline Completed Successfully


Pipeline Class: StandardPipeline

+-----------------------+---------------------------------------------------------------------------------------+
| Pipeline Property     | Value                                                                                 |
+-----------------------+---------------------------------------------------------------------------------------+
| Train Dataframe Path  | ../datasets/classification/census.csv                                                 |
| Test Dataframe Path   | None                                                                                  |
| Config File Path      | None                                                                                  |
| Pipeline Stages       | Read file, Parse dataset, Execute, Encode, Handle outliers, Execute



==> Completed Stage: Execute
==> Completed Stage: Train test split
Pipeline Stages |████████████████████████████████████████| 7/7 [100%] in 4.7s (1.49/s)

Pipeline Completed Successfully


Pipeline Class: StandardPipeline

+-----------------------+---------------------------------------------------------------------------------------+
| Pipeline Property     | Value                                                                                 |
+-----------------------+---------------------------------------------------------------------------------------+
| Train Dataframe Path  | ../datasets/classification/census.csv                                                 |
| Test Dataframe Path   | None                                                                                  |
| Config File Path      | None                                                                                  |
| Pipeline Stages       | Read file, Parse dataset, Execute, Encode, Handle outliers, Execute



==> Completed Stage: Execute
==> Completed Stage: Train test split
Pipeline Stages |████████████████████████████████████████| 7/7 [100%] in 4.7s (1.49/s)

Pipeline Completed Successfully


Pipeline Class: StandardPipeline

+-----------------------+---------------------------------------------------------------------------------------+
| Pipeline Property     | Value                                                                                 |
+-----------------------+---------------------------------------------------------------------------------------+
| Train Dataframe Path  | ../datasets/classification/census.csv                                                 |
| Test Dataframe Path   | None                                                                                  |
| Config File Path      | None                                                                                  |
| Pipeline Stages       | Read file, Parse dataset, Execute, Encode, Handle outliers, Execute



==> Completed Stage: Execute
==> Completed Stage: Train test split
Pipeline Stages |████████████████████████████████████████| 7/7 [100%] in 4.7s (1.49/s)

Pipeline Completed Successfully


Pipeline Class: StandardPipeline

+-----------------------+---------------------------------------------------------------------------------------+
| Pipeline Property     | Value                                                                                 |
+-----------------------+---------------------------------------------------------------------------------------+
| Train Dataframe Path  | ../datasets/classification/census.csv                                                 |
| Test Dataframe Path   | None                                                                                  |
| Config File Path      | None                                                                                  |
| Pipeline Stages       | Read file, Parse dataset, Execute, Encode, Handle outliers, Execute



==> Completed Stage: Execute
==> Completed Stage: Train test split
Pipeline Stages |████████████████████████████████████████| 7/7 [100%] in 4.7s (1.48/s)

Pipeline Completed Successfully


Pipeline Class: StandardPipeline

+-----------------------+---------------------------------------------------------------------------------------+
| Pipeline Property     | Value                                                                                 |
+-----------------------+---------------------------------------------------------------------------------------+
| Train Dataframe Path  | ../datasets/classification/census.csv                                                 |
| Test Dataframe Path   | None                                                                                  |
| Config File Path      | None                                                                                  |
| Pipeline Stages       | Read file, Parse dataset, Execute, Encode, Handle outliers, Execute



==> Completed Stage: Execute
==> Completed Stage: Train test split
Pipeline Stages |████████████████████████████████████████| 7/7 [100%] in 4.4s (1.61/s)

Pipeline Completed Successfully


Pipeline Class: StandardPipeline

+-----------------------+---------------------------------------------------------------------------------------+
| Pipeline Property     | Value                                                                                 |
+-----------------------+---------------------------------------------------------------------------------------+
| Train Dataframe Path  | ../datasets/classification/census.csv                                                 |
| Test Dataframe Path   | None                                                                                  |
| Config File Path      | None                                                                                  |
| Pipeline Stages       | Read file, Parse dataset, Execute, Encode, Handle outliers, Execute



==> Completed Stage: Execute
==> Completed Stage: Train test split
Pipeline Stages |████████████████████████████████████████| 7/7 [100%] in 4.4s (1.61/s)

Pipeline Completed Successfully


Pipeline Class: StandardPipeline

+-----------------------+---------------------------------------------------------------------------------------+
| Pipeline Property     | Value                                                                                 |
+-----------------------+---------------------------------------------------------------------------------------+
| Train Dataframe Path  | ../datasets/classification/census.csv                                                 |
| Test Dataframe Path   | None                                                                                  |
| Config File Path      | None                                                                                  |
| Pipeline Stages       | Read file, Parse dataset, Execute, Encode, Handle outliers, Execute



==> Completed Stage: Execute
==> Completed Stage: Train test split
Pipeline Stages |████████████████████████████████████████| 7/7 [100%] in 4.9s (1.42/s)

Pipeline Completed Successfully


Pipeline Class: StandardPipeline

+-----------------------+---------------------------------------------------------------------------------------+
| Pipeline Property     | Value                                                                                 |
+-----------------------+---------------------------------------------------------------------------------------+
| Train Dataframe Path  | ../datasets/classification/census.csv                                                 |
| Test Dataframe Path   | None                                                                                  |
| Config File Path      | None                                                                                  |
| Pipeline Stages       | Read file, Parse dataset, Execute, Encode, Handle outliers, Execute



==> Completed Stage: Execute
==> Completed Stage: Train test split
Pipeline Stages |████████████████████████████████████████| 7/7 [100%] in 5.0s (1.41/s)

Pipeline Completed Successfully


Pipeline Class: StandardPipeline

+-----------------------+---------------------------------------------------------------------------------------+
| Pipeline Property     | Value                                                                                 |
+-----------------------+---------------------------------------------------------------------------------------+
| Train Dataframe Path  | ../datasets/classification/census.csv                                                 |
| Test Dataframe Path   | None                                                                                  |
| Config File Path      | None                                                                                  |
| Pipeline Stages       | Read file, Parse dataset, Execute, Encode, Handle outliers, Execute



==> Completed Stage: Execute
==> Completed Stage: Train test split
Pipeline Stages |████████████████████████████████████████| 7/7 [100%] in 4.7s (1.49/s)

Pipeline Completed Successfully


Pipeline Class: StandardPipeline

+-----------------------+---------------------------------------------------------------------------------------+
| Pipeline Property     | Value                                                                                 |
+-----------------------+---------------------------------------------------------------------------------------+
| Train Dataframe Path  | ../datasets/classification/census.csv                                                 |
| Test Dataframe Path   | None                                                                                  |
| Config File Path      | None                                                                                  |
| Pipeline Stages       | Read file, Parse dataset, Execute, Encode, Handle outliers, Execute



==> Completed Stage: Execute
==> Completed Stage: Train test split
Pipeline Stages |████████████████████████████████████████| 7/7 [100%] in 4.7s (1.49/s)

Pipeline Completed Successfully


Pipeline Class: StandardPipeline

+-----------------------+---------------------------------------------------------------------------------------+
| Pipeline Property     | Value                                                                                 |
+-----------------------+---------------------------------------------------------------------------------------+
| Train Dataframe Path  | ../datasets/classification/census.csv                                                 |
| Test Dataframe Path   | None                                                                                  |
| Config File Path      | None                                                                                  |
| Pipeline Stages       | Read file, Parse dataset, Execute, Encode, Handle outliers, Execute



==> Completed Stage: Execute
==> Completed Stage: Train test split
Pipeline Stages |████████████████████████████████████████| 7/7 [100%] in 5.1s (1.37/s)

Pipeline Completed Successfully


Pipeline Class: StandardPipeline

+-----------------------+---------------------------------------------------------------------------------------+
| Pipeline Property     | Value                                                                                 |
+-----------------------+---------------------------------------------------------------------------------------+
| Train Dataframe Path  | ../datasets/classification/census.csv                                                 |
| Test Dataframe Path   | None                                                                                  |
| Config File Path      | None                                                                                  |
| Pipeline Stages       | Read file, Parse dataset, Execute, Encode, Handle outliers, Execute



==> Completed Stage: Execute
==> Completed Stage: Train test split
Pipeline Stages |████████████████████████████████████████| 7/7 [100%] in 4.8s (1.45/s)

Pipeline Completed Successfully


Pipeline Class: StandardPipeline

+-----------------------+---------------------------------------------------------------------------------------+
| Pipeline Property     | Value                                                                                 |
+-----------------------+---------------------------------------------------------------------------------------+
| Train Dataframe Path  | ../datasets/classification/census.csv                                                 |
| Test Dataframe Path   | None                                                                                  |
| Config File Path      | None                                                                                  |
| Pipeline Stages       | Read file, Parse dataset, Execute, Encode, Handle outliers, Execute



==> Completed Stage: Execute
==> Completed Stage: Train test split
Pipeline Stages |████████████████████████████████████████| 7/7 [100%] in 4.8s (1.45/s)

Pipeline Completed Successfully


Pipeline Class: StandardPipeline

+-----------------------+---------------------------------------------------------------------------------------+
| Pipeline Property     | Value                                                                                 |
+-----------------------+---------------------------------------------------------------------------------------+
| Train Dataframe Path  | ../datasets/classification/census.csv                                                 |
| Test Dataframe Path   | None                                                                                  |
| Config File Path      | None                                                                                  |
| Pipeline Stages       | Read file, Parse dataset, Execute, Encode, Handle outliers, Execute



==> Completed Stage: Execute
==> Completed Stage: Train test split
Pipeline Stages |████████████████████████████████████████| 7/7 [100%] in 5.3s (1.33/s)

Pipeline Completed Successfully


Pipeline Class: StandardPipeline

+-----------------------+---------------------------------------------------------------------------------------+
| Pipeline Property     | Value                                                                                 |
+-----------------------+---------------------------------------------------------------------------------------+
| Train Dataframe Path  | ../datasets/classification/census.csv                                                 |
| Test Dataframe Path   | None                                                                                  |
| Config File Path      | None                                                                                  |
| Pipeline Stages       | Read file, Parse dataset, Execute, Encode, Handle outliers, Execute



==> Completed Stage: Execute
==> Completed Stage: Train test split
Pipeline Stages |████████████████████████████████████████| 7/7 [100%] in 5.0s (1.41/s)

Pipeline Completed Successfully


Pipeline Class: StandardPipeline

+-----------------------+---------------------------------------------------------------------------------------+
| Pipeline Property     | Value                                                                                 |
+-----------------------+---------------------------------------------------------------------------------------+
| Train Dataframe Path  | ../datasets/classification/census.csv                                                 |
| Test Dataframe Path   | None                                                                                  |
| Config File Path      | None                                                                                  |
| Pipeline Stages       | Read file, Parse dataset, Execute, Encode, Handle outliers, Execute



==> Completed Stage: Execute
==> Completed Stage: Train test split
Pipeline Stages |████████████████████████████████████████| 7/7 [100%] in 6.5s (1.08/s)

Pipeline Completed Successfully


Pipeline Class: StandardPipeline

+-----------------------+---------------------------------------------------------------------------------------+
| Pipeline Property     | Value                                                                                 |
+-----------------------+---------------------------------------------------------------------------------------+
| Train Dataframe Path  | ../datasets/classification/census.csv                                                 |
| Test Dataframe Path   | None                                                                                  |
| Config File Path      | None                                                                                  |
| Pipeline Stages       | Read file, Parse dataset, Execute, Encode, Handle outliers, Execute



==> Completed Stage: Execute
==> Completed Stage: Train test split
Pipeline Stages |████████████████████████████████████████| 7/7 [100%] in 5.3s (1.31/s)

Pipeline Completed Successfully


Pipeline Class: StandardPipeline

+-----------------------+---------------------------------------------------------------------------------------+
| Pipeline Property     | Value                                                                                 |
+-----------------------+---------------------------------------------------------------------------------------+
| Train Dataframe Path  | ../datasets/classification/census.csv                                                 |
| Test Dataframe Path   | None                                                                                  |
| Config File Path      | None                                                                                  |
| Pipeline Stages       | Read file, Parse dataset, Execute, Encode, Handle outliers, Execute



==> Completed Stage: Execute
==> Completed Stage: Train test split
Pipeline Stages |████████████████████████████████████████| 7/7 [100%] in 5.1s (1.38/s)

Pipeline Completed Successfully


Pipeline Class: StandardPipeline

+-----------------------+---------------------------------------------------------------------------------------+
| Pipeline Property     | Value                                                                                 |
+-----------------------+---------------------------------------------------------------------------------------+
| Train Dataframe Path  | ../datasets/classification/census.csv                                                 |
| Test Dataframe Path   | None                                                                                  |
| Config File Path      | None                                                                                  |
| Pipeline Stages       | Read file, Parse dataset, Execute, Encode, Handle outliers, Execute



==> Completed Stage: Execute
==> Completed Stage: Train test split
Pipeline Stages |████████████████████████████████████████| 7/7 [100%] in 5.3s (1.32/s)

Pipeline Completed Successfully


Pipeline Class: StandardPipeline

+-----------------------+---------------------------------------------------------------------------------------+
| Pipeline Property     | Value                                                                                 |
+-----------------------+---------------------------------------------------------------------------------------+
| Train Dataframe Path  | ../datasets/classification/census.csv                                                 |
| Test Dataframe Path   | None                                                                                  |
| Config File Path      | None                                                                                  |
| Pipeline Stages       | Read file, Parse dataset, Execute, Encode, Handle outliers, Execute



==> Completed Stage: Execute
==> Completed Stage: Train test split
Pipeline Stages |████████████████████████████████████████| 7/7 [100%] in 5.7s (1.22/s)

Pipeline Completed Successfully


Pipeline Class: StandardPipeline

+-----------------------+---------------------------------------------------------------------------------------+
| Pipeline Property     | Value                                                                                 |
+-----------------------+---------------------------------------------------------------------------------------+
| Train Dataframe Path  | ../datasets/classification/census.csv                                                 |
| Test Dataframe Path   | None                                                                                  |
| Config File Path      | None                                                                                  |
| Pipeline Stages       | Read file, Parse dataset, Execute, Encode, Handle outliers, Execute



==> Completed Stage: Execute
==> Completed Stage: Train test split
Pipeline Stages |████████████████████████████████████████| 7/7 [100%] in 6.1s (1.16/s)

Pipeline Completed Successfully


Pipeline Class: StandardPipeline

+-----------------------+---------------------------------------------------------------------------------------+
| Pipeline Property     | Value                                                                                 |
+-----------------------+---------------------------------------------------------------------------------------+
| Train Dataframe Path  | ../datasets/classification/census.csv                                                 |
| Test Dataframe Path   | None                                                                                  |
| Config File Path      | None                                                                                  |
| Pipeline Stages       | Read file, Parse dataset, Execute, Encode, Handle outliers, Execute



==> Completed Stage: Execute
==> Completed Stage: Train test split
Pipeline Stages |████████████████████████████████████████| 7/7 [100%] in 5.1s (1.37/s)

Pipeline Completed Successfully


Pipeline Class: StandardPipeline

+-----------------------+---------------------------------------------------------------------------------------+
| Pipeline Property     | Value                                                                                 |
+-----------------------+---------------------------------------------------------------------------------------+
| Train Dataframe Path  | ../datasets/classification/census.csv                                                 |
| Test Dataframe Path   | None                                                                                  |
| Config File Path      | None                                                                                  |
| Pipeline Stages       | Read file, Parse dataset, Execute, Encode, Handle outliers, Execute



==> Completed Stage: Execute
==> Completed Stage: Train test split
Pipeline Stages |████████████████████████████████████████| 7/7 [100%] in 5.1s (1.38/s)

Pipeline Completed Successfully


Pipeline Class: StandardPipeline

+-----------------------+---------------------------------------------------------------------------------------+
| Pipeline Property     | Value                                                                                 |
+-----------------------+---------------------------------------------------------------------------------------+
| Train Dataframe Path  | ../datasets/classification/census.csv                                                 |
| Test Dataframe Path   | None                                                                                  |
| Config File Path      | None                                                                                  |
| Pipeline Stages       | Read file, Parse dataset, Execute, Encode, Handle outliers, Execute



==> Completed Stage: Execute
==> Completed Stage: Train test split
Pipeline Stages |████████████████████████████████████████| 7/7 [100%] in 4.9s (1.42/s)

Pipeline Completed Successfully


Pipeline Class: StandardPipeline

+-----------------------+---------------------------------------------------------------------------------------+
| Pipeline Property     | Value                                                                                 |
+-----------------------+---------------------------------------------------------------------------------------+
| Train Dataframe Path  | ../datasets/classification/census.csv                                                 |
| Test Dataframe Path   | None                                                                                  |
| Config File Path      | None                                                                                  |
| Pipeline Stages       | Read file, Parse dataset, Execute, Encode, Handle outliers, Execute



==> Completed Stage: Execute
==> Completed Stage: Train test split
Pipeline Stages |████████████████████████████████████████| 7/7 [100%] in 4.9s (1.44/s)

Pipeline Completed Successfully


Pipeline Class: StandardPipeline

+-----------------------+---------------------------------------------------------------------------------------+
| Pipeline Property     | Value                                                                                 |
+-----------------------+---------------------------------------------------------------------------------------+
| Train Dataframe Path  | ../datasets/classification/census.csv                                                 |
| Test Dataframe Path   | None                                                                                  |
| Config File Path      | None                                                                                  |
| Pipeline Stages       | Read file, Parse dataset, Execute, Encode, Handle outliers, Execute



==> Completed Stage: Execute
==> Completed Stage: Train test split
Pipeline Stages |████████████████████████████████████████| 7/7 [100%] in 4.8s (1.45/s)

Pipeline Completed Successfully


Pipeline Class: StandardPipeline

+-----------------------+---------------------------------------------------------------------------------------+
| Pipeline Property     | Value                                                                                 |
+-----------------------+---------------------------------------------------------------------------------------+
| Train Dataframe Path  | ../datasets/classification/census.csv                                                 |
| Test Dataframe Path   | None                                                                                  |
| Config File Path      | None                                                                                  |
| Pipeline Stages       | Read file, Parse dataset, Execute, Encode, Handle outliers, Execute



==> Completed Stage: Execute
==> Completed Stage: Train test split
Pipeline Stages |████████████████████████████████████████| 7/7 [100%] in 4.9s (1.44/s)

Pipeline Completed Successfully


Pipeline Class: StandardPipeline

+-----------------------+---------------------------------------------------------------------------------------+
| Pipeline Property     | Value                                                                                 |
+-----------------------+---------------------------------------------------------------------------------------+
| Train Dataframe Path  | ../datasets/classification/census.csv                                                 |
| Test Dataframe Path   | None                                                                                  |
| Config File Path      | None                                                                                  |
| Pipeline Stages       | Read file, Parse dataset, Execute, Encode, Handle outliers, Execute



==> Completed Stage: Execute
==> Completed Stage: Train test split
Pipeline Stages |████████████████████████████████████████| 7/7 [100%] in 5.0s (1.41/s)

Pipeline Completed Successfully


Pipeline Class: StandardPipeline

+-----------------------+---------------------------------------------------------------------------------------+
| Pipeline Property     | Value                                                                                 |
+-----------------------+---------------------------------------------------------------------------------------+
| Train Dataframe Path  | ../datasets/classification/census.csv                                                 |
| Test Dataframe Path   | None                                                                                  |
| Config File Path      | None                                                                                  |
| Pipeline Stages       | Read file, Parse dataset, Execute, Encode, Handle outliers, Execute



==> Completed Stage: Execute
==> Completed Stage: Train test split
Pipeline Stages |████████████████████████████████████████| 7/7 [100%] in 5.1s (1.36/s)

Pipeline Completed Successfully


Pipeline Class: StandardPipeline

+-----------------------+---------------------------------------------------------------------------------------+
| Pipeline Property     | Value                                                                                 |
+-----------------------+---------------------------------------------------------------------------------------+
| Train Dataframe Path  | ../datasets/classification/census.csv                                                 |
| Test Dataframe Path   | None                                                                                  |
| Config File Path      | None                                                                                  |
| Pipeline Stages       | Read file, Parse dataset, Execute, Encode, Handle outliers, Execute



==> Completed Stage: Execute
==> Completed Stage: Train test split
Pipeline Stages |████████████████████████████████████████| 7/7 [100%] in 5.0s (1.41/s)

Pipeline Completed Successfully


Pipeline Class: StandardPipeline

+-----------------------+---------------------------------------------------------------------------------------+
| Pipeline Property     | Value                                                                                 |
+-----------------------+---------------------------------------------------------------------------------------+
| Train Dataframe Path  | ../datasets/classification/census.csv                                                 |
| Test Dataframe Path   | None                                                                                  |
| Config File Path      | None                                                                                  |
| Pipeline Stages       | Read file, Parse dataset, Execute, Encode, Handle outliers, Execute



==> Completed Stage: Execute
==> Completed Stage: Train test split
Pipeline Stages |████████████████████████████████████████| 7/7 [100%] in 5.2s (1.35/s)

Pipeline Completed Successfully


Pipeline Class: StandardPipeline

+-----------------------+---------------------------------------------------------------------------------------+
| Pipeline Property     | Value                                                                                 |
+-----------------------+---------------------------------------------------------------------------------------+
| Train Dataframe Path  | ../datasets/classification/census.csv                                                 |
| Test Dataframe Path   | None                                                                                  |
| Config File Path      | None                                                                                  |
| Pipeline Stages       | Read file, Parse dataset, Execute, Encode, Handle outliers, Execute



==> Completed Stage: Execute
==> Completed Stage: Train test split
Pipeline Stages |████████████████████████████████████████| 7/7 [100%] in 5.0s (1.41/s)

Pipeline Completed Successfully


Pipeline Class: StandardPipeline

+-----------------------+---------------------------------------------------------------------------------------+
| Pipeline Property     | Value                                                                                 |
+-----------------------+---------------------------------------------------------------------------------------+
| Train Dataframe Path  | ../datasets/classification/census.csv                                                 |
| Test Dataframe Path   | None                                                                                  |
| Config File Path      | None                                                                                  |
| Pipeline Stages       | Read file, Parse dataset, Execute, Encode, Handle outliers, Execute



==> Completed Stage: Execute
==> Completed Stage: Train test split
Pipeline Stages |████████████████████████████████████████| 7/7 [100%] in 5.5s (1.27/s)

Pipeline Completed Successfully


Pipeline Class: StandardPipeline

+-----------------------+---------------------------------------------------------------------------------------+
| Pipeline Property     | Value                                                                                 |
+-----------------------+---------------------------------------------------------------------------------------+
| Train Dataframe Path  | ../datasets/classification/census.csv                                                 |
| Test Dataframe Path   | None                                                                                  |
| Config File Path      | None                                                                                  |
| Pipeline Stages       | Read file, Parse dataset, Execute, Encode, Handle outliers, Execute



==> Completed Stage: Execute
==> Completed Stage: Train test split
Pipeline Stages |████████████████████████████████████████| 7/7 [100%] in 6.1s (1.15/s)

Pipeline Completed Successfully


Pipeline Class: StandardPipeline

+-----------------------+---------------------------------------------------------------------------------------+
| Pipeline Property     | Value                                                                                 |
+-----------------------+---------------------------------------------------------------------------------------+
| Train Dataframe Path  | ../datasets/classification/census.csv                                                 |
| Test Dataframe Path   | None                                                                                  |
| Config File Path      | None                                                                                  |
| Pipeline Stages       | Read file, Parse dataset, Execute, Encode, Handle outliers, Execute



==> Completed Stage: Execute
==> Completed Stage: Train test split
Pipeline Stages |████████████████████████████████████████| 7/7 [100%] in 5.9s (1.19/s)

Pipeline Completed Successfully


Pipeline Class: StandardPipeline

+-----------------------+---------------------------------------------------------------------------------------+
| Pipeline Property     | Value                                                                                 |
+-----------------------+---------------------------------------------------------------------------------------+
| Train Dataframe Path  | ../datasets/classification/census.csv                                                 |
| Test Dataframe Path   | None                                                                                  |
| Config File Path      | None                                                                                  |
| Pipeline Stages       | Read file, Parse dataset, Execute, Encode, Handle outliers, Execute



==> Completed Stage: Execute
==> Completed Stage: Train test split
Pipeline Stages |████████████████████████████████████████| 7/7 [100%] in 5.4s (1.30/s)

Pipeline Completed Successfully


Pipeline Class: StandardPipeline

+-----------------------+---------------------------------------------------------------------------------------+
| Pipeline Property     | Value                                                                                 |
+-----------------------+---------------------------------------------------------------------------------------+
| Train Dataframe Path  | ../datasets/classification/census.csv                                                 |
| Test Dataframe Path   | None                                                                                  |
| Config File Path      | None                                                                                  |
| Pipeline Stages       | Read file, Parse dataset, Execute, Encode, Handle outliers, Execute



==> Completed Stage: Execute
==> Completed Stage: Train test split
Pipeline Stages |████████████████████████████████████████| 7/7 [100%] in 6.3s (1.12/s)

Pipeline Completed Successfully


Pipeline Class: StandardPipeline

+-----------------------+---------------------------------------------------------------------------------------+
| Pipeline Property     | Value                                                                                 |
+-----------------------+---------------------------------------------------------------------------------------+
| Train Dataframe Path  | ../datasets/classification/census.csv                                                 |
| Test Dataframe Path   | None                                                                                  |
| Config File Path      | None                                                                                  |
| Pipeline Stages       | Read file, Parse dataset, Execute, Encode, Handle outliers, Execute



==> Completed Stage: Execute
==> Completed Stage: Train test split
Pipeline Stages |████████████████████████████████████████| 7/7 [100%] in 5.0s (1.41/s)

Pipeline Completed Successfully


Pipeline Class: StandardPipeline

+-----------------------+---------------------------------------------------------------------------------------+
| Pipeline Property     | Value                                                                                 |
+-----------------------+---------------------------------------------------------------------------------------+
| Train Dataframe Path  | ../datasets/classification/census.csv                                                 |
| Test Dataframe Path   | None                                                                                  |
| Config File Path      | None                                                                                  |
| Pipeline Stages       | Read file, Parse dataset, Execute, Encode, Handle outliers, Execute



==> Completed Stage: Execute
==> Completed Stage: Train test split
Pipeline Stages |████████████████████████████████████████| 7/7 [100%] in 5.8s (1.20/s)

Pipeline Completed Successfully


Pipeline Class: StandardPipeline

+-----------------------+---------------------------------------------------------------------------------------+
| Pipeline Property     | Value                                                                                 |
+-----------------------+---------------------------------------------------------------------------------------+
| Train Dataframe Path  | ../datasets/classification/census.csv                                                 |
| Test Dataframe Path   | None                                                                                  |
| Config File Path      | None                                                                                  |
| Pipeline Stages       | Read file, Parse dataset, Execute, Encode, Handle outliers, Execute



==> Completed Stage: Execute
==> Completed Stage: Train test split
Pipeline Stages |████████████████████████████████████████| 7/7 [100%] in 5.8s (1.21/s)

Pipeline Completed Successfully


Pipeline Class: StandardPipeline

+-----------------------+---------------------------------------------------------------------------------------+
| Pipeline Property     | Value                                                                                 |
+-----------------------+---------------------------------------------------------------------------------------+
| Train Dataframe Path  | ../datasets/classification/census.csv                                                 |
| Test Dataframe Path   | None                                                                                  |
| Config File Path      | None                                                                                  |
| Pipeline Stages       | Read file, Parse dataset, Execute, Encode, Handle outliers, Execute



==> Completed Stage: Execute
==> Completed Stage: Train test split
Pipeline Stages |████████████████████████████████████████| 7/7 [100%] in 5.7s (1.24/s)

Pipeline Completed Successfully


Pipeline Class: StandardPipeline

+-----------------------+---------------------------------------------------------------------------------------+
| Pipeline Property     | Value                                                                                 |
+-----------------------+---------------------------------------------------------------------------------------+
| Train Dataframe Path  | ../datasets/classification/census.csv                                                 |
| Test Dataframe Path   | None                                                                                  |
| Config File Path      | None                                                                                  |
| Pipeline Stages       | Read file, Parse dataset, Execute, Encode, Handle outliers, Execute



==> Completed Stage: Execute
==> Completed Stage: Train test split
Pipeline Stages |████████████████████████████████████████| 7/7 [100%] in 5.1s (1.38/s)

Pipeline Completed Successfully


Pipeline Class: StandardPipeline

+-----------------------+---------------------------------------------------------------------------------------+
| Pipeline Property     | Value                                                                                 |
+-----------------------+---------------------------------------------------------------------------------------+
| Train Dataframe Path  | ../datasets/classification/census.csv                                                 |
| Test Dataframe Path   | None                                                                                  |
| Config File Path      | None                                                                                  |
| Pipeline Stages       | Read file, Parse dataset, Execute, Encode, Handle outliers, Execute



==> Completed Stage: Execute
==> Completed Stage: Train test split
Pipeline Stages |████████████████████████████████████████| 7/7 [100%] in 5.0s (1.39/s)

Pipeline Completed Successfully


Pipeline Class: StandardPipeline

+-----------------------+---------------------------------------------------------------------------------------+
| Pipeline Property     | Value                                                                                 |
+-----------------------+---------------------------------------------------------------------------------------+
| Train Dataframe Path  | ../datasets/classification/census.csv                                                 |
| Test Dataframe Path   | None                                                                                  |
| Config File Path      | None                                                                                  |
| Pipeline Stages       | Read file, Parse dataset, Execute, Encode, Handle outliers, Execute



==> Completed Stage: Execute
==> Completed Stage: Train test split
Pipeline Stages |████████████████████████████████████████| 7/7 [100%] in 5.4s (1.29/s)

Pipeline Completed Successfully


Pipeline Class: StandardPipeline

+-----------------------+---------------------------------------------------------------------------------------+
| Pipeline Property     | Value                                                                                 |
+-----------------------+---------------------------------------------------------------------------------------+
| Train Dataframe Path  | ../datasets/classification/census.csv                                                 |
| Test Dataframe Path   | None                                                                                  |
| Config File Path      | None                                                                                  |
| Pipeline Stages       | Read file, Parse dataset, Execute, Encode, Handle outliers, Execute



==> Completed Stage: Execute
==> Completed Stage: Train test split
Pipeline Stages |████████████████████████████████████████| 7/7 [100%] in 5.3s (1.33/s)

Pipeline Completed Successfully


Pipeline Class: StandardPipeline

+-----------------------+---------------------------------------------------------------------------------------+
| Pipeline Property     | Value                                                                                 |
+-----------------------+---------------------------------------------------------------------------------------+
| Train Dataframe Path  | ../datasets/classification/census.csv                                                 |
| Test Dataframe Path   | None                                                                                  |
| Config File Path      | None                                                                                  |
| Pipeline Stages       | Read file, Parse dataset, Execute, Encode, Handle outliers, Execute



==> Completed Stage: Execute
==> Completed Stage: Train test split
Pipeline Stages |████████████████████████████████████████| 7/7 [100%] in 6.3s (1.12/s)

Pipeline Completed Successfully


Pipeline Class: StandardPipeline

+-----------------------+---------------------------------------------------------------------------------------+
| Pipeline Property     | Value                                                                                 |
+-----------------------+---------------------------------------------------------------------------------------+
| Train Dataframe Path  | ../datasets/classification/census.csv                                                 |
| Test Dataframe Path   | None                                                                                  |
| Config File Path      | None                                                                                  |
| Pipeline Stages       | Read file, Parse dataset, Execute, Encode, Handle outliers, Execute



==> Completed Stage: Execute
==> Completed Stage: Train test split
Pipeline Stages |████████████████████████████████████████| 7/7 [100%] in 4.9s (1.44/s)

Pipeline Completed Successfully


Pipeline Class: StandardPipeline

+-----------------------+---------------------------------------------------------------------------------------+
| Pipeline Property     | Value                                                                                 |
+-----------------------+---------------------------------------------------------------------------------------+
| Train Dataframe Path  | ../datasets/classification/census.csv                                                 |
| Test Dataframe Path   | None                                                                                  |
| Config File Path      | None                                                                                  |
| Pipeline Stages       | Read file, Parse dataset, Execute, Encode, Handle outliers, Execute



==> Completed Stage: Execute
==> Completed Stage: Train test split
Pipeline Stages |████████████████████████████████████████| 7/7 [100%] in 5.2s (1.34/s)

Pipeline Completed Successfully



In [7]:
# Average the per-run measurements gathered by the benchmark loop.
# The run count is derived from the collected data rather than hard-coded,
# so this cell stays correct if the number of benchmark iterations changes.
# NOTE(review): `average_mse` presumably holds the value returned by the
# benchmark function (an accuracy score, despite the "mse" name) -- confirm.
n_runs = len(average_time)
av_time = sum(average_time)
av_mem = sum(average_mem)
av_mse = sum(average_mse)
# Printed as: mean elapsed time, mean peak traced memory / 10**6, mean score.
print(av_time/n_runs,(av_mem/n_runs)/10**6,av_mse/n_runs)

7.444659631252289 519.43007322 0.9295851792186873


## Pandas

In [9]:
def drop_columns(df,column_list):
    """Return a new frame equal to ``df`` minus the columns in ``column_list``.

    ``df`` itself is not modified; the result of ``DataFrame.drop`` is
    handed straight back to the caller.
    """
    return df.drop(column_list, axis="columns")
def fill_missing_values(df,column_list):
    """Fill missing entries of the given columns with each column's mode.

    The filled column is assigned back into ``df``. Calling an in-place
    method on ``df[col]`` alone would only touch a temporary Series and
    leave the frame unchanged, so explicit re-assignment is required.

    Parameters
    ----------
    df : pandas.DataFrame
        Frame to clean. It is modified in place and also returned, so the
        function can be chained with ``DataFrame.pipe``.
    column_list : iterable
        Labels of the columns whose missing values should be filled.

    Returns
    -------
    pandas.DataFrame
        The same ``df`` object, with the listed columns filled.
    """
    for col in column_list:
        # mode() ignores NaN by default; the first entry is used when
        # several values tie for most frequent.
        modes = df[col].mode(dropna=True)
        if modes.empty:
            # Column is entirely missing: nothing sensible to fill with.
            continue
        df[col] = df[col].fillna(modes.iloc[0])
    return df
def encode_cols(df,column_list):
    """Append a label-encoded ``category`` column for each listed column.

    For every label ``c`` in ``column_list`` the ``pd.factorize`` codes of
    ``df[c]`` are stored under ``c + "Encoded"`` with ``category`` dtype.
    The source columns are kept; ``df`` is mutated and returned.
    """
    for source_col in column_list:
        target_col = source_col + "Encoded"
        codes, _uniques = pd.factorize(df[source_col])
        # Build the categorical Series on df's own index so the assignment
        # is positional, exactly as when converting an existing column.
        df[target_col] = pd.Series(codes, index=df.index).astype("category")
    return df

In [10]:
def test_pandas_pipeline(random_state):
    """Run the plain-pandas preprocessing benchmark once.

    Reads ``census.csv``, pipes the frame through ``fill_missing_values``
    (column ``F12``) and ``encode_cols`` (all categorical columns), holds out
    10% of the rows as a test set, removes the raw categorical columns and
    fits a ``DecisionTreeClassifier`` on the remaining features.

    Parameters
    ----------
    random_state
        Seed forwarded to ``train_test_split``. The classifier itself is
        created without a seed.

    Returns
    -------
    The ``metrics.accuracy_score`` of the predictions on the held-out rows.
    """
    df = pd.read_csv('census.csv')
    cat_cols = ['F2','F3','F4','F5','F7','F8','F9','F10','F11','F12','F13','F14','F15','F16','F20','F21','F22','F23','F24','F26','F27','F28','F29','F30','F31','F32','F33','F34','F35','F36','F37','F38','F39','F40','F41']
    df_processed = (
        df
        .pipe(fill_missing_values, ["F12"])
        .pipe(encode_cols, cat_cols.copy())
    )
    X = df_processed.drop(columns=['F42'])
    y = df_processed.loc[:, 'F42']
    X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.1, random_state=random_state)
    # Rebind rather than drop in place: the split frames are selections of X,
    # and mutating them in place can trigger SettingWithCopyWarning.
    # Only the raw categorical columns go; their "...Encoded" twins stay.
    X_train = X_train.drop(columns=cat_cols)
    X_test = X_test.drop(columns=cat_cols)
    clf = DecisionTreeClassifier()
    clf = clf.fit(X_train, y_train)
    y_pred = clf.predict(X_test)
    return metrics.accuracy_score(y_test, y_pred)

In [11]:
# Benchmark the pandas pipeline over 100 runs (run index = split seed).
# Each list collects one value per run:
#   average_time -- elapsed seconds of the run (measured with tracing enabled)
#   average_mem  -- peak traced memory reported by tracemalloc
#   average_mse  -- value returned by the pipeline (an accuracy score,
#                   despite the "mse" name)
average_time = []
average_mem = []
average_mse = []
for i in range(100):
    tracemalloc.start()
    try:
        # perf_counter() is monotonic and high-resolution, so the measured
        # duration cannot be skewed by system clock adjustments.
        begin = time.perf_counter()
        mse = test_pandas_pipeline(i)
        end = time.perf_counter()
        # Must be read before stop(), which discards the collected traces.
        current,peak=tracemalloc.get_traced_memory()
    finally:
        # Always switch tracing off, even if the run raised, so later cells
        # are not slowed down by a tracer left running.
        tracemalloc.stop()
    average_time.append(end-begin)
    average_mem.append(peak)
    average_mse.append(mse)

In [12]:
# Average the per-run measurements gathered by the pandas benchmark loop.
# The run count is derived from the collected data rather than hard-coded,
# so this cell stays correct if the number of benchmark iterations changes.
# `average_mse` holds accuracy scores (the pipeline returns
# metrics.accuracy_score), despite the "mse" name.
n_runs = len(average_time)
av_time = sum(average_time)
av_mem = sum(average_mem)
av_mse = sum(average_mse)
# Printed as: mean elapsed seconds, mean peak traced memory / 10**6, mean accuracy.
print(av_time/n_runs,(av_mem/n_runs)/10**6,av_mse/n_runs)

4.612936568260193 251.25219494 0.9295379140981307


## Sklearn

In [13]:
def test_sklearn_pipeline(random_state_num):
    """Run the scikit-learn preprocessing benchmark once.

    Builds a ``ColumnTransformer`` that mean-imputes and standard-scales the
    numeric columns and one-hot encodes the categorical columns (unknown
    categories are ignored at predict time), chains it with a
    ``DecisionTreeClassifier``, then fits on 90% of ``census.csv`` and scores
    on the remaining 10%.

    Parameters
    ----------
    random_state_num
        Seed forwarded to ``train_test_split``. The classifier itself is
        created without a seed.

    Returns
    -------
    The ``metrics.accuracy_score`` of the predictions on the held-out rows.
    """
    numeric_features = ['F1','F6','F17','F18','F19','F25']
    categorical_features = ['F2','F3','F4','F5','F7','F8','F9','F10','F11','F12','F13','F14','F15','F16','F20','F21','F22','F23','F24','F26','F27','F28','F29','F30','F31','F32','F33','F34','F35','F36','F37','F38','F39','F40','F41']
    categorical_transformer = Pipeline(
        steps=[('ohe',OneHotEncoder(handle_unknown="ignore"))]
    )
    numeric_transformer = Pipeline(
        steps=[("imputer", SimpleImputer(strategy="mean")),("scaler", StandardScaler())]
    )
    # Each transformer is applied only to its own column subset.
    preprocessor = ColumnTransformer(
        transformers=[
            ('num',numeric_transformer,numeric_features),
            ("cat", categorical_transformer, categorical_features),
        ]
    )
    # Preprocessing and model are fitted together, so the transformers only
    # ever see the training split.
    clf = Pipeline(
        steps=[("preprocessor", preprocessor), ("classifier", DecisionTreeClassifier())]
    )
    df = pd.read_csv('census.csv')
    X,y = df.drop(columns=['F42']),df.loc[:,'F42']
    X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.1, random_state=random_state_num)
    clf.fit(X_train, y_train)
    y_pred = clf.predict(X_test)
    return metrics.accuracy_score(y_test,y_pred)

In [14]:
# Benchmark the scikit-learn pipeline over 100 runs (run index = split seed).
# Each list collects one value per run:
#   average_time -- elapsed seconds of the run (measured with tracing enabled)
#   average_mem  -- peak traced memory reported by tracemalloc
#   average_mse  -- value returned by the pipeline (an accuracy score,
#                   despite the "mse" name)
average_time = []
average_mem = []
average_mse = []
for i in range(100):
    tracemalloc.start()
    try:
        # perf_counter() is monotonic and high-resolution, so the measured
        # duration cannot be skewed by system clock adjustments.
        begin = time.perf_counter()
        mse = test_sklearn_pipeline(i)
        end = time.perf_counter()
        # Must be read before stop(), which discards the collected traces.
        current,peak=tracemalloc.get_traced_memory()
    finally:
        # Always switch tracing off, even if the run raised, so later cells
        # are not slowed down by a tracer left running.
        tracemalloc.stop()
    average_time.append(end-begin)
    average_mem.append(peak)
    average_mse.append(mse)

In [15]:
# Average the per-run measurements gathered by the scikit-learn benchmark loop.
# The run count is derived from the collected data rather than hard-coded,
# so this cell stays correct if the number of benchmark iterations changes.
# `average_mse` holds accuracy scores (the pipeline returns
# metrics.accuracy_score), despite the "mse" name.
n_runs = len(average_time)
av_time = sum(average_time)
av_mem = sum(average_mem)
av_mse = sum(average_mse)
# Printed as: mean elapsed seconds, mean peak traced memory / 10**6, mean accuracy.
print(av_time/n_runs,(av_mem/n_runs)/10**6,av_mse/n_runs)

38.31784860610962 550.17933483 0.9340830952738934
