In [40]:
%matplotlib inline
%load_ext autoreload
%autoreload 2

The autoreload extension is already loaded. To reload it, use:
  %reload_ext autoreload


In [41]:
import os
import warnings
warnings.filterwarnings('ignore')
os.environ["PYTHONWARNINGS"] = "ignore"

In [42]:
# The cells below use paths relative to the repository root ('configs',
# 'results', 'data'), so move there if the kernel was started elsewhere.
# os.path.basename is used instead of splitting on '/' so the check also works
# with Windows path separators (otherwise every re-run would climb further up).
# NOTE(review): assumes the notebook lives two levels below a checkout named
# "fairness-variance" -- confirm if the repo can be cloned under another name.
cur_folder_name = os.path.basename(os.getcwd())
if cur_folder_name != "fairness-variance":
    os.chdir(os.path.join(os.pardir, os.pardir))

print('Current location: ', os.getcwd())

Current location:  /home/denys_herasymuk/UCU/4course_2term/Bachelor_Thesis/Code/fairness-variance


## Import dependencies

In [43]:
import os
import pandas as pd
from datetime import datetime, timezone

from configs.models_config_for_tuning import MODELS_CONFIG
from source.utils.custom_initializers import create_config_obj, create_models_config_from_tuned_params_df
from source.user_interfaces.metrics_computation_interfaces import compute_metrics_multiple_runs
from source.custom_classes.data_loaders import ACSEmploymentDataset

## Configs

In [44]:
# Experiment settings are read from the YAML file under configs/.
config = create_config_obj(
    config_yaml_path=os.path.join('configs', 'experiment1_folktables_GA_2018_config.yaml'),
)

# Input: results of an earlier tuning run. The timestamp in the file name is
# pinned to that specific run and must be updated when models are re-tuned.
TUNED_PARAMS_FILE_PATH = os.path.join(
    'results',
    'models_tuning',
    f'tuning_results_{config.dataset_name}_20230117__023240.csv',
)

# Output: a fresh directory per execution, suffixed with the current UTC time
# so that repeated runs never overwrite each other.
SAVE_RESULTS_DIR_PATH = os.path.join(
    'results',
    'hypothesis_space',
    f'{config.dataset_name}_Metrics_{datetime.now(timezone.utc):%Y%m%d__%H%M%S}',
)

## Tuned model hyper-parameters

In [45]:
# One row per tuned model: its scores and the best hyper-parameters found.
# NOTE(review): the displayed frame carries 'Unnamed: 0.1' / 'Unnamed: 0'
# columns, which suggests the CSV was written with its index more than once --
# confirm whether downstream code needs them.
models_tuned_params_df = pd.read_csv(filepath_or_buffer=TUNED_PARAMS_FILE_PATH)
display(models_tuned_params_df)

Unnamed: 0.1,Unnamed: 0,Dataset_Name,Model_Name,F1_Score,Accuracy_Score,Model_Best_Params
0,0,Folktables_GA_2018,LogisticRegression,0.8195,0.8203,"{'C': 1, 'max_iter': 150, 'penalty': 'l2', 'so..."
1,1,Folktables_GA_2018,DecisionTreeClassifier,0.8304,0.8313,"{'criterion': 'gini', 'max_depth': 10, 'max_fe..."
2,2,Folktables_GA_2018,RandomForestClassifier,0.8354,0.8357,"{'max_depth': 10, 'max_features': 0.6, 'min_sa..."
3,3,Folktables_GA_2018,XGBClassifier,0.8371,0.8375,"{'lambda': 1, 'learning_rate': 0.1, 'max_depth..."
4,4,Folktables_GA_2018,KNeighborsClassifier,0.8136,0.8137,"{'metric': 'minkowski', 'n_neighbors': 25, 'we..."
5,5,Folktables_GA_2018,MLPClassifier,0.8345,0.8353,"{'activation': 'logistic', 'hidden_layer_sizes..."


In [46]:
# Combine the tuning-time model definitions with the best parameters loaded
# from the tuning results to obtain the models used in this experiment.
experiment_models_config = create_models_config_from_tuned_params_df(
    models_tuned_params_df=models_tuned_params_df,
    models_config_for_tuning=MODELS_CONFIG,
)

In [47]:
# Show which models will actually be analysed.
# NOTE(review): the tuned-params table lists six models (incl. MLPClassifier),
# but only five names are displayed here -- presumably MLPClassifier is absent
# from MODELS_CONFIG; confirm that dropping it is intended.
experiment_models_config.keys()

dict_keys(['DecisionTreeClassifier', 'LogisticRegression', 'RandomForestClassifier', 'XGBClassifier', 'KNeighborsClassifier'])

## Load dataset

In [48]:
# ACS Employment data for Georgia, 2018, subsampled to 20,000 rows.
# NOTE(review): no seed is passed for the subsample here -- confirm that the
# loader fixes one internally, otherwise runs are not reproducible.
dataset = ACSEmploymentDataset(
    state=['GA'],
    year=2018,
    root_dir='data',
    with_nulls=False,
    subsample=20000,
)
dataset.X_data.head()

Unnamed: 0,MAR,MIL,ESP,MIG,DREM,NATIVITY,DIS,DEAR,DEYE,SEX,RAC1P,RELP,CIT,ANC,SCHL,AGEP
83782,5,0,7,1,2,1,2,2,2,2,1,2,1,1,11,15
62505,1,4,0,3,2,2,2,2,2,1,6,0,5,1,21,29
27600,1,4,0,1,2,2,2,2,2,2,2,1,5,1,19,39
36286,1,4,0,1,2,1,2,2,2,1,1,0,1,1,21,56
40527,5,4,0,1,2,1,2,2,2,2,1,0,1,1,19,44


## Run experiments

In [49]:
# Run the full metrics computation for every configured model; according to
# the log below this repeats over several runs, each analysing all models with
# bootstrap-based testing. Results are written under SAVE_RESULTS_DIR_PATH
# (presumably -- verify against compute_metrics_multiple_runs).
multiple_runs_metrics_dct = compute_metrics_multiple_runs(
    dataset,
    config,
    experiment_models_config,
    SAVE_RESULTS_DIR_PATH,
    debug_mode=False,
)

Analyze models in one run:   0%|          | 0/5 [00:00<?, ?it/s]2023-01-24 01:44:04 abstract_overall_variance_analyzer.py INFO    : Start classifiers testing by bootstrap


##############################  [Model 1 / 5] Analyze DecisionTreeClassifier  ##############################
Model random_state:  101
Baseline X_train shape:  (16000, 16)
Baseline X_test shape:  (4000, 16)





Classifiers testing by bootstrap:   0%|          | 0/10 [00:00<?, ?it/s][A
Classifiers testing by bootstrap:  30%|███       | 3/10 [00:00<00:00, 27.05it/s][A
Classifiers testing by bootstrap: 100%|██████████| 10/10 [00:00<00:00, 30.74it/s][A
2023-01-24 01:44:04 abstract_overall_variance_analyzer.py INFO    : Successfully tested classifiers by bootstrap






2023-01-24 01:44:05 abstract_overall_variance_analyzer.py INFO    : Successfully computed predict proba metrics




##############################  Stability metrics  ##############################
General Ensemble Accuracy: 0.822
Mean: 0.5412
Std: 0.0503
IQR: 0.0506
Entropy: 0.0
Jitter: 0.0408
Per sample accuracy: 0.8203
Label stability: 0.9448




Analyze models in one run:  20%|██        | 1/5 [00:03<00:13,  3.49s/it]2023-01-24 01:44:07 abstract_overall_variance_analyzer.py INFO    : Start classifiers testing by bootstrap






##############################  [Model 2 / 5] Analyze LogisticRegression  ##############################
Model random_state:  102
Baseline X_train shape:  (16000, 16)
Baseline X_test shape:  (4000, 16)





Classifiers testing by bootstrap:   0%|          | 0/10 [00:00<?, ?it/s][A
Classifiers testing by bootstrap:  10%|█         | 1/10 [00:00<00:06,  1.45it/s][A
Classifiers testing by bootstrap:  20%|██        | 2/10 [00:01<00:05,  1.50it/s][A
Classifiers testing by bootstrap:  30%|███       | 3/10 [00:01<00:04,  1.74it/s][A
Classifiers testing by bootstrap:  40%|████      | 4/10 [00:02<00:03,  1.90it/s][A
Classifiers testing by bootstrap:  50%|█████     | 5/10 [00:02<00:02,  1.85it/s][A
Classifiers testing by bootstrap:  60%|██████    | 6/10 [00:03<00:02,  1.91it/s][A
Classifiers testing by bootstrap:  70%|███████   | 7/10 [00:03<00:01,  2.01it/s][A
Classifiers testing by bootstrap:  80%|████████  | 8/10 [00:04<00:00,  2.08it/s][A
Classifiers testing by bootstrap:  90%|█████████ | 9/10 [00:04<00:00,  2.13it/s][A
Classifiers testing by bootstrap: 100%|██████████| 10/10 [00:05<00:00,  1.95it/s][A
2023-01-24 01:44:12 abstract_overall_variance_analyzer.py INFO    : Successfully t





2023-01-24 01:44:13 abstract_overall_variance_analyzer.py INFO    : Successfully computed predict proba metrics




##############################  Stability metrics  ##############################
General Ensemble Accuracy: 0.821
Mean: 0.5588
Std: 0.0233
IQR: 0.0279
Entropy: 0.0
Jitter: 0.0364
Per sample accuracy: 0.819
Label stability: 0.9522




Analyze models in one run:  40%|████      | 2/5 [00:11<00:18,  6.18s/it]2023-01-24 01:44:15 abstract_overall_variance_analyzer.py INFO    : Start classifiers testing by bootstrap






##############################  [Model 3 / 5] Analyze RandomForestClassifier  ##############################
Model random_state:  103
Baseline X_train shape:  (16000, 16)
Baseline X_test shape:  (4000, 16)





Classifiers testing by bootstrap:   0%|          | 0/10 [00:00<?, ?it/s][A
Classifiers testing by bootstrap:  10%|█         | 1/10 [00:01<00:14,  1.59s/it][A
Classifiers testing by bootstrap:  20%|██        | 2/10 [00:03<00:12,  1.62s/it][A
Classifiers testing by bootstrap:  30%|███       | 3/10 [00:05<00:12,  1.79s/it][A
Classifiers testing by bootstrap:  40%|████      | 4/10 [00:07<00:11,  1.85s/it][A
Classifiers testing by bootstrap:  50%|█████     | 5/10 [00:08<00:09,  1.81s/it][A
Classifiers testing by bootstrap:  60%|██████    | 6/10 [00:10<00:07,  1.79s/it][A
Classifiers testing by bootstrap:  70%|███████   | 7/10 [00:12<00:05,  1.96s/it][A
Classifiers testing by bootstrap:  80%|████████  | 8/10 [00:14<00:03,  1.97s/it][A
Classifiers testing by bootstrap:  90%|█████████ | 9/10 [00:16<00:01,  1.93s/it][A
Classifiers testing by bootstrap: 100%|██████████| 10/10 [00:18<00:00,  1.84s/it][A
2023-01-24 01:44:34 abstract_overall_variance_analyzer.py INFO    : Successfully t





2023-01-24 01:44:34 abstract_overall_variance_analyzer.py INFO    : Successfully computed predict proba metrics




##############################  Stability metrics  ##############################
General Ensemble Accuracy: 0.8282
Mean: 0.5447
Std: 0.0332
IQR: 0.0403
Entropy: 0.0
Jitter: 0.0412
Per sample accuracy: 0.824
Label stability: 0.9456




Analyze models in one run:  60%|██████    | 3/5 [00:34<00:27, 13.70s/it]2023-01-24 01:44:38 abstract_overall_variance_analyzer.py INFO    : Start classifiers testing by bootstrap






##############################  [Model 4 / 5] Analyze XGBClassifier  ##############################
Model random_state:  104
Baseline X_train shape:  (16000, 16)
Baseline X_test shape:  (4000, 16)





Classifiers testing by bootstrap:   0%|          | 0/10 [00:00<?, ?it/s][A
Classifiers testing by bootstrap:  10%|█         | 1/10 [00:02<00:23,  2.67s/it][A
Classifiers testing by bootstrap:  20%|██        | 2/10 [00:04<00:17,  2.21s/it][A
Classifiers testing by bootstrap:  30%|███       | 3/10 [00:08<00:20,  2.89s/it][A
Classifiers testing by bootstrap:  40%|████      | 4/10 [00:12<00:20,  3.40s/it][A
Classifiers testing by bootstrap:  50%|█████     | 5/10 [00:14<00:15,  3.03s/it][A
Classifiers testing by bootstrap:  60%|██████    | 6/10 [00:16<00:10,  2.65s/it][A
Classifiers testing by bootstrap:  70%|███████   | 7/10 [00:19<00:08,  2.70s/it][A
Classifiers testing by bootstrap:  80%|████████  | 8/10 [00:21<00:05,  2.56s/it][A
Classifiers testing by bootstrap:  90%|█████████ | 9/10 [00:25<00:03,  3.06s/it][A
Classifiers testing by bootstrap: 100%|██████████| 10/10 [00:28<00:00,  2.82s/it][A
2023-01-24 01:45:06 abstract_overall_variance_analyzer.py INFO    : Successfully t





2023-01-24 01:45:07 abstract_overall_variance_analyzer.py INFO    : Successfully computed predict proba metrics




##############################  Stability metrics  ##############################
General Ensemble Accuracy: 0.831
Mean: 0.5443999767303467
Std: 0.029400000348687172
IQR: 0.0351
Entropy: 0.0
Jitter: 0.0341
Per sample accuracy: 0.8281
Label stability: 0.956




Analyze models in one run:  80%|████████  | 4/5 [01:05<00:20, 20.80s/it]2023-01-24 01:45:10 abstract_overall_variance_analyzer.py INFO    : Start classifiers testing by bootstrap






##############################  [Model 5 / 5] Analyze KNeighborsClassifier  ##############################
Model random_state:  None
Baseline X_train shape:  (16000, 16)
Baseline X_test shape:  (4000, 16)





Classifiers testing by bootstrap:   0%|          | 0/10 [00:00<?, ?it/s][A
Classifiers testing by bootstrap:  10%|█         | 1/10 [00:00<00:01,  5.90it/s][A
Classifiers testing by bootstrap:  20%|██        | 2/10 [00:00<00:01,  5.24it/s][A
Classifiers testing by bootstrap:  30%|███       | 3/10 [00:00<00:01,  4.24it/s][A
Classifiers testing by bootstrap:  40%|████      | 4/10 [00:00<00:01,  4.22it/s][A
Classifiers testing by bootstrap:  50%|█████     | 5/10 [00:01<00:01,  4.21it/s][A
Classifiers testing by bootstrap:  60%|██████    | 6/10 [00:01<00:00,  4.13it/s][A
Classifiers testing by bootstrap:  70%|███████   | 7/10 [00:01<00:00,  4.17it/s][A
Classifiers testing by bootstrap:  80%|████████  | 8/10 [00:01<00:00,  4.20it/s][A
Classifiers testing by bootstrap:  90%|█████████ | 9/10 [00:02<00:00,  4.03it/s][A
Classifiers testing by bootstrap: 100%|██████████| 10/10 [00:02<00:00,  4.02it/s][A
2023-01-24 01:45:12 abstract_overall_variance_analyzer.py INFO    : Successfully t





2023-01-24 01:45:13 abstract_overall_variance_analyzer.py INFO    : Successfully computed predict proba metrics




##############################  Stability metrics  ##############################
General Ensemble Accuracy: 0.8128
Mean: 0.5229
Std: 0.0672
IQR: 0.0805
Entropy: 0.0
Jitter: 0.0821
Per sample accuracy: 0.8032
Label stability: 0.8939




Analyze models in one run: 100%|██████████| 5/5 [01:11<00:00, 14.38s/it]








Analyze models in one run:   0%|          | 0/5 [00:00<?, ?it/s]2023-01-24 01:45:16 abstract_overall_variance_analyzer.py INFO    : Start classifiers testing by bootstrap


##############################  [Model 1 / 5] Analyze DecisionTreeClassifier  ##############################
Model random_state:  201
Baseline X_train shape:  (16000, 16)
Baseline X_test shape:  (4000, 16)





Classifiers testing by bootstrap:   0%|          | 0/10 [00:00<?, ?it/s][A
Classifiers testing by bootstrap:  30%|███       | 3/10 [00:00<00:00, 27.75it/s][A
Classifiers testing by bootstrap: 100%|██████████| 10/10 [00:00<00:00, 31.56it/s][A
2023-01-24 01:45:16 abstract_overall_variance_analyzer.py INFO    : Successfully tested classifiers by bootstrap






2023-01-24 01:45:17 abstract_overall_variance_analyzer.py INFO    : Successfully computed predict proba metrics




##############################  Stability metrics  ##############################
General Ensemble Accuracy: 0.8242
Mean: 0.5579
Std: 0.0516
IQR: 0.0606
Entropy: 0.0
Jitter: 0.0505
Per sample accuracy: 0.8214
Label stability: 0.932




Analyze models in one run:  20%|██        | 1/5 [00:03<00:13,  3.45s/it]2023-01-24 01:45:19 abstract_overall_variance_analyzer.py INFO    : Start classifiers testing by bootstrap






##############################  [Model 2 / 5] Analyze LogisticRegression  ##############################
Model random_state:  202
Baseline X_train shape:  (16000, 16)
Baseline X_test shape:  (4000, 16)





Classifiers testing by bootstrap:   0%|          | 0/10 [00:00<?, ?it/s][A
Classifiers testing by bootstrap:  10%|█         | 1/10 [00:00<00:04,  2.09it/s][A
Classifiers testing by bootstrap:  20%|██        | 2/10 [00:01<00:04,  1.80it/s][A
Classifiers testing by bootstrap:  30%|███       | 3/10 [00:01<00:04,  1.71it/s][A
Classifiers testing by bootstrap:  40%|████      | 4/10 [00:02<00:03,  1.64it/s][A
Classifiers testing by bootstrap:  50%|█████     | 5/10 [00:02<00:03,  1.61it/s][A
Classifiers testing by bootstrap:  60%|██████    | 6/10 [00:03<00:02,  1.56it/s][A
Classifiers testing by bootstrap:  70%|███████   | 7/10 [00:04<00:01,  1.61it/s][A
Classifiers testing by bootstrap:  80%|████████  | 8/10 [00:04<00:01,  1.53it/s][A
Classifiers testing by bootstrap:  90%|█████████ | 9/10 [00:05<00:00,  1.66it/s][A
Classifiers testing by bootstrap: 100%|██████████| 10/10 [00:05<00:00,  1.67it/s][A
2023-01-24 01:45:25 abstract_overall_variance_analyzer.py INFO    : Successfully t





2023-01-24 01:45:26 abstract_overall_variance_analyzer.py INFO    : Successfully computed predict proba metrics




##############################  Stability metrics  ##############################
General Ensemble Accuracy: 0.8102
Mean: 0.5515
Std: 0.0221
IQR: 0.0269
Entropy: 0.045
Jitter: 0.0328
Per sample accuracy: 0.8095
Label stability: 0.9568




Analyze models in one run:  40%|████      | 2/5 [00:12<00:20,  6.79s/it]2023-01-24 01:45:28 abstract_overall_variance_analyzer.py INFO    : Start classifiers testing by bootstrap






##############################  [Model 3 / 5] Analyze RandomForestClassifier  ##############################
Model random_state:  203
Baseline X_train shape:  (16000, 16)
Baseline X_test shape:  (4000, 16)





Classifiers testing by bootstrap:   0%|          | 0/10 [00:00<?, ?it/s][A
Classifiers testing by bootstrap:  10%|█         | 1/10 [00:01<00:13,  1.49s/it][A
Classifiers testing by bootstrap:  20%|██        | 2/10 [00:02<00:11,  1.45s/it][A
Classifiers testing by bootstrap:  30%|███       | 3/10 [00:04<00:10,  1.44s/it][A
Classifiers testing by bootstrap:  40%|████      | 4/10 [00:05<00:09,  1.50s/it][A
Classifiers testing by bootstrap:  50%|█████     | 5/10 [00:07<00:07,  1.51s/it][A
Classifiers testing by bootstrap:  60%|██████    | 6/10 [00:09<00:06,  1.53s/it][A
Classifiers testing by bootstrap:  70%|███████   | 7/10 [00:10<00:04,  1.57s/it][A
Classifiers testing by bootstrap:  80%|████████  | 8/10 [00:12<00:03,  1.68s/it][A
Classifiers testing by bootstrap:  90%|█████████ | 9/10 [00:14<00:01,  1.64s/it][A
Classifiers testing by bootstrap: 100%|██████████| 10/10 [00:16<00:00,  1.61s/it][A
2023-01-24 01:45:44 abstract_overall_variance_analyzer.py INFO    : Successfully t





2023-01-24 01:45:45 abstract_overall_variance_analyzer.py INFO    : Successfully computed predict proba metrics




##############################  Stability metrics  ##############################
General Ensemble Accuracy: 0.841
Mean: 0.5465
Std: 0.0315
IQR: 0.0374
Entropy: 0.0
Jitter: 0.0305
Per sample accuracy: 0.8378
Label stability: 0.9613




Analyze models in one run:  60%|██████    | 3/5 [00:32<00:25, 12.60s/it]2023-01-24 01:45:48 abstract_overall_variance_analyzer.py INFO    : Start classifiers testing by bootstrap






##############################  [Model 4 / 5] Analyze XGBClassifier  ##############################
Model random_state:  204
Baseline X_train shape:  (16000, 16)
Baseline X_test shape:  (4000, 16)





Classifiers testing by bootstrap:   0%|          | 0/10 [00:00<?, ?it/s][A
Classifiers testing by bootstrap:  10%|█         | 1/10 [00:02<00:18,  2.05s/it][A
Classifiers testing by bootstrap:  20%|██        | 2/10 [00:05<00:22,  2.75s/it][A
Classifiers testing by bootstrap:  30%|███       | 3/10 [00:07<00:16,  2.35s/it][A
Classifiers testing by bootstrap:  40%|████      | 4/10 [00:08<00:12,  2.11s/it][A
Classifiers testing by bootstrap:  50%|█████     | 5/10 [00:11<00:11,  2.30s/it][A
Classifiers testing by bootstrap:  60%|██████    | 6/10 [00:13<00:08,  2.16s/it][A
Classifiers testing by bootstrap:  70%|███████   | 7/10 [00:18<00:09,  3.02s/it][A
Classifiers testing by bootstrap:  80%|████████  | 8/10 [00:20<00:05,  2.67s/it][A
Classifiers testing by bootstrap:  90%|█████████ | 9/10 [00:24<00:03,  3.04s/it][A
Classifiers testing by bootstrap: 100%|██████████| 10/10 [00:25<00:00,  2.59s/it][A
2023-01-24 01:46:14 abstract_overall_variance_analyzer.py INFO    : Successfully t





2023-01-24 01:46:15 abstract_overall_variance_analyzer.py INFO    : Successfully computed predict proba metrics




##############################  Stability metrics  ##############################
General Ensemble Accuracy: 0.835
Mean: 0.5577999949455261
Std: 0.0284000001847744
IQR: 0.0332
Entropy: 0.0
Jitter: 0.0296
Per sample accuracy: 0.8328
Label stability: 0.9624




Analyze models in one run:  80%|████████  | 4/5 [01:01<00:19, 19.27s/it]2023-01-24 01:46:17 abstract_overall_variance_analyzer.py INFO    : Start classifiers testing by bootstrap






##############################  [Model 5 / 5] Analyze KNeighborsClassifier  ##############################
Model random_state:  None
Baseline X_train shape:  (16000, 16)
Baseline X_test shape:  (4000, 16)





Classifiers testing by bootstrap:   0%|          | 0/10 [00:00<?, ?it/s][A
Classifiers testing by bootstrap:  10%|█         | 1/10 [00:00<00:02,  3.95it/s][A
Classifiers testing by bootstrap:  20%|██        | 2/10 [00:00<00:01,  4.17it/s][A
Classifiers testing by bootstrap:  30%|███       | 3/10 [00:00<00:01,  4.03it/s][A
Classifiers testing by bootstrap:  40%|████      | 4/10 [00:00<00:01,  4.21it/s][A
Classifiers testing by bootstrap:  50%|█████     | 5/10 [00:01<00:01,  3.91it/s][A
Classifiers testing by bootstrap:  60%|██████    | 6/10 [00:01<00:01,  3.50it/s][A
Classifiers testing by bootstrap:  70%|███████   | 7/10 [00:01<00:00,  3.31it/s][A
Classifiers testing by bootstrap:  80%|████████  | 8/10 [00:02<00:00,  3.49it/s][A
Classifiers testing by bootstrap:  90%|█████████ | 9/10 [00:02<00:00,  3.51it/s][A
Classifiers testing by bootstrap: 100%|██████████| 10/10 [00:02<00:00,  3.52it/s][A
2023-01-24 01:46:20 abstract_overall_variance_analyzer.py INFO    : Successfully t





2023-01-24 01:46:21 abstract_overall_variance_analyzer.py INFO    : Successfully computed predict proba metrics




##############################  Stability metrics  ##############################
General Ensemble Accuracy: 0.7985
Mean: 0.5187
Std: 0.0685
IQR: 0.0827
Entropy: 0.1199
Jitter: 0.0876
Per sample accuracy: 0.7909
Label stability: 0.8848




Analyze models in one run: 100%|██████████| 5/5 [01:07<00:00, 13.55s/it]








Analyze models in one run:   0%|          | 0/5 [00:00<?, ?it/s]2023-01-24 01:46:23 abstract_overall_variance_analyzer.py INFO    : Start classifiers testing by bootstrap


##############################  [Model 1 / 5] Analyze DecisionTreeClassifier  ##############################
Model random_state:  301
Baseline X_train shape:  (16000, 16)
Baseline X_test shape:  (4000, 16)





Classifiers testing by bootstrap:   0%|          | 0/10 [00:00<?, ?it/s][A
Classifiers testing by bootstrap:  40%|████      | 4/10 [00:00<00:00, 33.49it/s][A
Classifiers testing by bootstrap: 100%|██████████| 10/10 [00:00<00:00, 34.13it/s][A
2023-01-24 01:46:24 abstract_overall_variance_analyzer.py INFO    : Successfully tested classifiers by bootstrap






2023-01-24 01:46:24 abstract_overall_variance_analyzer.py INFO    : Successfully computed predict proba metrics




##############################  Stability metrics  ##############################
General Ensemble Accuracy: 0.8168
Mean: 0.5589
Std: 0.0535
IQR: 0.0584
Entropy: 0.0
Jitter: 0.0462
Per sample accuracy: 0.8112
Label stability: 0.9428




Analyze models in one run:  20%|██        | 1/5 [00:03<00:13,  3.37s/it]2023-01-24 01:46:27 abstract_overall_variance_analyzer.py INFO    : Start classifiers testing by bootstrap






##############################  [Model 2 / 5] Analyze LogisticRegression  ##############################
Model random_state:  302
Baseline X_train shape:  (16000, 16)
Baseline X_test shape:  (4000, 16)





Classifiers testing by bootstrap:   0%|          | 0/10 [00:00<?, ?it/s][A
Classifiers testing by bootstrap:  10%|█         | 1/10 [00:00<00:03,  2.27it/s][A
Classifiers testing by bootstrap:  20%|██        | 2/10 [00:00<00:03,  2.13it/s][A
Classifiers testing by bootstrap:  30%|███       | 3/10 [00:01<00:03,  1.99it/s][A
Classifiers testing by bootstrap:  40%|████      | 4/10 [00:02<00:03,  1.92it/s][A
Classifiers testing by bootstrap:  50%|█████     | 5/10 [00:02<00:03,  1.64it/s][A
Classifiers testing by bootstrap:  60%|██████    | 6/10 [00:03<00:02,  1.60it/s][A
Classifiers testing by bootstrap:  70%|███████   | 7/10 [00:05<00:03,  1.01s/it][A
Classifiers testing by bootstrap:  80%|████████  | 8/10 [00:06<00:01,  1.05it/s][A
Classifiers testing by bootstrap:  90%|█████████ | 9/10 [00:06<00:00,  1.20it/s][A
Classifiers testing by bootstrap: 100%|██████████| 10/10 [00:07<00:00,  1.39it/s][A
2023-01-24 01:46:34 abstract_overall_variance_analyzer.py INFO    : Successfully t





2023-01-24 01:46:35 abstract_overall_variance_analyzer.py INFO    : Successfully computed predict proba metrics




##############################  Stability metrics  ##############################
General Ensemble Accuracy: 0.8142
Mean: 0.5461
Std: 0.0219
IQR: 0.0266
Entropy: 0.0
Jitter: 0.0321
Per sample accuracy: 0.8135
Label stability: 0.9586




Analyze models in one run:  40%|████      | 2/5 [00:14<00:23,  7.74s/it]2023-01-24 01:46:37 abstract_overall_variance_analyzer.py INFO    : Start classifiers testing by bootstrap






##############################  [Model 3 / 5] Analyze RandomForestClassifier  ##############################
Model random_state:  303
Baseline X_train shape:  (16000, 16)
Baseline X_test shape:  (4000, 16)





Classifiers testing by bootstrap:   0%|          | 0/10 [00:00<?, ?it/s][A
Classifiers testing by bootstrap:  10%|█         | 1/10 [00:01<00:14,  1.61s/it][A
Classifiers testing by bootstrap:  20%|██        | 2/10 [00:03<00:14,  1.80s/it][A
Classifiers testing by bootstrap:  30%|███       | 3/10 [00:05<00:12,  1.79s/it][A
Classifiers testing by bootstrap:  40%|████      | 4/10 [00:07<00:10,  1.78s/it][A
Classifiers testing by bootstrap:  50%|█████     | 5/10 [00:09<00:09,  1.87s/it][A
Classifiers testing by bootstrap:  60%|██████    | 6/10 [00:11<00:07,  1.95s/it][A
Classifiers testing by bootstrap:  70%|███████   | 7/10 [00:13<00:05,  1.92s/it][A
Classifiers testing by bootstrap:  80%|████████  | 8/10 [00:15<00:03,  2.00s/it][A
Classifiers testing by bootstrap:  90%|█████████ | 9/10 [00:17<00:02,  2.08s/it][A
Classifiers testing by bootstrap: 100%|██████████| 10/10 [00:19<00:00,  1.93s/it][A
2023-01-24 01:46:57 abstract_overall_variance_analyzer.py INFO    : Successfully t





2023-01-24 01:46:58 abstract_overall_variance_analyzer.py INFO    : Successfully computed predict proba metrics




##############################  Stability metrics  ##############################
General Ensemble Accuracy: 0.8385
Mean: 0.5481
Std: 0.0335
IQR: 0.0391
Entropy: 0.0
Jitter: 0.0334
Per sample accuracy: 0.8362
Label stability: 0.9571




Analyze models in one run:  60%|██████    | 3/5 [00:36<00:28, 14.38s/it]2023-01-24 01:47:00 abstract_overall_variance_analyzer.py INFO    : Start classifiers testing by bootstrap






##############################  [Model 4 / 5] Analyze XGBClassifier  ##############################
Model random_state:  304
Baseline X_train shape:  (16000, 16)
Baseline X_test shape:  (4000, 16)





Classifiers testing by bootstrap:   0%|          | 0/10 [00:00<?, ?it/s][A
Classifiers testing by bootstrap:  10%|█         | 1/10 [00:01<00:15,  1.69s/it][A
Classifiers testing by bootstrap:  20%|██        | 2/10 [00:03<00:16,  2.01s/it][A
Classifiers testing by bootstrap:  30%|███       | 3/10 [00:06<00:16,  2.38s/it][A
Classifiers testing by bootstrap:  40%|████      | 4/10 [00:09<00:15,  2.62s/it][A
Classifiers testing by bootstrap:  50%|█████     | 5/10 [00:13<00:15,  3.03s/it][A
Classifiers testing by bootstrap:  60%|██████    | 6/10 [00:15<00:10,  2.67s/it][A
Classifiers testing by bootstrap:  70%|███████   | 7/10 [00:18<00:08,  2.77s/it][A
Classifiers testing by bootstrap:  80%|████████  | 8/10 [00:20<00:04,  2.42s/it][A
Classifiers testing by bootstrap:  90%|█████████ | 9/10 [00:24<00:03,  3.13s/it][A
Classifiers testing by bootstrap: 100%|██████████| 10/10 [00:27<00:00,  2.78s/it][A
2023-01-24 01:47:28 abstract_overall_variance_analyzer.py INFO    : Successfully t





2023-01-24 01:47:29 abstract_overall_variance_analyzer.py INFO    : Successfully computed predict proba metrics




##############################  Stability metrics  ##############################
General Ensemble Accuracy: 0.8255
Mean: 0.5392000079154968
Std: 0.02810000069439411
IQR: 0.0334
Entropy: 0.0
Jitter: 0.028
Per sample accuracy: 0.8249
Label stability: 0.964




Analyze models in one run:  80%|████████  | 4/5 [01:07<00:21, 21.07s/it]2023-01-24 01:47:31 abstract_overall_variance_analyzer.py INFO    : Start classifiers testing by bootstrap






##############################  [Model 5 / 5] Analyze KNeighborsClassifier  ##############################
Model random_state:  None
Baseline X_train shape:  (16000, 16)
Baseline X_test shape:  (4000, 16)





Classifiers testing by bootstrap:   0%|          | 0/10 [00:00<?, ?it/s][A
Classifiers testing by bootstrap:  10%|█         | 1/10 [00:00<00:01,  4.98it/s][A
Classifiers testing by bootstrap:  20%|██        | 2/10 [00:00<00:01,  4.83it/s][A
Classifiers testing by bootstrap:  30%|███       | 3/10 [00:00<00:01,  3.86it/s][A
Classifiers testing by bootstrap:  40%|████      | 4/10 [00:01<00:01,  3.83it/s][A
Classifiers testing by bootstrap:  50%|█████     | 5/10 [00:01<00:01,  3.53it/s][A
Classifiers testing by bootstrap:  60%|██████    | 6/10 [00:01<00:01,  3.71it/s][A
Classifiers testing by bootstrap:  70%|███████   | 7/10 [00:01<00:00,  3.74it/s][A
Classifiers testing by bootstrap:  80%|████████  | 8/10 [00:02<00:00,  3.65it/s][A
Classifiers testing by bootstrap:  90%|█████████ | 9/10 [00:02<00:00,  3.36it/s][A
Classifiers testing by bootstrap: 100%|██████████| 10/10 [00:02<00:00,  3.60it/s][A
2023-01-24 01:47:34 abstract_overall_variance_analyzer.py INFO    : Successfully t





2023-01-24 01:47:35 abstract_overall_variance_analyzer.py INFO    : Successfully computed predict proba metrics




##############################  Stability metrics  ##############################
General Ensemble Accuracy: 0.81
Mean: 0.5216
Std: 0.0673
IQR: 0.0795
Entropy: 0.0
Jitter: 0.086
Per sample accuracy: 0.7994
Label stability: 0.8866




Analyze models in one run: 100%|██████████| 5/5 [01:13<00:00, 14.75s/it]








Analyze models in one run:   0%|          | 0/5 [00:00<?, ?it/s]2023-01-24 01:47:37 abstract_overall_variance_analyzer.py INFO    : Start classifiers testing by bootstrap


##############################  [Model 1 / 5] Analyze DecisionTreeClassifier  ##############################
Model random_state:  401
Baseline X_train shape:  (16000, 16)
Baseline X_test shape:  (4000, 16)





Classifiers testing by bootstrap:   0%|          | 0/10 [00:00<?, ?it/s][A
Classifiers testing by bootstrap:  30%|███       | 3/10 [00:00<00:00, 29.58it/s][A
Classifiers testing by bootstrap: 100%|██████████| 10/10 [00:00<00:00, 32.27it/s][A
2023-01-24 01:47:37 abstract_overall_variance_analyzer.py INFO    : Successfully tested classifiers by bootstrap






2023-01-24 01:47:38 abstract_overall_variance_analyzer.py INFO    : Successfully computed predict proba metrics




##############################  Stability metrics  ##############################
General Ensemble Accuracy: 0.8225
Mean: 0.5587
Std: 0.0518
IQR: 0.0547
Entropy: 0.0
Jitter: 0.0496
Per sample accuracy: 0.8182
Label stability: 0.9364




Analyze models in one run:  20%|██        | 1/5 [00:03<00:13,  3.31s/it]2023-01-24 01:47:40 abstract_overall_variance_analyzer.py INFO    : Start classifiers testing by bootstrap






##############################  [Model 2 / 5] Analyze LogisticRegression  ##############################
Model random_state:  402
Baseline X_train shape:  (16000, 16)
Baseline X_test shape:  (4000, 16)





Classifiers testing by bootstrap:   0%|          | 0/10 [00:00<?, ?it/s][A
Classifiers testing by bootstrap:  10%|█         | 1/10 [00:00<00:02,  3.02it/s][A
Classifiers testing by bootstrap:  20%|██        | 2/10 [00:00<00:03,  2.09it/s][A
Classifiers testing by bootstrap:  30%|███       | 3/10 [00:01<00:03,  1.99it/s][A
Classifiers testing by bootstrap:  40%|████      | 4/10 [00:02<00:03,  1.79it/s][A
Classifiers testing by bootstrap:  50%|█████     | 5/10 [00:02<00:02,  1.73it/s][A
Classifiers testing by bootstrap:  60%|██████    | 6/10 [00:03<00:02,  1.79it/s][A
Classifiers testing by bootstrap:  70%|███████   | 7/10 [00:03<00:01,  1.82it/s][A
Classifiers testing by bootstrap:  80%|████████  | 8/10 [00:04<00:01,  1.82it/s][A
Classifiers testing by bootstrap:  90%|█████████ | 9/10 [00:04<00:00,  1.80it/s][A
Classifiers testing by bootstrap: 100%|██████████| 10/10 [00:05<00:00,  1.80it/s][A
2023-01-24 01:47:46 abstract_overall_variance_analyzer.py INFO    : Successfully t





2023-01-24 01:47:47 abstract_overall_variance_analyzer.py INFO    : Successfully computed predict proba metrics




##############################  Stability metrics  ##############################
General Ensemble Accuracy: 0.8105
Mean: 0.5535
Std: 0.0215
IQR: 0.0253
Entropy: 0.0
Jitter: 0.0313
Per sample accuracy: 0.8108
Label stability: 0.9589




Analyze models in one run:  40%|████      | 2/5 [00:12<00:19,  6.51s/it]2023-01-24 01:47:49 abstract_overall_variance_analyzer.py INFO    : Start classifiers testing by bootstrap






##############################  [Model 3 / 5] Analyze RandomForestClassifier  ##############################
Model random_state:  403
Baseline X_train shape:  (16000, 16)
Baseline X_test shape:  (4000, 16)





Classifiers testing by bootstrap:   0%|          | 0/10 [00:00<?, ?it/s][A
Classifiers testing by bootstrap:  10%|█         | 1/10 [00:01<00:13,  1.51s/it][A
Classifiers testing by bootstrap:  20%|██        | 2/10 [00:03<00:12,  1.53s/it][A
Classifiers testing by bootstrap:  30%|███       | 3/10 [00:04<00:10,  1.52s/it][A
Classifiers testing by bootstrap:  40%|████      | 4/10 [00:06<00:09,  1.57s/it][A
Classifiers testing by bootstrap:  50%|█████     | 5/10 [00:07<00:07,  1.55s/it][A
Classifiers testing by bootstrap:  60%|██████    | 6/10 [00:09<00:06,  1.52s/it][A
Classifiers testing by bootstrap:  70%|███████   | 7/10 [00:10<00:04,  1.53s/it][A
Classifiers testing by bootstrap:  80%|████████  | 8/10 [00:12<00:03,  1.59s/it][A
Classifiers testing by bootstrap:  90%|█████████ | 9/10 [00:14<00:01,  1.61s/it][A
Classifiers testing by bootstrap: 100%|██████████| 10/10 [00:15<00:00,  1.56s/it][A
2023-01-24 01:48:05 abstract_overall_variance_analyzer.py INFO    : Successfully t





2023-01-24 01:48:06 abstract_overall_variance_analyzer.py INFO    : Successfully computed predict proba metrics




##############################  Stability metrics  ##############################
General Ensemble Accuracy: 0.8258
Mean: 0.5502
Std: 0.0331
IQR: 0.0392
Entropy: 0.0
Jitter: 0.0358
Per sample accuracy: 0.8223
Label stability: 0.9542




Analyze models in one run:  60%|██████    | 3/5 [00:30<00:24, 12.14s/it]2023-01-24 01:48:08 abstract_overall_variance_analyzer.py INFO    : Start classifiers testing by bootstrap






##############################  [Model 4 / 5] Analyze XGBClassifier  ##############################
Model random_state:  404
Baseline X_train shape:  (16000, 16)
Baseline X_test shape:  (4000, 16)





Classifiers testing by bootstrap:   0%|          | 0/10 [00:00<?, ?it/s][A
Classifiers testing by bootstrap:  10%|█         | 1/10 [00:01<00:14,  1.58s/it][A
Classifiers testing by bootstrap:  20%|██        | 2/10 [00:04<00:17,  2.15s/it][A
Classifiers testing by bootstrap:  30%|███       | 3/10 [00:06<00:14,  2.06s/it][A
Classifiers testing by bootstrap:  40%|████      | 4/10 [00:08<00:12,  2.01s/it][A
Classifiers testing by bootstrap:  50%|█████     | 5/10 [00:10<00:10,  2.09s/it][A
Classifiers testing by bootstrap:  60%|██████    | 6/10 [00:12<00:08,  2.12s/it][A
Classifiers testing by bootstrap:  70%|███████   | 7/10 [00:14<00:05,  1.99s/it][A
Classifiers testing by bootstrap:  80%|████████  | 8/10 [00:15<00:03,  1.93s/it][A
Classifiers testing by bootstrap:  90%|█████████ | 9/10 [00:18<00:02,  2.15s/it][A
Classifiers testing by bootstrap: 100%|██████████| 10/10 [00:20<00:00,  2.03s/it][A
2023-01-24 01:48:28 abstract_overall_variance_analyzer.py INFO    : Successfully t





2023-01-24 01:48:29 abstract_overall_variance_analyzer.py INFO    : Successfully computed predict proba metrics




##############################  Stability metrics  ##############################
General Ensemble Accuracy: 0.8358
Mean: 0.5471000075340271
Std: 0.027899999171495438
IQR: 0.0331
Entropy: 0.0
Jitter: 0.0267
Per sample accuracy: 0.8357
Label stability: 0.9655




Analyze models in one run:  80%|████████  | 4/5 [00:54<00:16, 16.71s/it]2023-01-24 01:48:32 abstract_overall_variance_analyzer.py INFO    : Start classifiers testing by bootstrap






##############################  [Model 5 / 5] Analyze KNeighborsClassifier  ##############################
Model random_state:  None
Baseline X_train shape:  (16000, 16)
Baseline X_test shape:  (4000, 16)





Classifiers testing by bootstrap:   0%|          | 0/10 [00:00<?, ?it/s][A
Classifiers testing by bootstrap:  10%|█         | 1/10 [00:00<00:01,  5.27it/s][A
Classifiers testing by bootstrap:  20%|██        | 2/10 [00:00<00:01,  5.09it/s][A
Classifiers testing by bootstrap:  30%|███       | 3/10 [00:00<00:01,  4.66it/s][A
Classifiers testing by bootstrap:  40%|████      | 4/10 [00:00<00:01,  4.45it/s][A
Classifiers testing by bootstrap:  50%|█████     | 5/10 [00:01<00:01,  4.07it/s][A
Classifiers testing by bootstrap:  60%|██████    | 6/10 [00:01<00:00,  4.13it/s][A
Classifiers testing by bootstrap:  70%|███████   | 7/10 [00:01<00:00,  3.99it/s][A
Classifiers testing by bootstrap:  80%|████████  | 8/10 [00:01<00:00,  4.09it/s][A
Classifiers testing by bootstrap:  90%|█████████ | 9/10 [00:02<00:00,  3.78it/s][A
Classifiers testing by bootstrap: 100%|██████████| 10/10 [00:02<00:00,  4.12it/s][A
2023-01-24 01:48:34 abstract_overall_variance_analyzer.py INFO    : Successfully t





2023-01-24 01:48:35 abstract_overall_variance_analyzer.py INFO    : Successfully computed predict proba metrics




##############################  Stability metrics  ##############################
General Ensemble Accuracy: 0.8088
Mean: 0.5301
Std: 0.0668
IQR: 0.0808
Entropy: 0.0
Jitter: 0.085
Per sample accuracy: 0.8002
Label stability: 0.8892




Analyze models in one run: 100%|██████████| 5/5 [01:00<00:00, 12.05s/it]








Analyze models in one run:   0%|          | 0/5 [00:00<?, ?it/s]2023-01-24 01:48:37 abstract_overall_variance_analyzer.py INFO    : Start classifiers testing by bootstrap


##############################  [Model 1 / 5] Analyze DecisionTreeClassifier  ##############################
Model random_state:  501
Baseline X_train shape:  (16000, 16)
Baseline X_test shape:  (4000, 16)





Classifiers testing by bootstrap:   0%|          | 0/10 [00:00<?, ?it/s][A
Classifiers testing by bootstrap:  40%|████      | 4/10 [00:00<00:00, 33.18it/s][A
Classifiers testing by bootstrap: 100%|██████████| 10/10 [00:00<00:00, 33.80it/s][A
2023-01-24 01:48:38 abstract_overall_variance_analyzer.py INFO    : Successfully tested classifiers by bootstrap






2023-01-24 01:48:38 abstract_overall_variance_analyzer.py INFO    : Successfully computed predict proba metrics




##############################  Stability metrics  ##############################
General Ensemble Accuracy: 0.8168
Mean: 0.5526
Std: 0.0657
IQR: 0.0667
Entropy: 0.0
Jitter: 0.0671
Per sample accuracy: 0.8065
Label stability: 0.9138




Analyze models in one run:  20%|██        | 1/5 [00:03<00:12,  3.24s/it]2023-01-24 01:48:41 abstract_overall_variance_analyzer.py INFO    : Start classifiers testing by bootstrap






##############################  [Model 2 / 5] Analyze LogisticRegression  ##############################
Model random_state:  502
Baseline X_train shape:  (16000, 16)
Baseline X_test shape:  (4000, 16)





Classifiers testing by bootstrap:   0%|          | 0/10 [00:00<?, ?it/s][A
Classifiers testing by bootstrap:  10%|█         | 1/10 [00:00<00:03,  2.67it/s][A
Classifiers testing by bootstrap:  20%|██        | 2/10 [00:00<00:03,  2.21it/s][A
Classifiers testing by bootstrap:  30%|███       | 3/10 [00:01<00:03,  2.00it/s][A
Classifiers testing by bootstrap:  40%|████      | 4/10 [00:02<00:03,  1.55it/s][A
Classifiers testing by bootstrap:  50%|█████     | 5/10 [00:02<00:03,  1.52it/s][A
Classifiers testing by bootstrap:  60%|██████    | 6/10 [00:03<00:02,  1.67it/s][A
Classifiers testing by bootstrap:  70%|███████   | 7/10 [00:04<00:01,  1.73it/s][A
Classifiers testing by bootstrap:  80%|████████  | 8/10 [00:04<00:01,  1.77it/s][A
Classifiers testing by bootstrap:  90%|█████████ | 9/10 [00:05<00:00,  1.79it/s][A
Classifiers testing by bootstrap: 100%|██████████| 10/10 [00:05<00:00,  1.77it/s][A
2023-01-24 01:48:46 abstract_overall_variance_analyzer.py INFO    : Successfully t





2023-01-24 01:48:47 abstract_overall_variance_analyzer.py INFO    : Successfully computed predict proba metrics




##############################  Stability metrics  ##############################
General Ensemble Accuracy: 0.8152
Mean: 0.5543
Std: 0.0214
IQR: 0.0258
Entropy: 0.0
Jitter: 0.0284
Per sample accuracy: 0.8131
Label stability: 0.9623




Analyze models in one run:  40%|████      | 2/5 [00:11<00:19,  6.46s/it]2023-01-24 01:48:49 abstract_overall_variance_analyzer.py INFO    : Start classifiers testing by bootstrap






##############################  [Model 3 / 5] Analyze RandomForestClassifier  ##############################
Model random_state:  503
Baseline X_train shape:  (16000, 16)
Baseline X_test shape:  (4000, 16)





Classifiers testing by bootstrap:   0%|          | 0/10 [00:00<?, ?it/s][A
Classifiers testing by bootstrap:  10%|█         | 1/10 [00:01<00:14,  1.56s/it][A
Classifiers testing by bootstrap:  20%|██        | 2/10 [00:03<00:12,  1.51s/it][A
Classifiers testing by bootstrap:  30%|███       | 3/10 [00:04<00:10,  1.49s/it][A
Classifiers testing by bootstrap:  40%|████      | 4/10 [00:06<00:09,  1.56s/it][A
Classifiers testing by bootstrap:  50%|█████     | 5/10 [00:07<00:07,  1.58s/it][A
Classifiers testing by bootstrap:  60%|██████    | 6/10 [00:09<00:06,  1.59s/it][A
Classifiers testing by bootstrap:  70%|███████   | 7/10 [00:11<00:04,  1.60s/it][A
Classifiers testing by bootstrap:  80%|████████  | 8/10 [00:12<00:03,  1.62s/it][A
Classifiers testing by bootstrap:  90%|█████████ | 9/10 [00:14<00:01,  1.58s/it][A
Classifiers testing by bootstrap: 100%|██████████| 10/10 [00:15<00:00,  1.56s/it][A
2023-01-24 01:49:05 abstract_overall_variance_analyzer.py INFO    : Successfully t





2023-01-24 01:49:06 abstract_overall_variance_analyzer.py INFO    : Successfully computed predict proba metrics




##############################  Stability metrics  ##############################
General Ensemble Accuracy: 0.8358
Mean: 0.5482
Std: 0.0341
IQR: 0.0409
Entropy: 0.0
Jitter: 0.0353
Per sample accuracy: 0.8313
Label stability: 0.955




Analyze models in one run:  60%|██████    | 3/5 [00:30<00:24, 12.05s/it]2023-01-24 01:49:08 abstract_overall_variance_analyzer.py INFO    : Start classifiers testing by bootstrap






##############################  [Model 4 / 5] Analyze XGBClassifier  ##############################
Model random_state:  504
Baseline X_train shape:  (16000, 16)
Baseline X_test shape:  (4000, 16)





Classifiers testing by bootstrap:   0%|          | 0/10 [00:00<?, ?it/s][A
Classifiers testing by bootstrap:  10%|█         | 1/10 [00:01<00:14,  1.61s/it][A
Classifiers testing by bootstrap:  20%|██        | 2/10 [00:03<00:13,  1.72s/it][A
Classifiers testing by bootstrap:  30%|███       | 3/10 [00:06<00:17,  2.54s/it][A
Classifiers testing by bootstrap:  40%|████      | 4/10 [00:08<00:13,  2.21s/it][A
Classifiers testing by bootstrap:  50%|█████     | 5/10 [00:11<00:12,  2.45s/it][A
Classifiers testing by bootstrap:  60%|██████    | 6/10 [00:13<00:08,  2.24s/it][A
Classifiers testing by bootstrap:  70%|███████   | 7/10 [00:15<00:06,  2.07s/it][A
Classifiers testing by bootstrap:  80%|████████  | 8/10 [00:17<00:04,  2.29s/it][A
Classifiers testing by bootstrap:  90%|█████████ | 9/10 [00:19<00:02,  2.13s/it][A
Classifiers testing by bootstrap: 100%|██████████| 10/10 [00:21<00:00,  2.14s/it][A
2023-01-24 01:49:29 abstract_overall_variance_analyzer.py INFO    : Successfully t





2023-01-24 01:49:30 abstract_overall_variance_analyzer.py INFO    : Successfully computed predict proba metrics




##############################  Stability metrics  ##############################
General Ensemble Accuracy: 0.838
Mean: 0.555400013923645
Std: 0.028699999675154686
IQR: 0.0346
Entropy: 0.0
Jitter: 0.0298
Per sample accuracy: 0.8346
Label stability: 0.9614




Analyze models in one run:  80%|████████  | 4/5 [00:55<00:17, 17.05s/it]2023-01-24 01:49:33 abstract_overall_variance_analyzer.py INFO    : Start classifiers testing by bootstrap






##############################  [Model 5 / 5] Analyze KNeighborsClassifier  ##############################
Model random_state:  None
Baseline X_train shape:  (16000, 16)
Baseline X_test shape:  (4000, 16)





Classifiers testing by bootstrap:   0%|          | 0/10 [00:00<?, ?it/s][A
Classifiers testing by bootstrap:  10%|█         | 1/10 [00:00<00:04,  1.98it/s][A
Classifiers testing by bootstrap:  20%|██        | 2/10 [00:00<00:02,  2.80it/s][A
Classifiers testing by bootstrap:  30%|███       | 3/10 [00:01<00:02,  3.28it/s][A
Classifiers testing by bootstrap:  40%|████      | 4/10 [00:01<00:01,  3.50it/s][A
Classifiers testing by bootstrap:  50%|█████     | 5/10 [00:01<00:01,  3.75it/s][A
Classifiers testing by bootstrap:  60%|██████    | 6/10 [00:01<00:01,  3.76it/s][A
Classifiers testing by bootstrap:  70%|███████   | 7/10 [00:01<00:00,  3.91it/s][A
Classifiers testing by bootstrap:  80%|████████  | 8/10 [00:02<00:00,  3.87it/s][A
Classifiers testing by bootstrap:  90%|█████████ | 9/10 [00:02<00:00,  4.02it/s][A
Classifiers testing by bootstrap: 100%|██████████| 10/10 [00:02<00:00,  3.61it/s][A
2023-01-24 01:49:35 abstract_overall_variance_analyzer.py INFO    : Successfully t





2023-01-24 01:49:36 abstract_overall_variance_analyzer.py INFO    : Successfully computed predict proba metrics




##############################  Stability metrics  ##############################
General Ensemble Accuracy: 0.8042
Mean: 0.5207
Std: 0.068
IQR: 0.0817
Entropy: 0.0
Jitter: 0.0845
Per sample accuracy: 0.7961
Label stability: 0.8908




Analyze models in one run: 100%|██████████| 5/5 [01:01<00:00, 12.26s/it]








Analyze models in one run:   0%|          | 0/5 [00:00<?, ?it/s]2023-01-24 01:49:39 abstract_overall_variance_analyzer.py INFO    : Start classifiers testing by bootstrap


##############################  [Model 1 / 5] Analyze DecisionTreeClassifier  ##############################
Model random_state:  601
Baseline X_train shape:  (16000, 16)
Baseline X_test shape:  (4000, 16)





Classifiers testing by bootstrap:   0%|          | 0/10 [00:00<?, ?it/s][A
Classifiers testing by bootstrap:  40%|████      | 4/10 [00:00<00:00, 31.92it/s][A
Classifiers testing by bootstrap: 100%|██████████| 10/10 [00:00<00:00, 32.86it/s][A
2023-01-24 01:49:39 abstract_overall_variance_analyzer.py INFO    : Successfully tested classifiers by bootstrap






2023-01-24 01:49:40 abstract_overall_variance_analyzer.py INFO    : Successfully computed predict proba metrics




##############################  Stability metrics  ##############################
General Ensemble Accuracy: 0.8215
Mean: 0.5443
Std: 0.0567
IQR: 0.059
Entropy: 0.0
Jitter: 0.0276
Per sample accuracy: 0.8172
Label stability: 0.9667




Analyze models in one run:  20%|██        | 1/5 [00:03<00:13,  3.43s/it]2023-01-24 01:49:42 abstract_overall_variance_analyzer.py INFO    : Start classifiers testing by bootstrap






##############################  [Model 2 / 5] Analyze LogisticRegression  ##############################
Model random_state:  602
Baseline X_train shape:  (16000, 16)
Baseline X_test shape:  (4000, 16)





Classifiers testing by bootstrap:   0%|          | 0/10 [00:00<?, ?it/s][A
Classifiers testing by bootstrap:  10%|█         | 1/10 [00:00<00:06,  1.49it/s][A
Classifiers testing by bootstrap:  20%|██        | 2/10 [00:01<00:05,  1.49it/s][A
Classifiers testing by bootstrap:  30%|███       | 3/10 [00:01<00:04,  1.62it/s][A
Classifiers testing by bootstrap:  40%|████      | 4/10 [00:02<00:03,  1.67it/s][A
Classifiers testing by bootstrap:  50%|█████     | 5/10 [00:02<00:02,  1.74it/s][A
Classifiers testing by bootstrap:  60%|██████    | 6/10 [00:03<00:02,  1.81it/s][A
Classifiers testing by bootstrap:  70%|███████   | 7/10 [00:04<00:01,  1.82it/s][A
Classifiers testing by bootstrap:  80%|████████  | 8/10 [00:04<00:01,  1.87it/s][A
Classifiers testing by bootstrap:  90%|█████████ | 9/10 [00:05<00:00,  1.93it/s][A
Classifiers testing by bootstrap: 100%|██████████| 10/10 [00:05<00:00,  1.80it/s][A
2023-01-24 01:49:48 abstract_overall_variance_analyzer.py INFO    : Successfully t





2023-01-24 01:49:49 abstract_overall_variance_analyzer.py INFO    : Successfully computed predict proba metrics




##############################  Stability metrics  ##############################
General Ensemble Accuracy: 0.8025
Mean: 0.5463
Std: 0.0238
IQR: 0.029
Entropy: 0.0
Jitter: 0.0317
Per sample accuracy: 0.8029
Label stability: 0.9589




Analyze models in one run:  40%|████      | 2/5 [00:12<00:19,  6.60s/it]2023-01-24 01:49:51 abstract_overall_variance_analyzer.py INFO    : Start classifiers testing by bootstrap






##############################  [Model 3 / 5] Analyze RandomForestClassifier  ##############################
Model random_state:  603
Baseline X_train shape:  (16000, 16)
Baseline X_test shape:  (4000, 16)





Classifiers testing by bootstrap:   0%|          | 0/10 [00:00<?, ?it/s][A
Classifiers testing by bootstrap:  10%|█         | 1/10 [00:01<00:13,  1.45s/it][A
Classifiers testing by bootstrap:  20%|██        | 2/10 [00:03<00:12,  1.52s/it][A
Classifiers testing by bootstrap:  30%|███       | 3/10 [00:04<00:11,  1.58s/it][A
Classifiers testing by bootstrap:  40%|████      | 4/10 [00:06<00:09,  1.53s/it][A
Classifiers testing by bootstrap:  50%|█████     | 5/10 [00:07<00:07,  1.50s/it][A
Classifiers testing by bootstrap:  60%|██████    | 6/10 [00:09<00:05,  1.49s/it][A
Classifiers testing by bootstrap:  70%|███████   | 7/10 [00:10<00:04,  1.55s/it][A
Classifiers testing by bootstrap:  80%|████████  | 8/10 [00:12<00:03,  1.54s/it][A
Classifiers testing by bootstrap:  90%|█████████ | 9/10 [00:13<00:01,  1.52s/it][A
Classifiers testing by bootstrap: 100%|██████████| 10/10 [00:15<00:00,  1.52s/it][A
2023-01-24 01:50:06 abstract_overall_variance_analyzer.py INFO    : Successfully t





2023-01-24 01:50:07 abstract_overall_variance_analyzer.py INFO    : Successfully computed predict proba metrics




##############################  Stability metrics  ##############################
General Ensemble Accuracy: 0.8362
Mean: 0.5487
Std: 0.0344
IQR: 0.0409
Entropy: 0.0
Jitter: 0.0378
Per sample accuracy: 0.8303
Label stability: 0.9512




Analyze models in one run:  60%|██████    | 3/5 [00:30<00:23, 11.90s/it]2023-01-24 01:50:09 abstract_overall_variance_analyzer.py INFO    : Start classifiers testing by bootstrap






##############################  [Model 4 / 5] Analyze XGBClassifier  ##############################
Model random_state:  604
Baseline X_train shape:  (16000, 16)
Baseline X_test shape:  (4000, 16)





Classifiers testing by bootstrap:   0%|          | 0/10 [00:00<?, ?it/s][A
Classifiers testing by bootstrap:  10%|█         | 1/10 [00:01<00:14,  1.64s/it][A
Classifiers testing by bootstrap:  20%|██        | 2/10 [00:04<00:18,  2.31s/it][A
Classifiers testing by bootstrap:  30%|███       | 3/10 [00:06<00:14,  2.05s/it][A
Classifiers testing by bootstrap:  40%|████      | 4/10 [00:08<00:11,  1.98s/it][A
Classifiers testing by bootstrap:  50%|█████     | 5/10 [00:10<00:11,  2.23s/it][A
Classifiers testing by bootstrap:  60%|██████    | 6/10 [00:12<00:08,  2.06s/it][A
Classifiers testing by bootstrap:  70%|███████   | 7/10 [00:14<00:06,  2.04s/it][A
Classifiers testing by bootstrap:  80%|████████  | 8/10 [00:17<00:04,  2.24s/it][A
Classifiers testing by bootstrap:  90%|█████████ | 9/10 [00:18<00:02,  2.09s/it][A
Classifiers testing by bootstrap: 100%|██████████| 10/10 [00:20<00:00,  2.06s/it][A
2023-01-24 01:50:30 abstract_overall_variance_analyzer.py INFO    : Successfully t





2023-01-24 01:50:31 abstract_overall_variance_analyzer.py INFO    : Successfully computed predict proba metrics




##############################  Stability metrics  ##############################
General Ensemble Accuracy: 0.8248
Mean: 0.5422999858856201
Std: 0.028599999845027924
IQR: 0.0345
Entropy: 0.0
Jitter: 0.0296
Per sample accuracy: 0.8236
Label stability: 0.9626




Analyze models in one run:  80%|████████  | 4/5 [00:54<00:16, 16.64s/it]2023-01-24 01:50:33 abstract_overall_variance_analyzer.py INFO    : Start classifiers testing by bootstrap






##############################  [Model 5 / 5] Analyze KNeighborsClassifier  ##############################
Model random_state:  None
Baseline X_train shape:  (16000, 16)
Baseline X_test shape:  (4000, 16)





Classifiers testing by bootstrap:   0%|          | 0/10 [00:00<?, ?it/s][A
Classifiers testing by bootstrap:  10%|█         | 1/10 [00:00<00:01,  5.84it/s][A
Classifiers testing by bootstrap:  20%|██        | 2/10 [00:00<00:01,  4.84it/s][A
Classifiers testing by bootstrap:  30%|███       | 3/10 [00:00<00:01,  4.73it/s][A
Classifiers testing by bootstrap:  40%|████      | 4/10 [00:00<00:01,  4.26it/s][A
Classifiers testing by bootstrap:  50%|█████     | 5/10 [00:01<00:01,  4.19it/s][A
Classifiers testing by bootstrap:  60%|██████    | 6/10 [00:01<00:01,  3.94it/s][A
Classifiers testing by bootstrap:  70%|███████   | 7/10 [00:01<00:00,  4.15it/s][A
Classifiers testing by bootstrap:  80%|████████  | 8/10 [00:01<00:00,  3.94it/s][A
Classifiers testing by bootstrap:  90%|█████████ | 9/10 [00:02<00:00,  3.85it/s][A
Classifiers testing by bootstrap: 100%|██████████| 10/10 [00:02<00:00,  4.06it/s][A
2023-01-24 01:50:35 abstract_overall_variance_analyzer.py INFO    : Successfully t





2023-01-24 01:50:36 abstract_overall_variance_analyzer.py INFO    : Successfully computed predict proba metrics




##############################  Stability metrics  ##############################
General Ensemble Accuracy: 0.811
Mean: 0.5283
Std: 0.0669
IQR: 0.0811
Entropy: 0.1261
Jitter: 0.0916
Per sample accuracy: 0.8039
Label stability: 0.881




Analyze models in one run: 100%|██████████| 5/5 [01:00<00:00, 12.01s/it]








