# Experiment Eurythmy Letter

In [1]:
from PlantReactivityAnalysis.features.features_dataset import FeaturesDataset
from PlantReactivityAnalysis.models.experiment import Experiment
import PlantReactivityAnalysis.models.get_dataset as gd
import PlantReactivityAnalysis.models.parameters as param
from PlantReactivityAnalysis.config import PROCESSED_DATA_DIR

In [2]:
import numpy as np
import pandas as pd
# Lift pandas' display truncation so wide/long result tables are shown in full.
for _display_option in ("display.max_columns", "display.max_rows"):
    pd.set_option(_display_option, None)

# Preparation

In [3]:
# Experiment configuration: every value a reader might tune lives in this cell.

# Passed to gd.collect_all_rqs_data as corr_threshold and pca_dim respectively.
ct = 0.8
pca = 60

# ws / hl select which pre-computed feature files are loaded (they are part of
# the file names below). Presumably window size and hop length -- TODO confirm.
ws = 1
hl = 0.5

# Research questions to build datasets for.
rqs = [1, 2]

# Dataset variant identifiers.
datasets_ids = [1, 2, 3, 4, 5, 7, 9, 10, 11, 12, 13, 15]

# Feature-file paths are derived from ws / hl so the two cannot drift apart;
# with ws=1 and hl=0.5 these are exactly the previously hard-coded
# "..._letters_1_0.5_dataset.pkl" paths.
norm_path = f"../data/processed/feat_norm_letters_{ws}_{hl}_dataset.pkl"
raw_path = f"../data/processed/feat_raw_letters_{ws}_{hl}_dataset.pkl"

In [4]:
# Load the normalised and raw feature files and build the datasets for the
# configured research questions, using the correlation threshold and PCA
# dimension from the configuration cell.
datasets = gd.collect_all_rqs_data(
    norm_path,
    raw_path,
    rqs,
    corr_threshold=ct,
    pca_dim=pca,
)


PROCESSING DATASET 1
Removing columns with NaN values: ['skewness', 'kurtosis']

# Research Question:  1
-Train distribution-
Counts and Percentages:
Class 1: Count = 3576, Percentage = 50.35%
Class 0: Count = 3526, Percentage = 49.65%
-Test distribution-
Counts and Percentages:
Class 1: Count = 907, Percentage = 51.07%
Class 0: Count = 869, Percentage = 48.93%
Reduced variable features from initial count to 46.
Reduced features based on correlation threshold of 0.8
Variable features were properly normalized using 'zscore' method.
Applied z-score normalization.

# Research Question:  2
-Train distribution-
Counts and Percentages:
Class 2: Count = 1013, Percentage = 33.59%
Class 0: Count = 1004, Percentage = 33.29%
Class 1: Count = 999, Percentage = 33.12%
-Test distribution-
Counts and Percentages:
Class 0: Count = 257, Percentage = 34.04%
Class 1: Count = 256, Percentage = 33.91%
Class 2: Count = 242, Percentage = 32.05%
Reduced variable features from initial count to 43.
Reduced fea

# RQX: run all models for each dataset and research question

In [5]:
%%time

# Dataset ids whose entries unpack as a (train_df, test_df) pair and are handed
# to Experiment together with 'target' (presumably the label column -- TODO
# confirm). Any other id is unpacked as four objects (features and targets for
# train and test) and goes through Experiment.from_arrays.
dataframe_dataset_ids = (1, 2, 3, 4, 5, 7)

# Dataset ids evaluated with the no-scaling parameter grid; all others use the
# default grid.
no_scaling_dataset_ids = (2, 4, 6, 8, 10, 12, 14, 16)

# NOTE(review): only the DataFrame-based datasets are run here, although the
# configuration cell lists more ids in `datasets_ids` -- confirm this is intended.
datasets_to_run = dataframe_dataset_ids

# results[dataset_id][rq] holds `experiment.results` for that combination.
results = {}

for ds in datasets_to_run:
    print(f"Now processing Dataset {ds}...")
    results[ds] = {}

    # Iterate over the configured research questions (the same `rqs` list that
    # was used to build `datasets`) instead of a second hard-coded [1, 2].
    for rq in rqs:
        print(f"  Processing RQ {rq} within Dataset {ds}...")

        if ds in dataframe_dataset_ids:
            train_df, test_df = datasets[ds][rq]
            experiment = Experiment(train_df, test_df, 'target')
        else:
            train_df, train_targets, test_df, test_targets = datasets[ds][rq]
            experiment = Experiment.from_arrays(train_df, train_targets, test_df, test_targets)

        # Pick the hyper-parameter grid that matches this dataset variant.
        if ds in no_scaling_dataset_ids:
            parameter_grid = param.PARAMETER_GRID_NO_SCALING
        else:
            parameter_grid = param.PARAMETER_GRID
        experiment.run_all_models(parameter_grid)

        # Keep the outcome addressable by dataset id and research question.
        results[ds][rq] = experiment.results

Now processing Dataset 1...
  Processing RQ 1 within Dataset 1...
Running experiments for svm with params: {'C': 0.1, 'gamma': 'scale', 'kernel': 'linear'}




Running experiments for svm with params: {'C': 0.1, 'gamma': 'scale', 'kernel': 'rbf'}




Running experiments for svm with params: {'C': 0.1, 'gamma': 'auto', 'kernel': 'linear'}




Running experiments for svm with params: {'C': 0.1, 'gamma': 'auto', 'kernel': 'rbf'}




Running experiments for svm with params: {'C': 1, 'gamma': 'scale', 'kernel': 'linear'}




Running experiments for svm with params: {'C': 1, 'gamma': 'scale', 'kernel': 'rbf'}




Running experiments for svm with params: {'C': 1, 'gamma': 'auto', 'kernel': 'linear'}




Running experiments for svm with params: {'C': 1, 'gamma': 'auto', 'kernel': 'rbf'}




Running experiments for svm with params: {'C': 10, 'gamma': 'scale', 'kernel': 'linear'}




Running experiments for svm with params: {'C': 10, 'gamma': 'scale', 'kernel': 'rbf'}




Running experiments for svm with params: {'C': 10, 'gamma': 'auto', 'kernel': 'linear'}




Running experiments for svm with params: {'C': 10, 'gamma': 'auto', 'kernel': 'rbf'}




Running experiments for randomforest with params: {'max_depth': None, 'min_samples_split': 2, 'n_estimators': 100}




Running experiments for randomforest with params: {'max_depth': None, 'min_samples_split': 2, 'n_estimators': 200}




Running experiments for randomforest with params: {'max_depth': None, 'min_samples_split': 2, 'n_estimators': 300}




Running experiments for randomforest with params: {'max_depth': None, 'min_samples_split': 5, 'n_estimators': 100}




Running experiments for randomforest with params: {'max_depth': None, 'min_samples_split': 5, 'n_estimators': 200}




Running experiments for randomforest with params: {'max_depth': None, 'min_samples_split': 5, 'n_estimators': 300}




Running experiments for randomforest with params: {'max_depth': 10, 'min_samples_split': 2, 'n_estimators': 100}




Running experiments for randomforest with params: {'max_depth': 10, 'min_samples_split': 2, 'n_estimators': 200}




Running experiments for randomforest with params: {'max_depth': 10, 'min_samples_split': 2, 'n_estimators': 300}




Running experiments for randomforest with params: {'max_depth': 10, 'min_samples_split': 5, 'n_estimators': 100}




Running experiments for randomforest with params: {'max_depth': 10, 'min_samples_split': 5, 'n_estimators': 200}




Running experiments for randomforest with params: {'max_depth': 10, 'min_samples_split': 5, 'n_estimators': 300}




Running experiments for randomforest with params: {'max_depth': 20, 'min_samples_split': 2, 'n_estimators': 100}




Running experiments for randomforest with params: {'max_depth': 20, 'min_samples_split': 2, 'n_estimators': 200}




Running experiments for randomforest with params: {'max_depth': 20, 'min_samples_split': 2, 'n_estimators': 300}




Running experiments for randomforest with params: {'max_depth': 20, 'min_samples_split': 5, 'n_estimators': 100}




Running experiments for randomforest with params: {'max_depth': 20, 'min_samples_split': 5, 'n_estimators': 200}




Running experiments for randomforest with params: {'max_depth': 20, 'min_samples_split': 5, 'n_estimators': 300}




Running experiments for gradientboosting with params: {'learning_rate': 0.1, 'max_depth': 3, 'n_estimators': 100}




Running experiments for gradientboosting with params: {'learning_rate': 0.1, 'max_depth': 3, 'n_estimators': 200}




Running experiments for gradientboosting with params: {'learning_rate': 0.1, 'max_depth': 5, 'n_estimators': 100}




Running experiments for gradientboosting with params: {'learning_rate': 0.1, 'max_depth': 5, 'n_estimators': 200}




Running experiments for gradientboosting with params: {'learning_rate': 0.05, 'max_depth': 3, 'n_estimators': 100}




Running experiments for gradientboosting with params: {'learning_rate': 0.05, 'max_depth': 3, 'n_estimators': 200}




Running experiments for gradientboosting with params: {'learning_rate': 0.05, 'max_depth': 5, 'n_estimators': 100}




Running experiments for gradientboosting with params: {'learning_rate': 0.05, 'max_depth': 5, 'n_estimators': 200}




Running experiments for extratrees with params: {'max_depth': None, 'min_samples_split': 2, 'n_estimators': 100}




Running experiments for extratrees with params: {'max_depth': None, 'min_samples_split': 2, 'n_estimators': 200}




Running experiments for extratrees with params: {'max_depth': None, 'min_samples_split': 5, 'n_estimators': 100}




Running experiments for extratrees with params: {'max_depth': None, 'min_samples_split': 5, 'n_estimators': 200}




Running experiments for extratrees with params: {'max_depth': 20, 'min_samples_split': 2, 'n_estimators': 100}




Running experiments for extratrees with params: {'max_depth': 20, 'min_samples_split': 2, 'n_estimators': 200}




Running experiments for extratrees with params: {'max_depth': 20, 'min_samples_split': 5, 'n_estimators': 100}




Running experiments for extratrees with params: {'max_depth': 20, 'min_samples_split': 5, 'n_estimators': 200}




Running experiments for gaussiannb with params: {'var_smoothing': 1e-09}
Running experiments for gaussiannb with params: {'var_smoothing': 1e-08}
Running experiments for gaussiannb with params: {'var_smoothing': 1e-10}
Running experiments for adaboost with params: {'learning_rate': 0.1, 'n_estimators': 50}




Running experiments for adaboost with params: {'learning_rate': 0.1, 'n_estimators': 100}




Running experiments for adaboost with params: {'learning_rate': 1.0, 'n_estimators': 50}




Running experiments for adaboost with params: {'learning_rate': 1.0, 'n_estimators': 100}




Running experiments for logisticregression with params: {'C': 0.1, 'solver': 'liblinear'}
Running experiments for logisticregression with params: {'C': 0.1, 'solver': 'lbfgs'}




Running experiments for logisticregression with params: {'C': 1, 'solver': 'liblinear'}
Running experiments for logisticregression with params: {'C': 1, 'solver': 'lbfgs'}




Running experiments for logisticregression with params: {'C': 10, 'solver': 'liblinear'}
Running experiments for logisticregression with params: {'C': 10, 'solver': 'lbfgs'}




Running experiments for kneighbors with params: {'n_neighbors': 5, 'weights': 'uniform'}
Running experiments for kneighbors with params: {'n_neighbors': 5, 'weights': 'distance'}
Running experiments for kneighbors with params: {'n_neighbors': 10, 'weights': 'uniform'}




Running experiments for kneighbors with params: {'n_neighbors': 10, 'weights': 'distance'}




Running experiments for kneighbors with params: {'n_neighbors': 15, 'weights': 'uniform'}




Running experiments for kneighbors with params: {'n_neighbors': 15, 'weights': 'distance'}
Running experiments for lgbm with params: {'learning_rate': 0.1, 'n_estimators': 100, 'num_leaves': 31}




[LightGBM] [Info] Number of positive: 3576, number of negative: 3526
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.003498 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 11381
[LightGBM] [Info] Number of data points in the train set: 7102, number of used features: 45
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.503520 -> initscore=0.014081
[LightGBM] [Info] Start training from score 0.014081
Running experiments for lgbm with params: {'learning_rate': 0.1, 'n_estimators': 100, 'num_leaves': 64}
[LightGBM] [Info] Number of positive: 3576, number of negative: 3526
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002498 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 11381
[LightGBM] [Info] Number of data points in the train set: 7102, number of used features: 45
[LightGBM] [Info] [binary:BoostFromScore]: pavg=



Running experiments for svm with params: {'C': 0.1, 'gamma': 'scale', 'kernel': 'rbf'}




Running experiments for svm with params: {'C': 0.1, 'gamma': 'auto', 'kernel': 'linear'}




Running experiments for svm with params: {'C': 0.1, 'gamma': 'auto', 'kernel': 'rbf'}




Running experiments for svm with params: {'C': 1, 'gamma': 'scale', 'kernel': 'linear'}




Running experiments for svm with params: {'C': 1, 'gamma': 'scale', 'kernel': 'rbf'}




Running experiments for svm with params: {'C': 1, 'gamma': 'auto', 'kernel': 'linear'}




Running experiments for svm with params: {'C': 1, 'gamma': 'auto', 'kernel': 'rbf'}




Running experiments for svm with params: {'C': 10, 'gamma': 'scale', 'kernel': 'linear'}




Running experiments for svm with params: {'C': 10, 'gamma': 'scale', 'kernel': 'rbf'}




Running experiments for svm with params: {'C': 10, 'gamma': 'auto', 'kernel': 'linear'}




Running experiments for svm with params: {'C': 10, 'gamma': 'auto', 'kernel': 'rbf'}




Running experiments for randomforest with params: {'max_depth': None, 'min_samples_split': 2, 'n_estimators': 100}




Running experiments for randomforest with params: {'max_depth': None, 'min_samples_split': 2, 'n_estimators': 200}




Running experiments for randomforest with params: {'max_depth': None, 'min_samples_split': 2, 'n_estimators': 300}




Running experiments for randomforest with params: {'max_depth': None, 'min_samples_split': 5, 'n_estimators': 100}




Running experiments for randomforest with params: {'max_depth': None, 'min_samples_split': 5, 'n_estimators': 200}




Running experiments for randomforest with params: {'max_depth': None, 'min_samples_split': 5, 'n_estimators': 300}




Running experiments for randomforest with params: {'max_depth': 10, 'min_samples_split': 2, 'n_estimators': 100}




Running experiments for randomforest with params: {'max_depth': 10, 'min_samples_split': 2, 'n_estimators': 200}




Running experiments for randomforest with params: {'max_depth': 10, 'min_samples_split': 2, 'n_estimators': 300}




Running experiments for randomforest with params: {'max_depth': 10, 'min_samples_split': 5, 'n_estimators': 100}




Running experiments for randomforest with params: {'max_depth': 10, 'min_samples_split': 5, 'n_estimators': 200}




Running experiments for randomforest with params: {'max_depth': 10, 'min_samples_split': 5, 'n_estimators': 300}




Running experiments for randomforest with params: {'max_depth': 20, 'min_samples_split': 2, 'n_estimators': 100}




Running experiments for randomforest with params: {'max_depth': 20, 'min_samples_split': 2, 'n_estimators': 200}




Running experiments for randomforest with params: {'max_depth': 20, 'min_samples_split': 2, 'n_estimators': 300}




Running experiments for randomforest with params: {'max_depth': 20, 'min_samples_split': 5, 'n_estimators': 100}




Running experiments for randomforest with params: {'max_depth': 20, 'min_samples_split': 5, 'n_estimators': 200}




Running experiments for randomforest with params: {'max_depth': 20, 'min_samples_split': 5, 'n_estimators': 300}




Running experiments for gradientboosting with params: {'learning_rate': 0.1, 'max_depth': 3, 'n_estimators': 100}




Running experiments for gradientboosting with params: {'learning_rate': 0.1, 'max_depth': 3, 'n_estimators': 200}




Running experiments for gradientboosting with params: {'learning_rate': 0.1, 'max_depth': 5, 'n_estimators': 100}




Running experiments for gradientboosting with params: {'learning_rate': 0.1, 'max_depth': 5, 'n_estimators': 200}




Running experiments for gradientboosting with params: {'learning_rate': 0.05, 'max_depth': 3, 'n_estimators': 100}




Running experiments for gradientboosting with params: {'learning_rate': 0.05, 'max_depth': 3, 'n_estimators': 200}




Running experiments for gradientboosting with params: {'learning_rate': 0.05, 'max_depth': 5, 'n_estimators': 100}




Running experiments for gradientboosting with params: {'learning_rate': 0.05, 'max_depth': 5, 'n_estimators': 200}




Running experiments for extratrees with params: {'max_depth': None, 'min_samples_split': 2, 'n_estimators': 100}




Running experiments for extratrees with params: {'max_depth': None, 'min_samples_split': 2, 'n_estimators': 200}




Running experiments for extratrees with params: {'max_depth': None, 'min_samples_split': 5, 'n_estimators': 100}




Running experiments for extratrees with params: {'max_depth': None, 'min_samples_split': 5, 'n_estimators': 200}




Running experiments for extratrees with params: {'max_depth': 20, 'min_samples_split': 2, 'n_estimators': 100}




Running experiments for extratrees with params: {'max_depth': 20, 'min_samples_split': 2, 'n_estimators': 200}




Running experiments for extratrees with params: {'max_depth': 20, 'min_samples_split': 5, 'n_estimators': 100}




Running experiments for extratrees with params: {'max_depth': 20, 'min_samples_split': 5, 'n_estimators': 200}




Running experiments for gaussiannb with params: {'var_smoothing': 1e-09}
Running experiments for gaussiannb with params: {'var_smoothing': 1e-08}
Running experiments for gaussiannb with params: {'var_smoothing': 1e-10}
Running experiments for adaboost with params: {'learning_rate': 0.1, 'n_estimators': 50}




Running experiments for adaboost with params: {'learning_rate': 0.1, 'n_estimators': 100}




Running experiments for adaboost with params: {'learning_rate': 1.0, 'n_estimators': 50}




Running experiments for adaboost with params: {'learning_rate': 1.0, 'n_estimators': 100}




Running experiments for logisticregression with params: {'C': 0.1, 'solver': 'liblinear'}
Running experiments for logisticregression with params: {'C': 0.1, 'solver': 'lbfgs'}




Running experiments for logisticregression with params: {'C': 1, 'solver': 'liblinear'}
Running experiments for logisticregression with params: {'C': 1, 'solver': 'lbfgs'}




Running experiments for logisticregression with params: {'C': 10, 'solver': 'liblinear'}
Running experiments for logisticregression with params: {'C': 10, 'solver': 'lbfgs'}




Running experiments for kneighbors with params: {'n_neighbors': 5, 'weights': 'uniform'}
Running experiments for kneighbors with params: {'n_neighbors': 5, 'weights': 'distance'}




Running experiments for kneighbors with params: {'n_neighbors': 10, 'weights': 'uniform'}
Running experiments for kneighbors with params: {'n_neighbors': 10, 'weights': 'distance'}
Running experiments for kneighbors with params: {'n_neighbors': 15, 'weights': 'uniform'}




Running experiments for kneighbors with params: {'n_neighbors': 15, 'weights': 'distance'}
Running experiments for lgbm with params: {'learning_rate': 0.1, 'n_estimators': 100, 'num_leaves': 31}
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002508 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 10501
[LightGBM] [Info] Number of data points in the train set: 3016, number of used features: 42
[LightGBM] [Info] Start training from score -1.099939
[LightGBM] [Info] Start training from score -1.104932
[LightGBM] [Info] Start training from score -1.091015




Running experiments for lgbm with params: {'learning_rate': 0.1, 'n_estimators': 100, 'num_leaves': 64}
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002350 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 10501
[LightGBM] [Info] Number of data points in the train set: 3016, number of used features: 42
[LightGBM] [Info] Start training from score -1.099939
[LightGBM] [Info] Start training from score -1.104932
[LightGBM] [Info] Start training from score -1.091015
Running experiments for lgbm with params: {'learning_rate': 0.1, 'n_estimators': 200, 'num_leaves': 31}
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002285 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 10501
[LightGBM] [Info] Number of data points in the train set: 3016, number of used features: 42
[LightGBM] [Info] Start training from score -1.09993



Running experiments for randomforest with params: {'max_depth': None, 'min_samples_split': 2, 'n_estimators': 200}




Running experiments for randomforest with params: {'max_depth': None, 'min_samples_split': 2, 'n_estimators': 300}




Running experiments for randomforest with params: {'max_depth': None, 'min_samples_split': 5, 'n_estimators': 100}




Running experiments for randomforest with params: {'max_depth': None, 'min_samples_split': 5, 'n_estimators': 200}




Running experiments for randomforest with params: {'max_depth': None, 'min_samples_split': 5, 'n_estimators': 300}




Running experiments for randomforest with params: {'max_depth': 10, 'min_samples_split': 2, 'n_estimators': 100}




Running experiments for randomforest with params: {'max_depth': 10, 'min_samples_split': 2, 'n_estimators': 200}




Running experiments for randomforest with params: {'max_depth': 10, 'min_samples_split': 2, 'n_estimators': 300}




Running experiments for randomforest with params: {'max_depth': 10, 'min_samples_split': 5, 'n_estimators': 100}




Running experiments for randomforest with params: {'max_depth': 10, 'min_samples_split': 5, 'n_estimators': 200}




Running experiments for randomforest with params: {'max_depth': 10, 'min_samples_split': 5, 'n_estimators': 300}




Running experiments for randomforest with params: {'max_depth': 20, 'min_samples_split': 2, 'n_estimators': 100}




Running experiments for randomforest with params: {'max_depth': 20, 'min_samples_split': 2, 'n_estimators': 200}




Running experiments for randomforest with params: {'max_depth': 20, 'min_samples_split': 2, 'n_estimators': 300}




Running experiments for randomforest with params: {'max_depth': 20, 'min_samples_split': 5, 'n_estimators': 100}




Running experiments for randomforest with params: {'max_depth': 20, 'min_samples_split': 5, 'n_estimators': 200}




Running experiments for randomforest with params: {'max_depth': 20, 'min_samples_split': 5, 'n_estimators': 300}




Running experiments for gradientboosting with params: {'learning_rate': 0.1, 'max_depth': 3, 'n_estimators': 100}




Running experiments for gradientboosting with params: {'learning_rate': 0.1, 'max_depth': 3, 'n_estimators': 200}




Running experiments for gradientboosting with params: {'learning_rate': 0.1, 'max_depth': 5, 'n_estimators': 100}




Running experiments for gradientboosting with params: {'learning_rate': 0.1, 'max_depth': 5, 'n_estimators': 200}




Running experiments for gradientboosting with params: {'learning_rate': 0.05, 'max_depth': 3, 'n_estimators': 100}




Running experiments for gradientboosting with params: {'learning_rate': 0.05, 'max_depth': 3, 'n_estimators': 200}




Running experiments for gradientboosting with params: {'learning_rate': 0.05, 'max_depth': 5, 'n_estimators': 100}




Running experiments for gradientboosting with params: {'learning_rate': 0.05, 'max_depth': 5, 'n_estimators': 200}




Running experiments for extratrees with params: {'max_depth': None, 'min_samples_split': 2, 'n_estimators': 100}




Running experiments for extratrees with params: {'max_depth': None, 'min_samples_split': 2, 'n_estimators': 200}




Running experiments for extratrees with params: {'max_depth': None, 'min_samples_split': 5, 'n_estimators': 100}




Running experiments for extratrees with params: {'max_depth': None, 'min_samples_split': 5, 'n_estimators': 200}




Running experiments for extratrees with params: {'max_depth': 20, 'min_samples_split': 2, 'n_estimators': 100}




Running experiments for extratrees with params: {'max_depth': 20, 'min_samples_split': 2, 'n_estimators': 200}




Running experiments for extratrees with params: {'max_depth': 20, 'min_samples_split': 5, 'n_estimators': 100}




Running experiments for extratrees with params: {'max_depth': 20, 'min_samples_split': 5, 'n_estimators': 200}




Running experiments for gaussiannb with params: {'var_smoothing': 1e-09}
Running experiments for gaussiannb with params: {'var_smoothing': 1e-08}
Running experiments for gaussiannb with params: {'var_smoothing': 1e-10}
Running experiments for adaboost with params: {'learning_rate': 0.1, 'n_estimators': 50}




Running experiments for adaboost with params: {'learning_rate': 0.1, 'n_estimators': 100}




Running experiments for adaboost with params: {'learning_rate': 1.0, 'n_estimators': 50}




Running experiments for adaboost with params: {'learning_rate': 1.0, 'n_estimators': 100}




Running experiments for logisticregression with params: {'C': 0.1, 'solver': 'liblinear'}




Running experiments for logisticregression with params: {'C': 0.1, 'solver': 'lbfgs'}
Running experiments for logisticregression with params: {'C': 1, 'solver': 'liblinear'}




Running experiments for logisticregression with params: {'C': 1, 'solver': 'lbfgs'}
Running experiments for logisticregression with params: {'C': 10, 'solver': 'liblinear'}




Running experiments for logisticregression with params: {'C': 10, 'solver': 'lbfgs'}
Running experiments for kneighbors with params: {'n_neighbors': 5, 'weights': 'uniform'}
Running experiments for kneighbors with params: {'n_neighbors': 5, 'weights': 'distance'}




Running experiments for kneighbors with params: {'n_neighbors': 10, 'weights': 'uniform'}




Running experiments for kneighbors with params: {'n_neighbors': 10, 'weights': 'distance'}
Running experiments for kneighbors with params: {'n_neighbors': 15, 'weights': 'uniform'}




Running experiments for kneighbors with params: {'n_neighbors': 15, 'weights': 'distance'}
Running experiments for lgbm with params: {'learning_rate': 0.1, 'n_estimators': 100, 'num_leaves': 31}




[LightGBM] [Info] Number of positive: 3576, number of negative: 3526
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.003406 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 11396
[LightGBM] [Info] Number of data points in the train set: 7102, number of used features: 45
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.503520 -> initscore=0.014081
[LightGBM] [Info] Start training from score 0.014081
Running experiments for lgbm with params: {'learning_rate': 0.1, 'n_estimators': 100, 'num_leaves': 64}
[LightGBM] [Info] Number of positive: 3576, number of negative: 3526
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.003526 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 11396
[LightGBM] [Info] Number of data points in the train set: 7102, number of used features: 45
[LightGBM] [Info] [binary:BoostFromScore]: pavg=



Running experiments for randomforest with params: {'max_depth': None, 'min_samples_split': 2, 'n_estimators': 200}




Running experiments for randomforest with params: {'max_depth': None, 'min_samples_split': 2, 'n_estimators': 300}




Running experiments for randomforest with params: {'max_depth': None, 'min_samples_split': 5, 'n_estimators': 100}




Running experiments for randomforest with params: {'max_depth': None, 'min_samples_split': 5, 'n_estimators': 200}




Running experiments for randomforest with params: {'max_depth': None, 'min_samples_split': 5, 'n_estimators': 300}




Running experiments for randomforest with params: {'max_depth': 10, 'min_samples_split': 2, 'n_estimators': 100}




Running experiments for randomforest with params: {'max_depth': 10, 'min_samples_split': 2, 'n_estimators': 200}




Running experiments for randomforest with params: {'max_depth': 10, 'min_samples_split': 2, 'n_estimators': 300}




Running experiments for randomforest with params: {'max_depth': 10, 'min_samples_split': 5, 'n_estimators': 100}




Running experiments for randomforest with params: {'max_depth': 10, 'min_samples_split': 5, 'n_estimators': 200}




Running experiments for randomforest with params: {'max_depth': 10, 'min_samples_split': 5, 'n_estimators': 300}




Running experiments for randomforest with params: {'max_depth': 20, 'min_samples_split': 2, 'n_estimators': 100}




Running experiments for randomforest with params: {'max_depth': 20, 'min_samples_split': 2, 'n_estimators': 200}




Running experiments for randomforest with params: {'max_depth': 20, 'min_samples_split': 2, 'n_estimators': 300}




Running experiments for randomforest with params: {'max_depth': 20, 'min_samples_split': 5, 'n_estimators': 100}




Running experiments for randomforest with params: {'max_depth': 20, 'min_samples_split': 5, 'n_estimators': 200}




Running experiments for randomforest with params: {'max_depth': 20, 'min_samples_split': 5, 'n_estimators': 300}




Running experiments for gradientboosting with params: {'learning_rate': 0.1, 'max_depth': 3, 'n_estimators': 100}




Running experiments for gradientboosting with params: {'learning_rate': 0.1, 'max_depth': 3, 'n_estimators': 200}




Running experiments for gradientboosting with params: {'learning_rate': 0.1, 'max_depth': 5, 'n_estimators': 100}




Running experiments for gradientboosting with params: {'learning_rate': 0.1, 'max_depth': 5, 'n_estimators': 200}




Running experiments for gradientboosting with params: {'learning_rate': 0.05, 'max_depth': 3, 'n_estimators': 100}




Running experiments for gradientboosting with params: {'learning_rate': 0.05, 'max_depth': 3, 'n_estimators': 200}




Running experiments for gradientboosting with params: {'learning_rate': 0.05, 'max_depth': 5, 'n_estimators': 100}




Running experiments for gradientboosting with params: {'learning_rate': 0.05, 'max_depth': 5, 'n_estimators': 200}




Running experiments for extratrees with params: {'max_depth': None, 'min_samples_split': 2, 'n_estimators': 100}




Running experiments for extratrees with params: {'max_depth': None, 'min_samples_split': 2, 'n_estimators': 200}




Running experiments for extratrees with params: {'max_depth': None, 'min_samples_split': 5, 'n_estimators': 100}




Running experiments for extratrees with params: {'max_depth': None, 'min_samples_split': 5, 'n_estimators': 200}




Running experiments for extratrees with params: {'max_depth': 20, 'min_samples_split': 2, 'n_estimators': 100}




Running experiments for extratrees with params: {'max_depth': 20, 'min_samples_split': 2, 'n_estimators': 200}




Running experiments for extratrees with params: {'max_depth': 20, 'min_samples_split': 5, 'n_estimators': 100}




Running experiments for extratrees with params: {'max_depth': 20, 'min_samples_split': 5, 'n_estimators': 200}




Running experiments for gaussiannb with params: {'var_smoothing': 1e-09}
Running experiments for gaussiannb with params: {'var_smoothing': 1e-08}
Running experiments for gaussiannb with params: {'var_smoothing': 1e-10}
Running experiments for adaboost with params: {'learning_rate': 0.1, 'n_estimators': 50}




Running experiments for adaboost with params: {'learning_rate': 0.1, 'n_estimators': 100}




Running experiments for adaboost with params: {'learning_rate': 1.0, 'n_estimators': 50}




Running experiments for adaboost with params: {'learning_rate': 1.0, 'n_estimators': 100}




Running experiments for logisticregression with params: {'C': 0.1, 'solver': 'liblinear'}
Running experiments for logisticregression with params: {'C': 0.1, 'solver': 'lbfgs'}




Running experiments for logisticregression with params: {'C': 1, 'solver': 'liblinear'}
Running experiments for logisticregression with params: {'C': 1, 'solver': 'lbfgs'}




Running experiments for logisticregression with params: {'C': 10, 'solver': 'liblinear'}
Running experiments for logisticregression with params: {'C': 10, 'solver': 'lbfgs'}
Running experiments for kneighbors with params: {'n_neighbors': 5, 'weights': 'uniform'}




Running experiments for kneighbors with params: {'n_neighbors': 5, 'weights': 'distance'}
Running experiments for kneighbors with params: {'n_neighbors': 10, 'weights': 'uniform'}




Running experiments for kneighbors with params: {'n_neighbors': 10, 'weights': 'distance'}
Running experiments for kneighbors with params: {'n_neighbors': 15, 'weights': 'uniform'}




Running experiments for kneighbors with params: {'n_neighbors': 15, 'weights': 'distance'}
Running experiments for lgbm with params: {'learning_rate': 0.1, 'n_estimators': 100, 'num_leaves': 31}
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.001264 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 10500
[LightGBM] [Info] Number of data points in the train set: 3016, number of used features: 42
[LightGBM] [Info] Start training from score -1.099939
[LightGBM] [Info] Start training from score -1.104932
[LightGBM] [Info] Start training from score -1.091015




Running experiments for lgbm with params: {'learning_rate': 0.1, 'n_estimators': 100, 'num_leaves': 64}
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.001088 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 10500
[LightGBM] [Info] Number of data points in the train set: 3016, number of used features: 42
[LightGBM] [Info] Start training from score -1.099939
[LightGBM] [Info] Start training from score -1.104932
[LightGBM] [Info] Start training from score -1.091015
Running experiments for lgbm with params: {'learning_rate': 0.1, 'n_estimators': 200, 'num_leaves': 31}
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.001236 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 10500
[LightGBM] [Info] Number of data points in the train set: 3016, number of used features: 42
[LightGBM] [Info] Start training from score -1.09993



Running experiments for svm with params: {'C': 0.1, 'gamma': 'scale', 'kernel': 'rbf'}




Running experiments for svm with params: {'C': 0.1, 'gamma': 'auto', 'kernel': 'linear'}




Running experiments for svm with params: {'C': 0.1, 'gamma': 'auto', 'kernel': 'rbf'}




Running experiments for svm with params: {'C': 1, 'gamma': 'scale', 'kernel': 'linear'}




Running experiments for svm with params: {'C': 1, 'gamma': 'scale', 'kernel': 'rbf'}




Running experiments for svm with params: {'C': 1, 'gamma': 'auto', 'kernel': 'linear'}




Running experiments for svm with params: {'C': 1, 'gamma': 'auto', 'kernel': 'rbf'}




Running experiments for svm with params: {'C': 10, 'gamma': 'scale', 'kernel': 'linear'}




Running experiments for svm with params: {'C': 10, 'gamma': 'scale', 'kernel': 'rbf'}




Running experiments for svm with params: {'C': 10, 'gamma': 'auto', 'kernel': 'linear'}




Running experiments for svm with params: {'C': 10, 'gamma': 'auto', 'kernel': 'rbf'}




Running experiments for randomforest with params: {'max_depth': None, 'min_samples_split': 2, 'n_estimators': 100}




Running experiments for randomforest with params: {'max_depth': None, 'min_samples_split': 2, 'n_estimators': 200}




Running experiments for randomforest with params: {'max_depth': None, 'min_samples_split': 2, 'n_estimators': 300}




Running experiments for randomforest with params: {'max_depth': None, 'min_samples_split': 5, 'n_estimators': 100}




Running experiments for randomforest with params: {'max_depth': None, 'min_samples_split': 5, 'n_estimators': 200}




Running experiments for randomforest with params: {'max_depth': None, 'min_samples_split': 5, 'n_estimators': 300}




Running experiments for randomforest with params: {'max_depth': 10, 'min_samples_split': 2, 'n_estimators': 100}




Running experiments for randomforest with params: {'max_depth': 10, 'min_samples_split': 2, 'n_estimators': 200}




Running experiments for randomforest with params: {'max_depth': 10, 'min_samples_split': 2, 'n_estimators': 300}




Running experiments for randomforest with params: {'max_depth': 10, 'min_samples_split': 5, 'n_estimators': 100}




Running experiments for randomforest with params: {'max_depth': 10, 'min_samples_split': 5, 'n_estimators': 200}




Running experiments for randomforest with params: {'max_depth': 10, 'min_samples_split': 5, 'n_estimators': 300}




Running experiments for randomforest with params: {'max_depth': 20, 'min_samples_split': 2, 'n_estimators': 100}




Running experiments for randomforest with params: {'max_depth': 20, 'min_samples_split': 2, 'n_estimators': 200}




Running experiments for randomforest with params: {'max_depth': 20, 'min_samples_split': 2, 'n_estimators': 300}




Running experiments for randomforest with params: {'max_depth': 20, 'min_samples_split': 5, 'n_estimators': 100}




Running experiments for randomforest with params: {'max_depth': 20, 'min_samples_split': 5, 'n_estimators': 200}




Running experiments for randomforest with params: {'max_depth': 20, 'min_samples_split': 5, 'n_estimators': 300}




Running experiments for gradientboosting with params: {'learning_rate': 0.1, 'max_depth': 3, 'n_estimators': 100}




Running experiments for gradientboosting with params: {'learning_rate': 0.1, 'max_depth': 3, 'n_estimators': 200}




Running experiments for gradientboosting with params: {'learning_rate': 0.1, 'max_depth': 5, 'n_estimators': 100}




Running experiments for gradientboosting with params: {'learning_rate': 0.1, 'max_depth': 5, 'n_estimators': 200}




Running experiments for gradientboosting with params: {'learning_rate': 0.05, 'max_depth': 3, 'n_estimators': 100}




Running experiments for gradientboosting with params: {'learning_rate': 0.05, 'max_depth': 3, 'n_estimators': 200}




Running experiments for gradientboosting with params: {'learning_rate': 0.05, 'max_depth': 5, 'n_estimators': 100}




Running experiments for gradientboosting with params: {'learning_rate': 0.05, 'max_depth': 5, 'n_estimators': 200}




Running experiments for extratrees with params: {'max_depth': None, 'min_samples_split': 2, 'n_estimators': 100}




Running experiments for extratrees with params: {'max_depth': None, 'min_samples_split': 2, 'n_estimators': 200}




Running experiments for extratrees with params: {'max_depth': None, 'min_samples_split': 5, 'n_estimators': 100}




Running experiments for extratrees with params: {'max_depth': None, 'min_samples_split': 5, 'n_estimators': 200}




Running experiments for extratrees with params: {'max_depth': 20, 'min_samples_split': 2, 'n_estimators': 100}




Running experiments for extratrees with params: {'max_depth': 20, 'min_samples_split': 2, 'n_estimators': 200}




Running experiments for extratrees with params: {'max_depth': 20, 'min_samples_split': 5, 'n_estimators': 100}




Running experiments for extratrees with params: {'max_depth': 20, 'min_samples_split': 5, 'n_estimators': 200}




Running experiments for gaussiannb with params: {'var_smoothing': 1e-09}
Running experiments for gaussiannb with params: {'var_smoothing': 1e-08}
Running experiments for gaussiannb with params: {'var_smoothing': 1e-10}
Running experiments for adaboost with params: {'learning_rate': 0.1, 'n_estimators': 50}




Running experiments for adaboost with params: {'learning_rate': 0.1, 'n_estimators': 100}




Running experiments for adaboost with params: {'learning_rate': 1.0, 'n_estimators': 50}




Running experiments for adaboost with params: {'learning_rate': 1.0, 'n_estimators': 100}




Running experiments for logisticregression with params: {'C': 0.1, 'solver': 'liblinear'}
Running experiments for logisticregression with params: {'C': 0.1, 'solver': 'lbfgs'}




Running experiments for logisticregression with params: {'C': 1, 'solver': 'liblinear'}
Running experiments for logisticregression with params: {'C': 1, 'solver': 'lbfgs'}




Running experiments for logisticregression with params: {'C': 10, 'solver': 'liblinear'}
Running experiments for logisticregression with params: {'C': 10, 'solver': 'lbfgs'}




Running experiments for kneighbors with params: {'n_neighbors': 5, 'weights': 'uniform'}
Running experiments for kneighbors with params: {'n_neighbors': 5, 'weights': 'distance'}
Running experiments for kneighbors with params: {'n_neighbors': 10, 'weights': 'uniform'}




Running experiments for kneighbors with params: {'n_neighbors': 10, 'weights': 'distance'}
Running experiments for kneighbors with params: {'n_neighbors': 15, 'weights': 'uniform'}




Running experiments for kneighbors with params: {'n_neighbors': 15, 'weights': 'distance'}
Running experiments for lgbm with params: {'learning_rate': 0.1, 'n_estimators': 100, 'num_leaves': 31}
[LightGBM] [Info] Number of positive: 3576, number of negative: 3506
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002487 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 11668
[LightGBM] [Info] Number of data points in the train set: 7082, number of used features: 46
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.504942 -> initscore=0.019769
[LightGBM] [Info] Start training from score 0.019769




Running experiments for lgbm with params: {'learning_rate': 0.1, 'n_estimators': 100, 'num_leaves': 64}
[LightGBM] [Info] Number of positive: 3576, number of negative: 3506
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002574 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 11668
[LightGBM] [Info] Number of data points in the train set: 7082, number of used features: 46
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.504942 -> initscore=0.019769
[LightGBM] [Info] Start training from score 0.019769
Running experiments for lgbm with params: {'learning_rate': 0.1, 'n_estimators': 200, 'num_leaves': 31}
[LightGBM] [Info] Number of positive: 3576, number of negative: 3506
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002285 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 11668
[LightGBM] [Info] Number of data poi



Running experiments for svm with params: {'C': 0.1, 'gamma': 'scale', 'kernel': 'rbf'}




Running experiments for svm with params: {'C': 0.1, 'gamma': 'auto', 'kernel': 'linear'}




Running experiments for svm with params: {'C': 0.1, 'gamma': 'auto', 'kernel': 'rbf'}




Running experiments for svm with params: {'C': 1, 'gamma': 'scale', 'kernel': 'linear'}




Running experiments for svm with params: {'C': 1, 'gamma': 'scale', 'kernel': 'rbf'}




Running experiments for svm with params: {'C': 1, 'gamma': 'auto', 'kernel': 'linear'}




Running experiments for svm with params: {'C': 1, 'gamma': 'auto', 'kernel': 'rbf'}




Running experiments for svm with params: {'C': 10, 'gamma': 'scale', 'kernel': 'linear'}




Running experiments for svm with params: {'C': 10, 'gamma': 'scale', 'kernel': 'rbf'}




Running experiments for svm with params: {'C': 10, 'gamma': 'auto', 'kernel': 'linear'}




Running experiments for svm with params: {'C': 10, 'gamma': 'auto', 'kernel': 'rbf'}




Running experiments for randomforest with params: {'max_depth': None, 'min_samples_split': 2, 'n_estimators': 100}




Running experiments for randomforest with params: {'max_depth': None, 'min_samples_split': 2, 'n_estimators': 200}




Running experiments for randomforest with params: {'max_depth': None, 'min_samples_split': 2, 'n_estimators': 300}




Running experiments for randomforest with params: {'max_depth': None, 'min_samples_split': 5, 'n_estimators': 100}




Running experiments for randomforest with params: {'max_depth': None, 'min_samples_split': 5, 'n_estimators': 200}




Running experiments for randomforest with params: {'max_depth': None, 'min_samples_split': 5, 'n_estimators': 300}




Running experiments for randomforest with params: {'max_depth': 10, 'min_samples_split': 2, 'n_estimators': 100}




Running experiments for randomforest with params: {'max_depth': 10, 'min_samples_split': 2, 'n_estimators': 200}




Running experiments for randomforest with params: {'max_depth': 10, 'min_samples_split': 2, 'n_estimators': 300}




Running experiments for randomforest with params: {'max_depth': 10, 'min_samples_split': 5, 'n_estimators': 100}




Running experiments for randomforest with params: {'max_depth': 10, 'min_samples_split': 5, 'n_estimators': 200}




Running experiments for randomforest with params: {'max_depth': 10, 'min_samples_split': 5, 'n_estimators': 300}




Running experiments for randomforest with params: {'max_depth': 20, 'min_samples_split': 2, 'n_estimators': 100}




Running experiments for randomforest with params: {'max_depth': 20, 'min_samples_split': 2, 'n_estimators': 200}




Running experiments for randomforest with params: {'max_depth': 20, 'min_samples_split': 2, 'n_estimators': 300}




Running experiments for randomforest with params: {'max_depth': 20, 'min_samples_split': 5, 'n_estimators': 100}




Running experiments for randomforest with params: {'max_depth': 20, 'min_samples_split': 5, 'n_estimators': 200}




Running experiments for randomforest with params: {'max_depth': 20, 'min_samples_split': 5, 'n_estimators': 300}




Running experiments for gradientboosting with params: {'learning_rate': 0.1, 'max_depth': 3, 'n_estimators': 100}




Running experiments for gradientboosting with params: {'learning_rate': 0.1, 'max_depth': 3, 'n_estimators': 200}




Running experiments for gradientboosting with params: {'learning_rate': 0.1, 'max_depth': 5, 'n_estimators': 100}




Running experiments for gradientboosting with params: {'learning_rate': 0.1, 'max_depth': 5, 'n_estimators': 200}




Running experiments for gradientboosting with params: {'learning_rate': 0.05, 'max_depth': 3, 'n_estimators': 100}




Running experiments for gradientboosting with params: {'learning_rate': 0.05, 'max_depth': 3, 'n_estimators': 200}




Running experiments for gradientboosting with params: {'learning_rate': 0.05, 'max_depth': 5, 'n_estimators': 100}




Running experiments for gradientboosting with params: {'learning_rate': 0.05, 'max_depth': 5, 'n_estimators': 200}




Running experiments for extratrees with params: {'max_depth': None, 'min_samples_split': 2, 'n_estimators': 100}




Running experiments for extratrees with params: {'max_depth': None, 'min_samples_split': 2, 'n_estimators': 200}




Running experiments for extratrees with params: {'max_depth': None, 'min_samples_split': 5, 'n_estimators': 100}




Running experiments for extratrees with params: {'max_depth': None, 'min_samples_split': 5, 'n_estimators': 200}




Running experiments for extratrees with params: {'max_depth': 20, 'min_samples_split': 2, 'n_estimators': 100}




Running experiments for extratrees with params: {'max_depth': 20, 'min_samples_split': 2, 'n_estimators': 200}




Running experiments for extratrees with params: {'max_depth': 20, 'min_samples_split': 5, 'n_estimators': 100}




Running experiments for extratrees with params: {'max_depth': 20, 'min_samples_split': 5, 'n_estimators': 200}




Running experiments for gaussiannb with params: {'var_smoothing': 1e-09}
Running experiments for gaussiannb with params: {'var_smoothing': 1e-08}
Running experiments for gaussiannb with params: {'var_smoothing': 1e-10}
Running experiments for adaboost with params: {'learning_rate': 0.1, 'n_estimators': 50}




Running experiments for adaboost with params: {'learning_rate': 0.1, 'n_estimators': 100}




Running experiments for adaboost with params: {'learning_rate': 1.0, 'n_estimators': 50}




Running experiments for adaboost with params: {'learning_rate': 1.0, 'n_estimators': 100}




Running experiments for logisticregression with params: {'C': 0.1, 'solver': 'liblinear'}
Running experiments for logisticregression with params: {'C': 0.1, 'solver': 'lbfgs'}




Running experiments for logisticregression with params: {'C': 1, 'solver': 'liblinear'}
Running experiments for logisticregression with params: {'C': 1, 'solver': 'lbfgs'}
Running experiments for logisticregression with params: {'C': 10, 'solver': 'liblinear'}




Running experiments for logisticregression with params: {'C': 10, 'solver': 'lbfgs'}
Running experiments for kneighbors with params: {'n_neighbors': 5, 'weights': 'uniform'}




Running experiments for kneighbors with params: {'n_neighbors': 5, 'weights': 'distance'}
Running experiments for kneighbors with params: {'n_neighbors': 10, 'weights': 'uniform'}




Running experiments for kneighbors with params: {'n_neighbors': 10, 'weights': 'distance'}
Running experiments for kneighbors with params: {'n_neighbors': 15, 'weights': 'uniform'}




Running experiments for kneighbors with params: {'n_neighbors': 15, 'weights': 'distance'}
Running experiments for lgbm with params: {'learning_rate': 0.1, 'n_estimators': 100, 'num_leaves': 31}
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.001124 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 11776
[LightGBM] [Info] Number of data points in the train set: 3002, number of used features: 47
[LightGBM] [Info] Start training from score -1.090319
[LightGBM] [Info] Start training from score -1.098279
[LightGBM] [Info] Start training from score -1.107311




Running experiments for lgbm with params: {'learning_rate': 0.1, 'n_estimators': 100, 'num_leaves': 64}
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.001198 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 11776
[LightGBM] [Info] Number of data points in the train set: 3002, number of used features: 47
[LightGBM] [Info] Start training from score -1.090319
[LightGBM] [Info] Start training from score -1.098279
[LightGBM] [Info] Start training from score -1.107311
Running experiments for lgbm with params: {'learning_rate': 0.1, 'n_estimators': 200, 'num_leaves': 31}
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.001248 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 11776
[LightGBM] [Info] Number of data points in the train set: 3002, number of used features: 47
[LightGBM] [Info] Start training from score -1.09031



Running experiments for randomforest with params: {'max_depth': None, 'min_samples_split': 2, 'n_estimators': 200}




Running experiments for randomforest with params: {'max_depth': None, 'min_samples_split': 2, 'n_estimators': 300}




Running experiments for randomforest with params: {'max_depth': None, 'min_samples_split': 5, 'n_estimators': 100}




Running experiments for randomforest with params: {'max_depth': None, 'min_samples_split': 5, 'n_estimators': 200}




Running experiments for randomforest with params: {'max_depth': None, 'min_samples_split': 5, 'n_estimators': 300}




Running experiments for randomforest with params: {'max_depth': 10, 'min_samples_split': 2, 'n_estimators': 100}




Running experiments for randomforest with params: {'max_depth': 10, 'min_samples_split': 2, 'n_estimators': 200}




Running experiments for randomforest with params: {'max_depth': 10, 'min_samples_split': 2, 'n_estimators': 300}




Running experiments for randomforest with params: {'max_depth': 10, 'min_samples_split': 5, 'n_estimators': 100}




Running experiments for randomforest with params: {'max_depth': 10, 'min_samples_split': 5, 'n_estimators': 200}




Running experiments for randomforest with params: {'max_depth': 10, 'min_samples_split': 5, 'n_estimators': 300}




Running experiments for randomforest with params: {'max_depth': 20, 'min_samples_split': 2, 'n_estimators': 100}




Running experiments for randomforest with params: {'max_depth': 20, 'min_samples_split': 2, 'n_estimators': 200}




Running experiments for randomforest with params: {'max_depth': 20, 'min_samples_split': 2, 'n_estimators': 300}




Running experiments for randomforest with params: {'max_depth': 20, 'min_samples_split': 5, 'n_estimators': 100}




Running experiments for randomforest with params: {'max_depth': 20, 'min_samples_split': 5, 'n_estimators': 200}




Running experiments for randomforest with params: {'max_depth': 20, 'min_samples_split': 5, 'n_estimators': 300}




Running experiments for gradientboosting with params: {'learning_rate': 0.1, 'max_depth': 3, 'n_estimators': 100}




Running experiments for gradientboosting with params: {'learning_rate': 0.1, 'max_depth': 3, 'n_estimators': 200}




Running experiments for gradientboosting with params: {'learning_rate': 0.1, 'max_depth': 5, 'n_estimators': 100}




Running experiments for gradientboosting with params: {'learning_rate': 0.1, 'max_depth': 5, 'n_estimators': 200}




Running experiments for gradientboosting with params: {'learning_rate': 0.05, 'max_depth': 3, 'n_estimators': 100}




Running experiments for gradientboosting with params: {'learning_rate': 0.05, 'max_depth': 3, 'n_estimators': 200}




Running experiments for gradientboosting with params: {'learning_rate': 0.05, 'max_depth': 5, 'n_estimators': 100}




Running experiments for gradientboosting with params: {'learning_rate': 0.05, 'max_depth': 5, 'n_estimators': 200}




Running experiments for extratrees with params: {'max_depth': None, 'min_samples_split': 2, 'n_estimators': 100}




Running experiments for extratrees with params: {'max_depth': None, 'min_samples_split': 2, 'n_estimators': 200}




Running experiments for extratrees with params: {'max_depth': None, 'min_samples_split': 5, 'n_estimators': 100}




Running experiments for extratrees with params: {'max_depth': None, 'min_samples_split': 5, 'n_estimators': 200}




Running experiments for extratrees with params: {'max_depth': 20, 'min_samples_split': 2, 'n_estimators': 100}




Running experiments for extratrees with params: {'max_depth': 20, 'min_samples_split': 2, 'n_estimators': 200}




Running experiments for extratrees with params: {'max_depth': 20, 'min_samples_split': 5, 'n_estimators': 100}




Running experiments for extratrees with params: {'max_depth': 20, 'min_samples_split': 5, 'n_estimators': 200}




Running experiments for gaussiannb with params: {'var_smoothing': 1e-09}
Running experiments for gaussiannb with params: {'var_smoothing': 1e-08}
Running experiments for gaussiannb with params: {'var_smoothing': 1e-10}
Running experiments for adaboost with params: {'learning_rate': 0.1, 'n_estimators': 50}




Running experiments for adaboost with params: {'learning_rate': 0.1, 'n_estimators': 100}




Running experiments for adaboost with params: {'learning_rate': 1.0, 'n_estimators': 50}




Running experiments for adaboost with params: {'learning_rate': 1.0, 'n_estimators': 100}




Running experiments for logisticregression with params: {'C': 0.1, 'solver': 'liblinear'}




Running experiments for logisticregression with params: {'C': 0.1, 'solver': 'lbfgs'}
Running experiments for logisticregression with params: {'C': 1, 'solver': 'liblinear'}




Running experiments for logisticregression with params: {'C': 1, 'solver': 'lbfgs'}
Running experiments for logisticregression with params: {'C': 10, 'solver': 'liblinear'}




Running experiments for logisticregression with params: {'C': 10, 'solver': 'lbfgs'}
Running experiments for kneighbors with params: {'n_neighbors': 5, 'weights': 'uniform'}
Running experiments for kneighbors with params: {'n_neighbors': 5, 'weights': 'distance'}
Running experiments for kneighbors with params: {'n_neighbors': 10, 'weights': 'uniform'}




Running experiments for kneighbors with params: {'n_neighbors': 10, 'weights': 'distance'}
Running experiments for kneighbors with params: {'n_neighbors': 15, 'weights': 'uniform'}




Running experiments for kneighbors with params: {'n_neighbors': 15, 'weights': 'distance'}
Running experiments for lgbm with params: {'learning_rate': 0.1, 'n_estimators': 100, 'num_leaves': 31}
[LightGBM] [Info] Number of positive: 3576, number of negative: 3506




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002302 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 11648
[LightGBM] [Info] Number of data points in the train set: 7082, number of used features: 46
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.504942 -> initscore=0.019769
[LightGBM] [Info] Start training from score 0.019769
Running experiments for lgbm with params: {'learning_rate': 0.1, 'n_estimators': 100, 'num_leaves': 64}
[LightGBM] [Info] Number of positive: 3576, number of negative: 3506
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002445 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 11648
[LightGBM] [Info] Number of data points in the train set: 7082, number of used features: 46
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.504942 -> initscore=0.019769
[LightGBM] [Info] Start training from 



Running experiments for randomforest with params: {'max_depth': None, 'min_samples_split': 2, 'n_estimators': 200}




Running experiments for randomforest with params: {'max_depth': None, 'min_samples_split': 2, 'n_estimators': 300}




Running experiments for randomforest with params: {'max_depth': None, 'min_samples_split': 5, 'n_estimators': 100}




Running experiments for randomforest with params: {'max_depth': None, 'min_samples_split': 5, 'n_estimators': 200}




Running experiments for randomforest with params: {'max_depth': None, 'min_samples_split': 5, 'n_estimators': 300}




Running experiments for randomforest with params: {'max_depth': 10, 'min_samples_split': 2, 'n_estimators': 100}




Running experiments for randomforest with params: {'max_depth': 10, 'min_samples_split': 2, 'n_estimators': 200}




Running experiments for randomforest with params: {'max_depth': 10, 'min_samples_split': 2, 'n_estimators': 300}




Running experiments for randomforest with params: {'max_depth': 10, 'min_samples_split': 5, 'n_estimators': 100}




Running experiments for randomforest with params: {'max_depth': 10, 'min_samples_split': 5, 'n_estimators': 200}




Running experiments for randomforest with params: {'max_depth': 10, 'min_samples_split': 5, 'n_estimators': 300}




Running experiments for randomforest with params: {'max_depth': 20, 'min_samples_split': 2, 'n_estimators': 100}




Running experiments for randomforest with params: {'max_depth': 20, 'min_samples_split': 2, 'n_estimators': 200}




Running experiments for randomforest with params: {'max_depth': 20, 'min_samples_split': 2, 'n_estimators': 300}




Running experiments for randomforest with params: {'max_depth': 20, 'min_samples_split': 5, 'n_estimators': 100}




Running experiments for randomforest with params: {'max_depth': 20, 'min_samples_split': 5, 'n_estimators': 200}




Running experiments for randomforest with params: {'max_depth': 20, 'min_samples_split': 5, 'n_estimators': 300}




Running experiments for gradientboosting with params: {'learning_rate': 0.1, 'max_depth': 3, 'n_estimators': 100}




Running experiments for gradientboosting with params: {'learning_rate': 0.1, 'max_depth': 3, 'n_estimators': 200}




Running experiments for gradientboosting with params: {'learning_rate': 0.1, 'max_depth': 5, 'n_estimators': 100}




Running experiments for gradientboosting with params: {'learning_rate': 0.1, 'max_depth': 5, 'n_estimators': 200}




Running experiments for gradientboosting with params: {'learning_rate': 0.05, 'max_depth': 3, 'n_estimators': 100}




Running experiments for gradientboosting with params: {'learning_rate': 0.05, 'max_depth': 3, 'n_estimators': 200}




Running experiments for gradientboosting with params: {'learning_rate': 0.05, 'max_depth': 5, 'n_estimators': 100}




Running experiments for gradientboosting with params: {'learning_rate': 0.05, 'max_depth': 5, 'n_estimators': 200}




Running experiments for extratrees with params: {'max_depth': None, 'min_samples_split': 2, 'n_estimators': 100}




Running experiments for extratrees with params: {'max_depth': None, 'min_samples_split': 2, 'n_estimators': 200}




Running experiments for extratrees with params: {'max_depth': None, 'min_samples_split': 5, 'n_estimators': 100}




Running experiments for extratrees with params: {'max_depth': None, 'min_samples_split': 5, 'n_estimators': 200}




Running experiments for extratrees with params: {'max_depth': 20, 'min_samples_split': 2, 'n_estimators': 100}




Running experiments for extratrees with params: {'max_depth': 20, 'min_samples_split': 2, 'n_estimators': 200}




Running experiments for extratrees with params: {'max_depth': 20, 'min_samples_split': 5, 'n_estimators': 100}




Running experiments for extratrees with params: {'max_depth': 20, 'min_samples_split': 5, 'n_estimators': 200}




Running experiments for gaussiannb with params: {'var_smoothing': 1e-09}
Running experiments for gaussiannb with params: {'var_smoothing': 1e-08}
Running experiments for gaussiannb with params: {'var_smoothing': 1e-10}
Running experiments for adaboost with params: {'learning_rate': 0.1, 'n_estimators': 50}




Running experiments for adaboost with params: {'learning_rate': 0.1, 'n_estimators': 100}




Running experiments for adaboost with params: {'learning_rate': 1.0, 'n_estimators': 50}




Running experiments for adaboost with params: {'learning_rate': 1.0, 'n_estimators': 100}




Running experiments for logisticregression with params: {'C': 0.1, 'solver': 'liblinear'}
Running experiments for logisticregression with params: {'C': 0.1, 'solver': 'lbfgs'}
Running experiments for logisticregression with params: {'C': 1, 'solver': 'liblinear'}


  _warn_prf(average, modifier, msg_start, len(result))
  _warn_prf(average, modifier, msg_start, len(result))


Running experiments for logisticregression with params: {'C': 1, 'solver': 'lbfgs'}
Running experiments for logisticregression with params: {'C': 10, 'solver': 'liblinear'}
Running experiments for logisticregression with params: {'C': 10, 'solver': 'lbfgs'}
Running experiments for kneighbors with params: {'n_neighbors': 5, 'weights': 'uniform'}


  _warn_prf(average, modifier, msg_start, len(result))


Running experiments for kneighbors with params: {'n_neighbors': 5, 'weights': 'distance'}
Running experiments for kneighbors with params: {'n_neighbors': 10, 'weights': 'uniform'}




Running experiments for kneighbors with params: {'n_neighbors': 10, 'weights': 'distance'}
Running experiments for kneighbors with params: {'n_neighbors': 15, 'weights': 'uniform'}




Running experiments for kneighbors with params: {'n_neighbors': 15, 'weights': 'distance'}
Running experiments for lgbm with params: {'learning_rate': 0.1, 'n_estimators': 100, 'num_leaves': 31}
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002779 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 11824
[LightGBM] [Info] Number of data points in the train set: 3002, number of used features: 47
[LightGBM] [Info] Start training from score -1.090319
[LightGBM] [Info] Start training from score -1.098279
[LightGBM] [Info] Start training from score -1.107311




Running experiments for lgbm with params: {'learning_rate': 0.1, 'n_estimators': 100, 'num_leaves': 64}
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.001612 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 11824
[LightGBM] [Info] Number of data points in the train set: 3002, number of used features: 47
[LightGBM] [Info] Start training from score -1.090319
[LightGBM] [Info] Start training from score -1.098279
[LightGBM] [Info] Start training from score -1.107311
Running experiments for lgbm with params: {'learning_rate': 0.1, 'n_estimators': 200, 'num_leaves': 31}
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.001407 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 11824
[LightGBM] [Info] Number of data points in the train set: 3002, number of used features: 47
[LightGBM] [Info] Start training from score -1.09031



Running experiments for svm with params: {'C': 0.1, 'gamma': 'scale', 'kernel': 'rbf'}




Running experiments for svm with params: {'C': 0.1, 'gamma': 'auto', 'kernel': 'linear'}




Running experiments for svm with params: {'C': 0.1, 'gamma': 'auto', 'kernel': 'rbf'}




Running experiments for svm with params: {'C': 1, 'gamma': 'scale', 'kernel': 'linear'}




Running experiments for svm with params: {'C': 1, 'gamma': 'scale', 'kernel': 'rbf'}




Running experiments for svm with params: {'C': 1, 'gamma': 'auto', 'kernel': 'linear'}




Running experiments for svm with params: {'C': 1, 'gamma': 'auto', 'kernel': 'rbf'}




Running experiments for svm with params: {'C': 10, 'gamma': 'scale', 'kernel': 'linear'}




Running experiments for svm with params: {'C': 10, 'gamma': 'scale', 'kernel': 'rbf'}




Running experiments for svm with params: {'C': 10, 'gamma': 'auto', 'kernel': 'linear'}




Running experiments for svm with params: {'C': 10, 'gamma': 'auto', 'kernel': 'rbf'}




Running experiments for randomforest with params: {'max_depth': None, 'min_samples_split': 2, 'n_estimators': 100}




Running experiments for randomforest with params: {'max_depth': None, 'min_samples_split': 2, 'n_estimators': 200}




Running experiments for randomforest with params: {'max_depth': None, 'min_samples_split': 2, 'n_estimators': 300}




Running experiments for randomforest with params: {'max_depth': None, 'min_samples_split': 5, 'n_estimators': 100}




Running experiments for randomforest with params: {'max_depth': None, 'min_samples_split': 5, 'n_estimators': 200}




Running experiments for randomforest with params: {'max_depth': None, 'min_samples_split': 5, 'n_estimators': 300}




Running experiments for randomforest with params: {'max_depth': 10, 'min_samples_split': 2, 'n_estimators': 100}




Running experiments for randomforest with params: {'max_depth': 10, 'min_samples_split': 2, 'n_estimators': 200}




Running experiments for randomforest with params: {'max_depth': 10, 'min_samples_split': 2, 'n_estimators': 300}




Running experiments for randomforest with params: {'max_depth': 10, 'min_samples_split': 5, 'n_estimators': 100}




Running experiments for randomforest with params: {'max_depth': 10, 'min_samples_split': 5, 'n_estimators': 200}




Running experiments for randomforest with params: {'max_depth': 10, 'min_samples_split': 5, 'n_estimators': 300}




Running experiments for randomforest with params: {'max_depth': 20, 'min_samples_split': 2, 'n_estimators': 100}




Running experiments for randomforest with params: {'max_depth': 20, 'min_samples_split': 2, 'n_estimators': 200}




Running experiments for randomforest with params: {'max_depth': 20, 'min_samples_split': 2, 'n_estimators': 300}




Running experiments for randomforest with params: {'max_depth': 20, 'min_samples_split': 5, 'n_estimators': 100}




Running experiments for randomforest with params: {'max_depth': 20, 'min_samples_split': 5, 'n_estimators': 200}




Running experiments for randomforest with params: {'max_depth': 20, 'min_samples_split': 5, 'n_estimators': 300}




Running experiments for gradientboosting with params: {'learning_rate': 0.1, 'max_depth': 3, 'n_estimators': 100}




Running experiments for gradientboosting with params: {'learning_rate': 0.1, 'max_depth': 3, 'n_estimators': 200}




Running experiments for gradientboosting with params: {'learning_rate': 0.1, 'max_depth': 5, 'n_estimators': 100}




Running experiments for gradientboosting with params: {'learning_rate': 0.1, 'max_depth': 5, 'n_estimators': 200}




Running experiments for gradientboosting with params: {'learning_rate': 0.05, 'max_depth': 3, 'n_estimators': 100}




Running experiments for gradientboosting with params: {'learning_rate': 0.05, 'max_depth': 3, 'n_estimators': 200}




Running experiments for gradientboosting with params: {'learning_rate': 0.05, 'max_depth': 5, 'n_estimators': 100}




Running experiments for gradientboosting with params: {'learning_rate': 0.05, 'max_depth': 5, 'n_estimators': 200}




Running experiments for extratrees with params: {'max_depth': None, 'min_samples_split': 2, 'n_estimators': 100}




Running experiments for extratrees with params: {'max_depth': None, 'min_samples_split': 2, 'n_estimators': 200}




Running experiments for extratrees with params: {'max_depth': None, 'min_samples_split': 5, 'n_estimators': 100}




Running experiments for extratrees with params: {'max_depth': None, 'min_samples_split': 5, 'n_estimators': 200}




Running experiments for extratrees with params: {'max_depth': 20, 'min_samples_split': 2, 'n_estimators': 100}




Running experiments for extratrees with params: {'max_depth': 20, 'min_samples_split': 2, 'n_estimators': 200}




Running experiments for extratrees with params: {'max_depth': 20, 'min_samples_split': 5, 'n_estimators': 100}




Running experiments for extratrees with params: {'max_depth': 20, 'min_samples_split': 5, 'n_estimators': 200}




Running experiments for gaussiannb with params: {'var_smoothing': 1e-09}
Running experiments for gaussiannb with params: {'var_smoothing': 1e-08}
Running experiments for gaussiannb with params: {'var_smoothing': 1e-10}
Running experiments for adaboost with params: {'learning_rate': 0.1, 'n_estimators': 50}




Running experiments for adaboost with params: {'learning_rate': 0.1, 'n_estimators': 100}




Running experiments for adaboost with params: {'learning_rate': 1.0, 'n_estimators': 50}




Running experiments for adaboost with params: {'learning_rate': 1.0, 'n_estimators': 100}




Running experiments for logisticregression with params: {'C': 0.1, 'solver': 'liblinear'}




Running experiments for logisticregression with params: {'C': 0.1, 'solver': 'lbfgs'}
Running experiments for logisticregression with params: {'C': 1, 'solver': 'liblinear'}




Running experiments for logisticregression with params: {'C': 1, 'solver': 'lbfgs'}
Running experiments for logisticregression with params: {'C': 10, 'solver': 'liblinear'}




Running experiments for logisticregression with params: {'C': 10, 'solver': 'lbfgs'}
Running experiments for kneighbors with params: {'n_neighbors': 5, 'weights': 'uniform'}
Running experiments for kneighbors with params: {'n_neighbors': 5, 'weights': 'distance'}
Running experiments for kneighbors with params: {'n_neighbors': 10, 'weights': 'uniform'}




Running experiments for kneighbors with params: {'n_neighbors': 10, 'weights': 'distance'}
Running experiments for kneighbors with params: {'n_neighbors': 15, 'weights': 'uniform'}




Running experiments for kneighbors with params: {'n_neighbors': 15, 'weights': 'distance'}
Running experiments for lgbm with params: {'learning_rate': 0.1, 'n_estimators': 100, 'num_leaves': 31}
[LightGBM] [Info] Number of positive: 3576, number of negative: 3526




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002492 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 11126
[LightGBM] [Info] Number of data points in the train set: 7102, number of used features: 44
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.503520 -> initscore=0.014081
[LightGBM] [Info] Start training from score 0.014081
Running experiments for lgbm with params: {'learning_rate': 0.1, 'n_estimators': 100, 'num_leaves': 64}
[LightGBM] [Info] Number of positive: 3576, number of negative: 3526
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002140 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 11126
[LightGBM] [Info] Number of data points in the train set: 7102, number of used features: 44
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.503520 -> initscore=0.014081
[LightGBM] [Info] Start training from 



Running experiments for svm with params: {'C': 0.1, 'gamma': 'scale', 'kernel': 'rbf'}




Running experiments for svm with params: {'C': 0.1, 'gamma': 'auto', 'kernel': 'linear'}




Running experiments for svm with params: {'C': 0.1, 'gamma': 'auto', 'kernel': 'rbf'}




Running experiments for svm with params: {'C': 1, 'gamma': 'scale', 'kernel': 'linear'}




Running experiments for svm with params: {'C': 1, 'gamma': 'scale', 'kernel': 'rbf'}




Running experiments for svm with params: {'C': 1, 'gamma': 'auto', 'kernel': 'linear'}




Running experiments for svm with params: {'C': 1, 'gamma': 'auto', 'kernel': 'rbf'}




Running experiments for svm with params: {'C': 10, 'gamma': 'scale', 'kernel': 'linear'}




Running experiments for svm with params: {'C': 10, 'gamma': 'scale', 'kernel': 'rbf'}




Running experiments for svm with params: {'C': 10, 'gamma': 'auto', 'kernel': 'linear'}




Running experiments for svm with params: {'C': 10, 'gamma': 'auto', 'kernel': 'rbf'}




Running experiments for randomforest with params: {'max_depth': None, 'min_samples_split': 2, 'n_estimators': 100}




Running experiments for randomforest with params: {'max_depth': None, 'min_samples_split': 2, 'n_estimators': 200}




Running experiments for randomforest with params: {'max_depth': None, 'min_samples_split': 2, 'n_estimators': 300}




Running experiments for randomforest with params: {'max_depth': None, 'min_samples_split': 5, 'n_estimators': 100}




Running experiments for randomforest with params: {'max_depth': None, 'min_samples_split': 5, 'n_estimators': 200}




Running experiments for randomforest with params: {'max_depth': None, 'min_samples_split': 5, 'n_estimators': 300}




Running experiments for randomforest with params: {'max_depth': 10, 'min_samples_split': 2, 'n_estimators': 100}




Running experiments for randomforest with params: {'max_depth': 10, 'min_samples_split': 2, 'n_estimators': 200}




Running experiments for randomforest with params: {'max_depth': 10, 'min_samples_split': 2, 'n_estimators': 300}




Running experiments for randomforest with params: {'max_depth': 10, 'min_samples_split': 5, 'n_estimators': 100}




Running experiments for randomforest with params: {'max_depth': 10, 'min_samples_split': 5, 'n_estimators': 200}




Running experiments for randomforest with params: {'max_depth': 10, 'min_samples_split': 5, 'n_estimators': 300}




Running experiments for randomforest with params: {'max_depth': 20, 'min_samples_split': 2, 'n_estimators': 100}




Running experiments for randomforest with params: {'max_depth': 20, 'min_samples_split': 2, 'n_estimators': 200}




Running experiments for randomforest with params: {'max_depth': 20, 'min_samples_split': 2, 'n_estimators': 300}




Running experiments for randomforest with params: {'max_depth': 20, 'min_samples_split': 5, 'n_estimators': 100}




Running experiments for randomforest with params: {'max_depth': 20, 'min_samples_split': 5, 'n_estimators': 200}




Running experiments for randomforest with params: {'max_depth': 20, 'min_samples_split': 5, 'n_estimators': 300}




Running experiments for gradientboosting with params: {'learning_rate': 0.1, 'max_depth': 3, 'n_estimators': 100}




Running experiments for gradientboosting with params: {'learning_rate': 0.1, 'max_depth': 3, 'n_estimators': 200}




Running experiments for gradientboosting with params: {'learning_rate': 0.1, 'max_depth': 5, 'n_estimators': 100}




Running experiments for gradientboosting with params: {'learning_rate': 0.1, 'max_depth': 5, 'n_estimators': 200}




Running experiments for gradientboosting with params: {'learning_rate': 0.05, 'max_depth': 3, 'n_estimators': 100}




Running experiments for gradientboosting with params: {'learning_rate': 0.05, 'max_depth': 3, 'n_estimators': 200}




Running experiments for gradientboosting with params: {'learning_rate': 0.05, 'max_depth': 5, 'n_estimators': 100}




Running experiments for gradientboosting with params: {'learning_rate': 0.05, 'max_depth': 5, 'n_estimators': 200}




Running experiments for extratrees with params: {'max_depth': None, 'min_samples_split': 2, 'n_estimators': 100}




Running experiments for extratrees with params: {'max_depth': None, 'min_samples_split': 2, 'n_estimators': 200}




Running experiments for extratrees with params: {'max_depth': None, 'min_samples_split': 5, 'n_estimators': 100}




Running experiments for extratrees with params: {'max_depth': None, 'min_samples_split': 5, 'n_estimators': 200}




Running experiments for extratrees with params: {'max_depth': 20, 'min_samples_split': 2, 'n_estimators': 100}




Running experiments for extratrees with params: {'max_depth': 20, 'min_samples_split': 2, 'n_estimators': 200}




Running experiments for extratrees with params: {'max_depth': 20, 'min_samples_split': 5, 'n_estimators': 100}




Running experiments for extratrees with params: {'max_depth': 20, 'min_samples_split': 5, 'n_estimators': 200}




Running experiments for gaussiannb with params: {'var_smoothing': 1e-09}
Running experiments for gaussiannb with params: {'var_smoothing': 1e-08}
Running experiments for gaussiannb with params: {'var_smoothing': 1e-10}
Running experiments for adaboost with params: {'learning_rate': 0.1, 'n_estimators': 50}




Running experiments for adaboost with params: {'learning_rate': 0.1, 'n_estimators': 100}




Running experiments for adaboost with params: {'learning_rate': 1.0, 'n_estimators': 50}




Running experiments for adaboost with params: {'learning_rate': 1.0, 'n_estimators': 100}




Running experiments for logisticregression with params: {'C': 0.1, 'solver': 'liblinear'}
Running experiments for logisticregression with params: {'C': 0.1, 'solver': 'lbfgs'}




Running experiments for logisticregression with params: {'C': 1, 'solver': 'liblinear'}
Running experiments for logisticregression with params: {'C': 1, 'solver': 'lbfgs'}




Running experiments for logisticregression with params: {'C': 10, 'solver': 'liblinear'}
Running experiments for logisticregression with params: {'C': 10, 'solver': 'lbfgs'}




Running experiments for kneighbors with params: {'n_neighbors': 5, 'weights': 'uniform'}
Running experiments for kneighbors with params: {'n_neighbors': 5, 'weights': 'distance'}




Running experiments for kneighbors with params: {'n_neighbors': 10, 'weights': 'uniform'}
Running experiments for kneighbors with params: {'n_neighbors': 10, 'weights': 'distance'}




Running experiments for kneighbors with params: {'n_neighbors': 15, 'weights': 'uniform'}
Running experiments for kneighbors with params: {'n_neighbors': 15, 'weights': 'distance'}




Running experiments for lgbm with params: {'learning_rate': 0.1, 'n_estimators': 100, 'num_leaves': 31}
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.001494 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 11061
[LightGBM] [Info] Number of data points in the train set: 3016, number of used features: 45
[LightGBM] [Info] Start training from score -1.099939
[LightGBM] [Info] Start training from score -1.104932
[LightGBM] [Info] Start training from score -1.091015
Running experiments for lgbm with params: {'learning_rate': 0.1, 'n_estimators': 100, 'num_leaves': 64}
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.001169 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 11061
[LightGBM] [Info] Number of data points in the train set: 3016, number of used features: 45
[LightGBM] [Info] Start training from score -1.09993



Running experiments for svm with params: {'C': 0.1, 'gamma': 'scale', 'kernel': 'rbf'}




Running experiments for svm with params: {'C': 0.1, 'gamma': 'auto', 'kernel': 'linear'}




Running experiments for svm with params: {'C': 0.1, 'gamma': 'auto', 'kernel': 'rbf'}




Running experiments for svm with params: {'C': 1, 'gamma': 'scale', 'kernel': 'linear'}




Running experiments for svm with params: {'C': 1, 'gamma': 'scale', 'kernel': 'rbf'}




Running experiments for svm with params: {'C': 1, 'gamma': 'auto', 'kernel': 'linear'}




Running experiments for svm with params: {'C': 1, 'gamma': 'auto', 'kernel': 'rbf'}




Running experiments for svm with params: {'C': 10, 'gamma': 'scale', 'kernel': 'linear'}




Running experiments for svm with params: {'C': 10, 'gamma': 'scale', 'kernel': 'rbf'}




Running experiments for svm with params: {'C': 10, 'gamma': 'auto', 'kernel': 'linear'}




Running experiments for svm with params: {'C': 10, 'gamma': 'auto', 'kernel': 'rbf'}




Running experiments for randomforest with params: {'max_depth': None, 'min_samples_split': 2, 'n_estimators': 100}




Running experiments for randomforest with params: {'max_depth': None, 'min_samples_split': 2, 'n_estimators': 200}




Running experiments for randomforest with params: {'max_depth': None, 'min_samples_split': 2, 'n_estimators': 300}




Running experiments for randomforest with params: {'max_depth': None, 'min_samples_split': 5, 'n_estimators': 100}




Running experiments for randomforest with params: {'max_depth': None, 'min_samples_split': 5, 'n_estimators': 200}




Running experiments for randomforest with params: {'max_depth': None, 'min_samples_split': 5, 'n_estimators': 300}




Running experiments for randomforest with params: {'max_depth': 10, 'min_samples_split': 2, 'n_estimators': 100}




Running experiments for randomforest with params: {'max_depth': 10, 'min_samples_split': 2, 'n_estimators': 200}




Running experiments for randomforest with params: {'max_depth': 10, 'min_samples_split': 2, 'n_estimators': 300}




Running experiments for randomforest with params: {'max_depth': 10, 'min_samples_split': 5, 'n_estimators': 100}




Running experiments for randomforest with params: {'max_depth': 10, 'min_samples_split': 5, 'n_estimators': 200}




Running experiments for randomforest with params: {'max_depth': 10, 'min_samples_split': 5, 'n_estimators': 300}




Running experiments for randomforest with params: {'max_depth': 20, 'min_samples_split': 2, 'n_estimators': 100}




Running experiments for randomforest with params: {'max_depth': 20, 'min_samples_split': 2, 'n_estimators': 200}




Running experiments for randomforest with params: {'max_depth': 20, 'min_samples_split': 2, 'n_estimators': 300}




Running experiments for randomforest with params: {'max_depth': 20, 'min_samples_split': 5, 'n_estimators': 100}




Running experiments for randomforest with params: {'max_depth': 20, 'min_samples_split': 5, 'n_estimators': 200}




Running experiments for randomforest with params: {'max_depth': 20, 'min_samples_split': 5, 'n_estimators': 300}




Running experiments for gradientboosting with params: {'learning_rate': 0.1, 'max_depth': 3, 'n_estimators': 100}




Running experiments for gradientboosting with params: {'learning_rate': 0.1, 'max_depth': 3, 'n_estimators': 200}




Running experiments for gradientboosting with params: {'learning_rate': 0.1, 'max_depth': 5, 'n_estimators': 100}




Running experiments for gradientboosting with params: {'learning_rate': 0.1, 'max_depth': 5, 'n_estimators': 200}




Running experiments for gradientboosting with params: {'learning_rate': 0.05, 'max_depth': 3, 'n_estimators': 100}




Running experiments for gradientboosting with params: {'learning_rate': 0.05, 'max_depth': 3, 'n_estimators': 200}




Running experiments for gradientboosting with params: {'learning_rate': 0.05, 'max_depth': 5, 'n_estimators': 100}




Running experiments for gradientboosting with params: {'learning_rate': 0.05, 'max_depth': 5, 'n_estimators': 200}




Running experiments for extratrees with params: {'max_depth': None, 'min_samples_split': 2, 'n_estimators': 100}




Running experiments for extratrees with params: {'max_depth': None, 'min_samples_split': 2, 'n_estimators': 200}




Running experiments for extratrees with params: {'max_depth': None, 'min_samples_split': 5, 'n_estimators': 100}




Running experiments for extratrees with params: {'max_depth': None, 'min_samples_split': 5, 'n_estimators': 200}




Running experiments for extratrees with params: {'max_depth': 20, 'min_samples_split': 2, 'n_estimators': 100}




Running experiments for extratrees with params: {'max_depth': 20, 'min_samples_split': 2, 'n_estimators': 200}




Running experiments for extratrees with params: {'max_depth': 20, 'min_samples_split': 5, 'n_estimators': 100}




Running experiments for extratrees with params: {'max_depth': 20, 'min_samples_split': 5, 'n_estimators': 200}




Running experiments for gaussiannb with params: {'var_smoothing': 1e-09}
Running experiments for gaussiannb with params: {'var_smoothing': 1e-08}
Running experiments for gaussiannb with params: {'var_smoothing': 1e-10}
Running experiments for adaboost with params: {'learning_rate': 0.1, 'n_estimators': 50}




Running experiments for adaboost with params: {'learning_rate': 0.1, 'n_estimators': 100}




Running experiments for adaboost with params: {'learning_rate': 1.0, 'n_estimators': 50}




Running experiments for adaboost with params: {'learning_rate': 1.0, 'n_estimators': 100}




Running experiments for logisticregression with params: {'C': 0.1, 'solver': 'liblinear'}




Running experiments for logisticregression with params: {'C': 0.1, 'solver': 'lbfgs'}
Running experiments for logisticregression with params: {'C': 1, 'solver': 'liblinear'}




Running experiments for logisticregression with params: {'C': 1, 'solver': 'lbfgs'}
Running experiments for logisticregression with params: {'C': 10, 'solver': 'liblinear'}




Running experiments for logisticregression with params: {'C': 10, 'solver': 'lbfgs'}
Running experiments for kneighbors with params: {'n_neighbors': 5, 'weights': 'uniform'}
Running experiments for kneighbors with params: {'n_neighbors': 5, 'weights': 'distance'}
Running experiments for kneighbors with params: {'n_neighbors': 10, 'weights': 'uniform'}




Running experiments for kneighbors with params: {'n_neighbors': 10, 'weights': 'distance'}




Running experiments for kneighbors with params: {'n_neighbors': 15, 'weights': 'uniform'}




Running experiments for kneighbors with params: {'n_neighbors': 15, 'weights': 'distance'}




Running experiments for lgbm with params: {'learning_rate': 0.1, 'n_estimators': 100, 'num_leaves': 31}
[LightGBM] [Info] Number of positive: 3576, number of negative: 3506
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.003591 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 11413
[LightGBM] [Info] Number of data points in the train set: 7082, number of used features: 45
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.504942 -> initscore=0.019769
[LightGBM] [Info] Start training from score 0.019769
Running experiments for lgbm with params: {'learning_rate': 0.1, 'n_estimators': 100, 'num_leaves': 64}
[LightGBM] [Info] Number of positive: 3576, number of negative: 3506
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.003233 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 11413
[LightGBM] [Info] Number of data poi



Running experiments for svm with params: {'C': 0.1, 'gamma': 'scale', 'kernel': 'rbf'}




Running experiments for svm with params: {'C': 0.1, 'gamma': 'auto', 'kernel': 'linear'}




Running experiments for svm with params: {'C': 0.1, 'gamma': 'auto', 'kernel': 'rbf'}




Running experiments for svm with params: {'C': 1, 'gamma': 'scale', 'kernel': 'linear'}




Running experiments for svm with params: {'C': 1, 'gamma': 'scale', 'kernel': 'rbf'}




Running experiments for svm with params: {'C': 1, 'gamma': 'auto', 'kernel': 'linear'}




Running experiments for svm with params: {'C': 1, 'gamma': 'auto', 'kernel': 'rbf'}




Running experiments for svm with params: {'C': 10, 'gamma': 'scale', 'kernel': 'linear'}




Running experiments for svm with params: {'C': 10, 'gamma': 'scale', 'kernel': 'rbf'}




Running experiments for svm with params: {'C': 10, 'gamma': 'auto', 'kernel': 'linear'}




Running experiments for svm with params: {'C': 10, 'gamma': 'auto', 'kernel': 'rbf'}




Running experiments for randomforest with params: {'max_depth': None, 'min_samples_split': 2, 'n_estimators': 100}




Running experiments for randomforest with params: {'max_depth': None, 'min_samples_split': 2, 'n_estimators': 200}




Running experiments for randomforest with params: {'max_depth': None, 'min_samples_split': 2, 'n_estimators': 300}




Running experiments for randomforest with params: {'max_depth': None, 'min_samples_split': 5, 'n_estimators': 100}




Running experiments for randomforest with params: {'max_depth': None, 'min_samples_split': 5, 'n_estimators': 200}




Running experiments for randomforest with params: {'max_depth': None, 'min_samples_split': 5, 'n_estimators': 300}




Running experiments for randomforest with params: {'max_depth': 10, 'min_samples_split': 2, 'n_estimators': 100}




Running experiments for randomforest with params: {'max_depth': 10, 'min_samples_split': 2, 'n_estimators': 200}




Running experiments for randomforest with params: {'max_depth': 10, 'min_samples_split': 2, 'n_estimators': 300}




Running experiments for randomforest with params: {'max_depth': 10, 'min_samples_split': 5, 'n_estimators': 100}




Running experiments for randomforest with params: {'max_depth': 10, 'min_samples_split': 5, 'n_estimators': 200}




Running experiments for randomforest with params: {'max_depth': 10, 'min_samples_split': 5, 'n_estimators': 300}




Running experiments for randomforest with params: {'max_depth': 20, 'min_samples_split': 2, 'n_estimators': 100}




Running experiments for randomforest with params: {'max_depth': 20, 'min_samples_split': 2, 'n_estimators': 200}




Running experiments for randomforest with params: {'max_depth': 20, 'min_samples_split': 2, 'n_estimators': 300}




Running experiments for randomforest with params: {'max_depth': 20, 'min_samples_split': 5, 'n_estimators': 100}




Running experiments for randomforest with params: {'max_depth': 20, 'min_samples_split': 5, 'n_estimators': 200}




Running experiments for randomforest with params: {'max_depth': 20, 'min_samples_split': 5, 'n_estimators': 300}




Running experiments for gradientboosting with params: {'learning_rate': 0.1, 'max_depth': 3, 'n_estimators': 100}




Running experiments for gradientboosting with params: {'learning_rate': 0.1, 'max_depth': 3, 'n_estimators': 200}




Running experiments for gradientboosting with params: {'learning_rate': 0.1, 'max_depth': 5, 'n_estimators': 100}




Running experiments for gradientboosting with params: {'learning_rate': 0.1, 'max_depth': 5, 'n_estimators': 200}




Running experiments for gradientboosting with params: {'learning_rate': 0.05, 'max_depth': 3, 'n_estimators': 100}




Running experiments for gradientboosting with params: {'learning_rate': 0.05, 'max_depth': 3, 'n_estimators': 200}




Running experiments for gradientboosting with params: {'learning_rate': 0.05, 'max_depth': 5, 'n_estimators': 100}




Running experiments for gradientboosting with params: {'learning_rate': 0.05, 'max_depth': 5, 'n_estimators': 200}




Running experiments for extratrees with params: {'max_depth': None, 'min_samples_split': 2, 'n_estimators': 100}




Running experiments for extratrees with params: {'max_depth': None, 'min_samples_split': 2, 'n_estimators': 200}




Running experiments for extratrees with params: {'max_depth': None, 'min_samples_split': 5, 'n_estimators': 100}




Running experiments for extratrees with params: {'max_depth': None, 'min_samples_split': 5, 'n_estimators': 200}




Running experiments for extratrees with params: {'max_depth': 20, 'min_samples_split': 2, 'n_estimators': 100}




Running experiments for extratrees with params: {'max_depth': 20, 'min_samples_split': 2, 'n_estimators': 200}




Running experiments for extratrees with params: {'max_depth': 20, 'min_samples_split': 5, 'n_estimators': 100}




Running experiments for extratrees with params: {'max_depth': 20, 'min_samples_split': 5, 'n_estimators': 200}




Running experiments for gaussiannb with params: {'var_smoothing': 1e-09}
Running experiments for gaussiannb with params: {'var_smoothing': 1e-08}
Running experiments for gaussiannb with params: {'var_smoothing': 1e-10}
Running experiments for adaboost with params: {'learning_rate': 0.1, 'n_estimators': 50}




Running experiments for adaboost with params: {'learning_rate': 0.1, 'n_estimators': 100}




Running experiments for adaboost with params: {'learning_rate': 1.0, 'n_estimators': 50}




Running experiments for adaboost with params: {'learning_rate': 1.0, 'n_estimators': 100}




Running experiments for logisticregression with params: {'C': 0.1, 'solver': 'liblinear'}
Running experiments for logisticregression with params: {'C': 0.1, 'solver': 'lbfgs'}




Running experiments for logisticregression with params: {'C': 1, 'solver': 'liblinear'}




Running experiments for logisticregression with params: {'C': 1, 'solver': 'lbfgs'}
Running experiments for logisticregression with params: {'C': 10, 'solver': 'liblinear'}




Running experiments for logisticregression with params: {'C': 10, 'solver': 'lbfgs'}
Running experiments for kneighbors with params: {'n_neighbors': 5, 'weights': 'uniform'}
Running experiments for kneighbors with params: {'n_neighbors': 5, 'weights': 'distance'}
Running experiments for kneighbors with params: {'n_neighbors': 10, 'weights': 'uniform'}




Running experiments for kneighbors with params: {'n_neighbors': 10, 'weights': 'distance'}
Running experiments for kneighbors with params: {'n_neighbors': 15, 'weights': 'uniform'}




Running experiments for kneighbors with params: {'n_neighbors': 15, 'weights': 'distance'}
Running experiments for lgbm with params: {'learning_rate': 0.1, 'n_estimators': 100, 'num_leaves': 31}
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.001440 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 11829
[LightGBM] [Info] Number of data points in the train set: 3002, number of used features: 48
[LightGBM] [Info] Start training from score -1.090319
[LightGBM] [Info] Start training from score -1.098279
[LightGBM] [Info] Start training from score -1.107311




Running experiments for lgbm with params: {'learning_rate': 0.1, 'n_estimators': 100, 'num_leaves': 64}
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.001537 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 11829
[LightGBM] [Info] Number of data points in the train set: 3002, number of used features: 48
[LightGBM] [Info] Start training from score -1.090319
[LightGBM] [Info] Start training from score -1.098279
[LightGBM] [Info] Start training from score -1.107311
Running experiments for lgbm with params: {'learning_rate': 0.1, 'n_estimators': 200, 'num_leaves': 31}
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.001327 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 11829
[LightGBM] [Info] Number of data points in the train set: 3002, number of used features: 48
[LightGBM] [Info] Start training from score -1.09031

In [6]:
# Flatten the nested `results` mapping (dataset id -> research question ->
# list of per-experiment result dicts) into one flat record per experiment.
rows = []

# NOTE: the inner mapping is bound to `rq_results`, not `rqs`. `rqs` is the
# notebook-level list of research-question ids passed to
# `gd.collect_all_rqs_data`; reusing that name here would silently replace it
# with a results dict and break a re-run of the data-collection cell.
for ds, rq_results in results.items():
    for rq, experiments in rq_results.items():
        for experiment_result in experiments:
            rows.append({
                'Dataset': ds,
                'RQ': rq,
                'Window Size': ws,
                'Hop Length': hl,
                # Datasets 1-5 and 7 record the correlation threshold; every
                # other dataset id records the PCA dimension instead.
                'Corr Tres/ PCA Dim': ct if ds in [1, 2, 3, 4, 5, 7] else pca,
                'Model': experiment_result['model_name'],
                # Stored as text so the parameter dict fits in a single column.
                'Parameter': str(experiment_result['parameters']),
                'F1 Score': experiment_result['f1'],
                'Accuracy': experiment_result['accuracy'],
                'Precision': experiment_result['precision'],
                'Recall': experiment_result['recall']
            })

# Build the DataFrame once from the collected records.
df_results = pd.DataFrame(rows)
df_results.shape

(924, 11)

In [7]:
def update_csv_with_new_rows(csv_path, new_data_df):
    """Merge ``new_data_df`` into the CSV at ``csv_path``, dropping duplicate rows.

    The existing file (if any) is read, the new rows are appended after the
    existing ones, fully identical rows are removed, and the result is written
    back to ``csv_path`` without the index column.

    Parameters
    ----------
    csv_path : str or path-like
        Location of the CSV file to update. A missing or zero-byte file is
        treated as "no previous results" and the file is (re)created.
    new_data_df : pandas.DataFrame
        Rows to add to the file.

    Returns
    -------
    None
        The function only has side effects: it prints ``read <csv_path>`` when
        an existing file was loaded, and it overwrites ``csv_path``.
    """
    try:
        # "round_trip" makes floats written by `to_csv` parse back to exactly
        # the same value, so rows from a repeated run compare equal to the
        # stored ones and are actually removed by `drop_duplicates`.
        existing_data_df = pd.read_csv(csv_path, float_precision="round_trip")
        print("read",csv_path)
    except (FileNotFoundError, pd.errors.EmptyDataError):
        # No file yet, or a zero-byte file: nothing to merge with.
        existing_data_df = None

    # Only concatenate frames that really exist; this avoids mixing in a
    # column-less placeholder DataFrame.
    frames = [new_data_df] if existing_data_df is None else [existing_data_df, new_data_df]
    combined_df = pd.concat(frames, ignore_index=True).drop_duplicates()

    combined_df.to_csv(csv_path, index=False)

In [8]:
# Append this run's rows to the cumulative results file; the path is relative
# to the notebook's working directory.
results_file = "results.csv"
update_csv_with_new_rows(csv_path=results_file, new_data_df=df_results)

read results.csv
