# Programming environment

In [1]:
# Define the seed for reproducibility.
# NOTE: this used to be spelled `2024-9-10`, which Python evaluates as the
# integer subtraction 2024 - 9 - 10 (= 2005), not as a date. The literal
# value is written out so the effective seed is explicit and unchanged.
seed = 2005

In [2]:
# Load existing functions from libraries
from sklearn.metrics import mean_squared_error, make_scorer, precision_score

In [3]:
# Load custom functions from utils.py
from utils import train_and_save_model, load_and_predict, compute_shap_values

IProgress not found. Please update jupyter and ipywidgets. See https://ipywidgets.readthedocs.io/en/stable/user_install.html


In [4]:
from sklearn.linear_model import LogisticRegression
from sklearn.ensemble import RandomForestClassifier, GradientBoostingClassifier
from sklearn.svm import SVC
from sklearn.neural_network import MLPClassifier

# Adding the required numpy import for parameter scaling
import numpy as np

# Define models and their parameter grids.
# Each entry maps a model name to a dict holding the base estimator ('model')
# and the hyper-parameter grid to search over ('param_grid').
#
# Every estimator whose fit is stochastic receives `random_state=seed` (the
# notebook-level seed defined in the first cell) so repeated runs produce the
# same fitted models. LogisticRegression is left unseeded on purpose: with
# solver='lbfgs' scikit-learn does not use random_state.
models_and_params = {
    'LogisticRegression': {
        'model': LogisticRegression(penalty='l2', solver='lbfgs', max_iter=1000),
        'param_grid': {
            'C': np.logspace(-4, 4, 10)  # Regularization strength for logistic regression
        }
    },
    'RandomForest': {
        'model': RandomForestClassifier(min_samples_split=20, max_features=None, random_state=seed),
        'param_grid': {
            'n_estimators': [100, 200, 300],  # Number of trees in the forest
            'max_depth': [3, 5, 10]  # Maximum depth of the tree
        }
    },
    'GradientBoosting': {
        'model': GradientBoostingClassifier(learning_rate=0.01, random_state=seed),
        'param_grid': {
            'n_estimators': [100, 200, 300],  # Number of boosting stages to perform
            'max_depth': [3, 5, 10]  # Maximum depth of the individual regression estimators
        }
    },
    'DeepNeuralNetwork': {
        # solver='sgd' shuffles samples and uses random weight initialisation,
        # so this estimator is the most sensitive to an unset random_state.
        'model': MLPClassifier(
            max_iter=1000,
            hidden_layer_sizes=(50, 50),
            activation='relu',
            solver='sgd',
            learning_rate_init=0.001,
            random_state=seed,
        ),
        'param_grid': {
            'alpha': np.logspace(-4, 4, 10)  # L2 penalty (regularization term) parameter
        }
    }
}

In [5]:
import shap

# SHAP explainer class for each model name; the keys mirror those of
# `models_and_params`, and the selected class is handed to compute_shap_values.
explainers = dict(
    LogisticRegression=shap.LinearExplainer,
    RandomForest=shap.TreeExplainer,
    GradientBoosting=shap.TreeExplainer,
    DeepNeuralNetwork=shap.KernelExplainer,
)

# Predictive modeling

## Survival prediction

In [6]:
# Train and save the model, then save predictions for the train/validation/test splits.
prefix, model_name, model_dir = 'survive_baseline1_rr', 'LogisticRegression', 'model'
train_and_save_model(prefix, models_and_params[model_name], model_dir)

output_type = 'probability'
for split_name in ('train', 'validation', 'test'):
    load_and_predict(prefix, split_name, output_type, model_dir)

Scaler saved at inst/extdata/model/survive_baseline1_rr_scaler.joblib
Model saved at inst/extdata/model/survive_baseline1_rr_best_model.joblib
Results saved at inst/extdata/model/survive_baseline1_rr_train_prob.csv
Results saved at inst/extdata/model/survive_baseline1_rr_validation_prob.csv
Results saved at inst/extdata/model/survive_baseline1_rr_test_prob.csv


In [6]:
# Save predictions of the stored model for the independent test set.
prefix, model_name, model_dir = 'survive_baseline1_rr', 'LogisticRegression', 'model'
output_type = 'probability'
load_and_predict(prefix, 'independent_test', output_type, model_dir)

Results saved at inst/extdata/model/survive_baseline1_rr_independent_test_prob.csv


In [6]:
# Compute SHAP values on the training split using the explainer mapped to this model.
prefix, model_name, model_dir = 'survive_baseline1_rr', 'LogisticRegression', 'model'
compute_shap_values(prefix, 'train', explainers[model_name], model_dir)

Results saved at inst/extdata/model/survive_baseline1_rr_train_shap_values.csv


In [8]:
# Train and save the model, then save predictions for the train/validation/test splits.
prefix, model_name, model_dir = 'survive_stack_rr', 'LogisticRegression', 'model'
train_and_save_model(prefix, models_and_params[model_name], model_dir)

output_type = 'probability'
for split_name in ('train', 'validation', 'test'):
    load_and_predict(prefix, split_name, output_type, model_dir)

Scaler saved at inst/extdata/model/survive_stack_rr_scaler.joblib
Model saved at inst/extdata/model/survive_stack_rr_best_model.joblib
Results saved at inst/extdata/model/survive_stack_rr_train_prob.csv
Results saved at inst/extdata/model/survive_stack_rr_validation_prob.csv
Results saved at inst/extdata/model/survive_stack_rr_test_prob.csv


In [7]:
# Save predictions of the stored model for the independent test set.
prefix, model_name, model_dir = 'survive_stack_rr', 'LogisticRegression', 'model'
output_type = 'probability'
load_and_predict(prefix, 'independent_test', output_type, model_dir)

Results saved at inst/extdata/model/survive_stack_rr_independent_test_prob.csv


In [9]:
# Train and save the model, then save predictions for the train/validation/test splits.
prefix, model_name, model_dir = 'survive_stack_rf', 'RandomForest', 'model'
train_and_save_model(prefix, models_and_params[model_name], model_dir)

output_type = 'probability'
for split_name in ('train', 'validation', 'test'):
    load_and_predict(prefix, split_name, output_type, model_dir)

Scaler saved at inst/extdata/model/survive_stack_rf_scaler.joblib
Model saved at inst/extdata/model/survive_stack_rf_best_model.joblib
Results saved at inst/extdata/model/survive_stack_rf_train_prob.csv
Results saved at inst/extdata/model/survive_stack_rf_validation_prob.csv
Results saved at inst/extdata/model/survive_stack_rf_test_prob.csv


In [8]:
# Save predictions of the stored model for the independent test set.
prefix, model_name, model_dir = 'survive_stack_rf', 'RandomForest', 'model'
output_type = 'probability'
load_and_predict(prefix, 'independent_test', output_type, model_dir)

Results saved at inst/extdata/model/survive_stack_rf_independent_test_prob.csv


In [10]:
# Train and save the model, then save predictions for the train/validation/test splits.
prefix, model_name, model_dir = 'survive_stack_gbm', 'GradientBoosting', 'model'
train_and_save_model(prefix, models_and_params[model_name], model_dir)

output_type = 'probability'
for split_name in ('train', 'validation', 'test'):
    load_and_predict(prefix, split_name, output_type, model_dir)

Scaler saved at inst/extdata/model/survive_stack_gbm_scaler.joblib
Model saved at inst/extdata/model/survive_stack_gbm_best_model.joblib
Results saved at inst/extdata/model/survive_stack_gbm_train_prob.csv
Results saved at inst/extdata/model/survive_stack_gbm_validation_prob.csv
Results saved at inst/extdata/model/survive_stack_gbm_test_prob.csv


In [9]:
# Save predictions of the stored model for the independent test set.
prefix, model_name, model_dir = 'survive_stack_gbm', 'GradientBoosting', 'model'
output_type = 'probability'
load_and_predict(prefix, 'independent_test', output_type, model_dir)

Results saved at inst/extdata/model/survive_stack_gbm_independent_test_prob.csv


In [11]:
# Train and save the model, then save predictions for the train/validation/test splits.
prefix, model_name, model_dir = 'survive_stack_dnn', 'DeepNeuralNetwork', 'model'
train_and_save_model(prefix, models_and_params[model_name], model_dir)

output_type = 'probability'
for split_name in ('train', 'validation', 'test'):
    load_and_predict(prefix, split_name, output_type, model_dir)

Scaler saved at inst/extdata/model/survive_stack_dnn_scaler.joblib
Model saved at inst/extdata/model/survive_stack_dnn_best_model.joblib
Results saved at inst/extdata/model/survive_stack_dnn_train_prob.csv
Results saved at inst/extdata/model/survive_stack_dnn_validation_prob.csv
Results saved at inst/extdata/model/survive_stack_dnn_test_prob.csv


In [10]:
# Save predictions of the stored model for the independent test set.
prefix, model_name, model_dir = 'survive_stack_dnn', 'DeepNeuralNetwork', 'model'
output_type = 'probability'
load_and_predict(prefix, 'independent_test', output_type, model_dir)

Results saved at inst/extdata/model/survive_stack_dnn_independent_test_prob.csv


In [7]:
# Compute SHAP values on the training split using the explainer mapped to this model.
# The recorded output shows a multi-minute progress bar for this cell.
prefix, model_name, model_dir = 'survive_stack_dnn', 'DeepNeuralNetwork', 'model'
compute_shap_values(prefix, 'train', explainers[model_name], model_dir)

100%|█| 20551/20551 [07:45<00:00, 44.11it/


Results saved at inst/extdata/model/survive_stack_dnn_train_shap_values.csv


## Severe ROP prediction

In [12]:
# Train and save the model, then save predictions for the train/validation/test splits.
prefix, model_name, model_dir = 'rop_severe_stack_rr', 'LogisticRegression', 'model'

# Precision scorer passed as `scoring`; zero_division=0 yields a score of 0
# when precision is undefined (no positive predictions).
custom_precision = make_scorer(precision_score, zero_division=0)
train_and_save_model(prefix, models_and_params[model_name], model_dir, scoring=custom_precision)

output_type = 'probability'
for split_name in ('train', 'validation', 'test'):
    load_and_predict(prefix, split_name, output_type, model_dir)

Scaler saved at inst/extdata/model/rop_severe_stack_rr_scaler.joblib
Model saved at inst/extdata/model/rop_severe_stack_rr_best_model.joblib
Results saved at inst/extdata/model/rop_severe_stack_rr_train_prob.csv
Results saved at inst/extdata/model/rop_severe_stack_rr_validation_prob.csv
Results saved at inst/extdata/model/rop_severe_stack_rr_test_prob.csv


In [11]:
# Save predictions of the stored model for the independent test set.
prefix, model_name, model_dir = 'rop_severe_stack_rr', 'LogisticRegression', 'model'
output_type = 'probability'
load_and_predict(prefix, 'independent_test', output_type, model_dir)

Results saved at inst/extdata/model/rop_severe_stack_rr_independent_test_prob.csv


In [7]:
# Compute SHAP values on the training split using the explainer mapped to this model.
prefix, model_name, model_dir = 'rop_severe_stack_rr', 'LogisticRegression', 'model'
compute_shap_values(prefix, 'train', explainers[model_name], model_dir)

Results saved at inst/extdata/model/rop_severe_stack_rr_train_shap_values.csv


In [13]:
# Train and save the model, then save predictions for the train/validation/test splits.
prefix, model_name, model_dir = 'rop_severe_stack_rf', 'RandomForest', 'model'

# Precision scorer passed as `scoring`; zero_division=0 yields a score of 0
# when precision is undefined (no positive predictions).
custom_precision = make_scorer(precision_score, zero_division=0)
train_and_save_model(prefix, models_and_params[model_name], model_dir, scoring=custom_precision)

output_type = 'probability'
for split_name in ('train', 'validation', 'test'):
    load_and_predict(prefix, split_name, output_type, model_dir)

Scaler saved at inst/extdata/model/rop_severe_stack_rf_scaler.joblib
Model saved at inst/extdata/model/rop_severe_stack_rf_best_model.joblib
Results saved at inst/extdata/model/rop_severe_stack_rf_train_prob.csv
Results saved at inst/extdata/model/rop_severe_stack_rf_validation_prob.csv
Results saved at inst/extdata/model/rop_severe_stack_rf_test_prob.csv


In [12]:
# Save predictions of the stored model for the independent test set.
prefix, model_name, model_dir = 'rop_severe_stack_rf', 'RandomForest', 'model'
output_type = 'probability'
load_and_predict(prefix, 'independent_test', output_type, model_dir)

Results saved at inst/extdata/model/rop_severe_stack_rf_independent_test_prob.csv


In [14]:
# Train and save the model, then save predictions for the train/validation/test splits.
prefix, model_name, model_dir = 'rop_severe_stack_gbm', 'GradientBoosting', 'model'

# Precision scorer passed as `scoring`; zero_division=0 yields a score of 0
# when precision is undefined (no positive predictions).
custom_precision = make_scorer(precision_score, zero_division=0)
train_and_save_model(prefix, models_and_params[model_name], model_dir, scoring=custom_precision)

output_type = 'probability'
for split_name in ('train', 'validation', 'test'):
    load_and_predict(prefix, split_name, output_type, model_dir)

Scaler saved at inst/extdata/model/rop_severe_stack_gbm_scaler.joblib
Model saved at inst/extdata/model/rop_severe_stack_gbm_best_model.joblib
Results saved at inst/extdata/model/rop_severe_stack_gbm_train_prob.csv
Results saved at inst/extdata/model/rop_severe_stack_gbm_validation_prob.csv
Results saved at inst/extdata/model/rop_severe_stack_gbm_test_prob.csv


In [13]:
# Save predictions of the stored model for the independent test set.
prefix, model_name, model_dir = 'rop_severe_stack_gbm', 'GradientBoosting', 'model'
output_type = 'probability'
load_and_predict(prefix, 'independent_test', output_type, model_dir)

Results saved at inst/extdata/model/rop_severe_stack_gbm_independent_test_prob.csv


In [15]:
# Train and save the model, then save predictions for the train/validation/test splits.
prefix, model_name, model_dir = 'rop_severe_stack_dnn', 'DeepNeuralNetwork', 'model'

# Precision scorer passed as `scoring`; zero_division=0 yields a score of 0
# when precision is undefined (no positive predictions).
custom_precision = make_scorer(precision_score, zero_division=0)
train_and_save_model(prefix, models_and_params[model_name], model_dir, scoring=custom_precision)

output_type = 'probability'
for split_name in ('train', 'validation', 'test'):
    load_and_predict(prefix, split_name, output_type, model_dir)

Scaler saved at inst/extdata/model/rop_severe_stack_dnn_scaler.joblib
Model saved at inst/extdata/model/rop_severe_stack_dnn_best_model.joblib
Results saved at inst/extdata/model/rop_severe_stack_dnn_train_prob.csv
Results saved at inst/extdata/model/rop_severe_stack_dnn_validation_prob.csv
Results saved at inst/extdata/model/rop_severe_stack_dnn_test_prob.csv


In [14]:
# Save predictions of the stored model for the independent test set.
prefix, model_name, model_dir = 'rop_severe_stack_dnn', 'DeepNeuralNetwork', 'model'
output_type = 'probability'
load_and_predict(prefix, 'independent_test', output_type, model_dir)

Results saved at inst/extdata/model/rop_severe_stack_dnn_independent_test_prob.csv


## BPD prediction

In [17]:
# Train and save the model, then save predictions for the train/validation/test splits.
prefix, model_name, model_dir = 'bpd_stack_rr', 'LogisticRegression', 'model'
train_and_save_model(prefix, models_and_params[model_name], model_dir)

output_type = 'probability'
for split_name in ('train', 'validation', 'test'):
    load_and_predict(prefix, split_name, output_type, model_dir)

Scaler saved at inst/extdata/model/bpd_stack_rr_scaler.joblib
Model saved at inst/extdata/model/bpd_stack_rr_best_model.joblib
Results saved at inst/extdata/model/bpd_stack_rr_train_prob.csv
Results saved at inst/extdata/model/bpd_stack_rr_validation_prob.csv
Results saved at inst/extdata/model/bpd_stack_rr_test_prob.csv


In [15]:
# Save predictions of the stored model for the independent test set.
prefix, model_name, model_dir = 'bpd_stack_rr', 'LogisticRegression', 'model'
output_type = 'probability'
load_and_predict(prefix, 'independent_test', output_type, model_dir)

Results saved at inst/extdata/model/bpd_stack_rr_independent_test_prob.csv


In [18]:
# Train and save the model, then save predictions for the train/validation/test splits.
prefix, model_name, model_dir = 'bpd_stack_rf', 'RandomForest', 'model'
train_and_save_model(prefix, models_and_params[model_name], model_dir)

output_type = 'probability'
for split_name in ('train', 'validation', 'test'):
    load_and_predict(prefix, split_name, output_type, model_dir)

Scaler saved at inst/extdata/model/bpd_stack_rf_scaler.joblib
Model saved at inst/extdata/model/bpd_stack_rf_best_model.joblib
Results saved at inst/extdata/model/bpd_stack_rf_train_prob.csv
Results saved at inst/extdata/model/bpd_stack_rf_validation_prob.csv
Results saved at inst/extdata/model/bpd_stack_rf_test_prob.csv


In [16]:
# Save predictions of the stored model for the independent test set.
prefix, model_name, model_dir = 'bpd_stack_rf', 'RandomForest', 'model'
output_type = 'probability'
load_and_predict(prefix, 'independent_test', output_type, model_dir)

Results saved at inst/extdata/model/bpd_stack_rf_independent_test_prob.csv


In [9]:
# Compute SHAP values on the training split using the explainer mapped to this model.
prefix, model_name, model_dir = 'bpd_stack_rf', 'RandomForest', 'model'
compute_shap_values(prefix, 'train', explainers[model_name], model_dir)

Results saved at inst/extdata/model/bpd_stack_rf_train_shap_values.csv


In [19]:
# Train and save the model, then save predictions for the train/validation/test splits.
prefix, model_name, model_dir = 'bpd_stack_gbm', 'GradientBoosting', 'model'
train_and_save_model(prefix, models_and_params[model_name], model_dir)

output_type = 'probability'
for split_name in ('train', 'validation', 'test'):
    load_and_predict(prefix, split_name, output_type, model_dir)

Scaler saved at inst/extdata/model/bpd_stack_gbm_scaler.joblib
Model saved at inst/extdata/model/bpd_stack_gbm_best_model.joblib
Results saved at inst/extdata/model/bpd_stack_gbm_train_prob.csv
Results saved at inst/extdata/model/bpd_stack_gbm_validation_prob.csv
Results saved at inst/extdata/model/bpd_stack_gbm_test_prob.csv


In [17]:
# Save predictions of the stored model for the independent test set.
prefix, model_name, model_dir = 'bpd_stack_gbm', 'GradientBoosting', 'model'
output_type = 'probability'
load_and_predict(prefix, 'independent_test', output_type, model_dir)

Results saved at inst/extdata/model/bpd_stack_gbm_independent_test_prob.csv


In [20]:
# Train and save the model, then save predictions for the train/validation/test splits.
prefix, model_name, model_dir = 'bpd_stack_dnn', 'DeepNeuralNetwork', 'model'

# Precision scorer passed as `scoring`; zero_division=0 yields a score of 0
# when precision is undefined (no positive predictions).
# NOTE(review): the bpd_stack_rr/rf/gbm cells call train_and_save_model without
# a `scoring` argument -- confirm the different metric here is intentional.
custom_precision = make_scorer(precision_score, zero_division=0)
train_and_save_model(prefix, models_and_params[model_name], model_dir, scoring=custom_precision)

output_type = 'probability'
for split_name in ('train', 'validation', 'test'):
    load_and_predict(prefix, split_name, output_type, model_dir)

Scaler saved at inst/extdata/model/bpd_stack_dnn_scaler.joblib




Model saved at inst/extdata/model/bpd_stack_dnn_best_model.joblib
Results saved at inst/extdata/model/bpd_stack_dnn_train_prob.csv
Results saved at inst/extdata/model/bpd_stack_dnn_validation_prob.csv
Results saved at inst/extdata/model/bpd_stack_dnn_test_prob.csv


In [18]:
# Save predictions of the stored model for the independent test set.
prefix, model_name, model_dir = 'bpd_stack_dnn', 'DeepNeuralNetwork', 'model'
output_type = 'probability'
load_and_predict(prefix, 'independent_test', output_type, model_dir)

Results saved at inst/extdata/model/bpd_stack_dnn_independent_test_prob.csv


## Moderate/severe BPD prediction

In [22]:
# Train and save the model, then save predictions for the train/validation/test splits.
prefix, model_name, model_dir = 'bpd_moderate_severe_stack_rr', 'LogisticRegression', 'model'
train_and_save_model(prefix, models_and_params[model_name], model_dir)

output_type = 'probability'
for split_name in ('train', 'validation', 'test'):
    load_and_predict(prefix, split_name, output_type, model_dir)

Scaler saved at inst/extdata/model/bpd_moderate_severe_stack_rr_scaler.joblib
Model saved at inst/extdata/model/bpd_moderate_severe_stack_rr_best_model.joblib
Results saved at inst/extdata/model/bpd_moderate_severe_stack_rr_train_prob.csv
Results saved at inst/extdata/model/bpd_moderate_severe_stack_rr_validation_prob.csv
Results saved at inst/extdata/model/bpd_moderate_severe_stack_rr_test_prob.csv


In [19]:
# Save predictions of the stored model for the independent test set.
prefix, model_name, model_dir = 'bpd_moderate_severe_stack_rr', 'LogisticRegression', 'model'
output_type = 'probability'
load_and_predict(prefix, 'independent_test', output_type, model_dir)

Results saved at inst/extdata/model/bpd_moderate_severe_stack_rr_independent_test_prob.csv


In [23]:
# Train and save the model, then save predictions for the train/validation/test splits.
prefix, model_name, model_dir = 'bpd_moderate_severe_stack_rf', 'RandomForest', 'model'
train_and_save_model(prefix, models_and_params[model_name], model_dir)

output_type = 'probability'
for split_name in ('train', 'validation', 'test'):
    load_and_predict(prefix, split_name, output_type, model_dir)

Scaler saved at inst/extdata/model/bpd_moderate_severe_stack_rf_scaler.joblib
Model saved at inst/extdata/model/bpd_moderate_severe_stack_rf_best_model.joblib
Results saved at inst/extdata/model/bpd_moderate_severe_stack_rf_train_prob.csv
Results saved at inst/extdata/model/bpd_moderate_severe_stack_rf_validation_prob.csv
Results saved at inst/extdata/model/bpd_moderate_severe_stack_rf_test_prob.csv


In [20]:
# Save predictions of the stored model for the independent test set.
prefix, model_name, model_dir = 'bpd_moderate_severe_stack_rf', 'RandomForest', 'model'
output_type = 'probability'
load_and_predict(prefix, 'independent_test', output_type, model_dir)

Results saved at inst/extdata/model/bpd_moderate_severe_stack_rf_independent_test_prob.csv


In [10]:
# Compute SHAP values on the training split using the explainer mapped to this model.
prefix, model_name, model_dir = 'bpd_moderate_severe_stack_rf', 'RandomForest', 'model'
compute_shap_values(prefix, 'train', explainers[model_name], model_dir)

Results saved at inst/extdata/model/bpd_moderate_severe_stack_rf_train_shap_values.csv


In [24]:
# Train and save the model, then save predictions for the train/validation/test splits.
prefix, model_name, model_dir = 'bpd_moderate_severe_stack_gbm', 'GradientBoosting', 'model'
train_and_save_model(prefix, models_and_params[model_name], model_dir)

output_type = 'probability'
for split_name in ('train', 'validation', 'test'):
    load_and_predict(prefix, split_name, output_type, model_dir)

Scaler saved at inst/extdata/model/bpd_moderate_severe_stack_gbm_scaler.joblib
Model saved at inst/extdata/model/bpd_moderate_severe_stack_gbm_best_model.joblib
Results saved at inst/extdata/model/bpd_moderate_severe_stack_gbm_train_prob.csv
Results saved at inst/extdata/model/bpd_moderate_severe_stack_gbm_validation_prob.csv
Results saved at inst/extdata/model/bpd_moderate_severe_stack_gbm_test_prob.csv


In [21]:
# Save predictions of the stored model for the independent test set.
prefix, model_name, model_dir = 'bpd_moderate_severe_stack_gbm', 'GradientBoosting', 'model'
output_type = 'probability'
load_and_predict(prefix, 'independent_test', output_type, model_dir)

Results saved at inst/extdata/model/bpd_moderate_severe_stack_gbm_independent_test_prob.csv


In [25]:
# Train and save the model, then save predictions for the train/validation/test splits.
prefix, model_name, model_dir = 'bpd_moderate_severe_stack_dnn', 'DeepNeuralNetwork', 'model'

# Precision scorer passed as `scoring`; zero_division=0 yields a score of 0
# when precision is undefined (no positive predictions).
# NOTE(review): the bpd_moderate_severe_stack_rr/rf/gbm cells call
# train_and_save_model without a `scoring` argument -- confirm the different
# metric here is intentional.
custom_precision = make_scorer(precision_score, zero_division=0)
train_and_save_model(prefix, models_and_params[model_name], model_dir, scoring=custom_precision)

output_type = 'probability'
for split_name in ('train', 'validation', 'test'):
    load_and_predict(prefix, split_name, output_type, model_dir)

Scaler saved at inst/extdata/model/bpd_moderate_severe_stack_dnn_scaler.joblib




Model saved at inst/extdata/model/bpd_moderate_severe_stack_dnn_best_model.joblib
Results saved at inst/extdata/model/bpd_moderate_severe_stack_dnn_train_prob.csv
Results saved at inst/extdata/model/bpd_moderate_severe_stack_dnn_validation_prob.csv
Results saved at inst/extdata/model/bpd_moderate_severe_stack_dnn_test_prob.csv


In [22]:
# Save predictions of the stored model for the independent test set.
prefix, model_name, model_dir = 'bpd_moderate_severe_stack_dnn', 'DeepNeuralNetwork', 'model'
output_type = 'probability'
load_and_predict(prefix, 'independent_test', output_type, model_dir)

Results saved at inst/extdata/model/bpd_moderate_severe_stack_dnn_independent_test_prob.csv


## EUGR-HC prediction

In [27]:
# Train and save the model, then save predictions for the train/validation/test splits.
prefix, model_name, model_dir = 'eugr_hc_baseline2_rr', 'LogisticRegression', 'model'

# Precision scorer passed as `scoring`; zero_division=0 yields a score of 0
# when precision is undefined (no positive predictions).
custom_precision = make_scorer(precision_score, zero_division=0)
train_and_save_model(prefix, models_and_params[model_name], model_dir, scoring=custom_precision)

output_type = 'probability'
for split_name in ('train', 'validation', 'test'):
    load_and_predict(prefix, split_name, output_type, model_dir)

Scaler saved at inst/extdata/model/eugr_hc_baseline2_rr_scaler.joblib
Model saved at inst/extdata/model/eugr_hc_baseline2_rr_best_model.joblib
Results saved at inst/extdata/model/eugr_hc_baseline2_rr_train_prob.csv
Results saved at inst/extdata/model/eugr_hc_baseline2_rr_validation_prob.csv
Results saved at inst/extdata/model/eugr_hc_baseline2_rr_test_prob.csv


In [23]:
# Save predictions of the stored model for the independent test set.
prefix, model_name, model_dir = 'eugr_hc_baseline2_rr', 'LogisticRegression', 'model'
output_type = 'probability'
load_and_predict(prefix, 'independent_test', output_type, model_dir)

Results saved at inst/extdata/model/eugr_hc_baseline2_rr_independent_test_prob.csv


In [8]:
# Compute SHAP values on the training split using the explainer mapped to this model.
prefix, model_name, model_dir = 'eugr_hc_baseline2_rr', 'LogisticRegression', 'model'
compute_shap_values(prefix, 'train', explainers[model_name], model_dir)

Results saved at inst/extdata/model/eugr_hc_baseline2_rr_train_shap_values.csv


In [29]:
# Train and save the model, then save predictions for the train/validation/test splits.
prefix, model_name, model_dir = 'eugr_hc_stack1_rr', 'LogisticRegression', 'model'
train_and_save_model(prefix, models_and_params[model_name], model_dir)

output_type = 'probability'
for split_name in ('train', 'validation', 'test'):
    load_and_predict(prefix, split_name, output_type, model_dir)

Scaler saved at inst/extdata/model/eugr_hc_stack1_rr_scaler.joblib
Model saved at inst/extdata/model/eugr_hc_stack1_rr_best_model.joblib
Results saved at inst/extdata/model/eugr_hc_stack1_rr_train_prob.csv
Results saved at inst/extdata/model/eugr_hc_stack1_rr_validation_prob.csv
Results saved at inst/extdata/model/eugr_hc_stack1_rr_test_prob.csv


In [24]:
# Save predictions of the stored model for the independent test set.
prefix, model_name, model_dir = 'eugr_hc_stack1_rr', 'LogisticRegression', 'model'
output_type = 'probability'
load_and_predict(prefix, 'independent_test', output_type, model_dir)

Results saved at inst/extdata/model/eugr_hc_stack1_rr_independent_test_prob.csv


In [30]:
# Train and save the model, then save predictions for the train/validation/test splits.
prefix, model_name, model_dir = 'eugr_hc_stack1_rf', 'RandomForest', 'model'
train_and_save_model(prefix, models_and_params[model_name], model_dir)

output_type = 'probability'
for split_name in ('train', 'validation', 'test'):
    load_and_predict(prefix, split_name, output_type, model_dir)

Scaler saved at inst/extdata/model/eugr_hc_stack1_rf_scaler.joblib
Model saved at inst/extdata/model/eugr_hc_stack1_rf_best_model.joblib
Results saved at inst/extdata/model/eugr_hc_stack1_rf_train_prob.csv
Results saved at inst/extdata/model/eugr_hc_stack1_rf_validation_prob.csv
Results saved at inst/extdata/model/eugr_hc_stack1_rf_test_prob.csv


In [25]:
# Save predictions of the stored model for the independent test set.
prefix, model_name, model_dir = 'eugr_hc_stack1_rf', 'RandomForest', 'model'
output_type = 'probability'
load_and_predict(prefix, 'independent_test', output_type, model_dir)

Results saved at inst/extdata/model/eugr_hc_stack1_rf_independent_test_prob.csv


In [31]:
# Train and save the model, then save predictions for the train/validation/test splits.
prefix, model_name, model_dir = 'eugr_hc_stack1_gbm', 'GradientBoosting', 'model'

# Precision scorer passed as `scoring`; zero_division=0 yields a score of 0
# when precision is undefined (no positive predictions).
# NOTE(review): the eugr_hc_stack1_rr/rf cells call train_and_save_model
# without a `scoring` argument -- confirm the different metric here is intentional.
custom_precision = make_scorer(precision_score, zero_division=0)
train_and_save_model(prefix, models_and_params[model_name], model_dir, scoring=custom_precision)

output_type = 'probability'
for split_name in ('train', 'validation', 'test'):
    load_and_predict(prefix, split_name, output_type, model_dir)

Scaler saved at inst/extdata/model/eugr_hc_stack1_gbm_scaler.joblib
Model saved at inst/extdata/model/eugr_hc_stack1_gbm_best_model.joblib
Results saved at inst/extdata/model/eugr_hc_stack1_gbm_train_prob.csv
Results saved at inst/extdata/model/eugr_hc_stack1_gbm_validation_prob.csv
Results saved at inst/extdata/model/eugr_hc_stack1_gbm_test_prob.csv


In [26]:
# Save predictions of the stored model for the independent test set.
prefix, model_name, model_dir = 'eugr_hc_stack1_gbm', 'GradientBoosting', 'model'
output_type = 'probability'
load_and_predict(prefix, 'independent_test', output_type, model_dir)

Results saved at inst/extdata/model/eugr_hc_stack1_gbm_independent_test_prob.csv


In [32]:
# Train and save the model, then save predictions for the train/validation/test splits.
prefix, model_name, model_dir = 'eugr_hc_stack1_dnn', 'DeepNeuralNetwork', 'model'

# Precision scorer passed as `scoring`; zero_division=0 yields a score of 0
# when precision is undefined (no positive predictions).
# NOTE(review): the eugr_hc_stack1_rr/rf cells call train_and_save_model
# without a `scoring` argument -- confirm the different metric here is intentional.
custom_precision = make_scorer(precision_score, zero_division=0)
train_and_save_model(prefix, models_and_params[model_name], model_dir, scoring=custom_precision)

output_type = 'probability'
for split_name in ('train', 'validation', 'test'):
    load_and_predict(prefix, split_name, output_type, model_dir)

Scaler saved at inst/extdata/model/eugr_hc_stack1_dnn_scaler.joblib
Model saved at inst/extdata/model/eugr_hc_stack1_dnn_best_model.joblib
Results saved at inst/extdata/model/eugr_hc_stack1_dnn_train_prob.csv
Results saved at inst/extdata/model/eugr_hc_stack1_dnn_validation_prob.csv
Results saved at inst/extdata/model/eugr_hc_stack1_dnn_test_prob.csv


In [27]:
# Save predictions of the stored model for the independent test set.
prefix, model_name, model_dir = 'eugr_hc_stack1_dnn', 'DeepNeuralNetwork', 'model'
output_type = 'probability'
load_and_predict(prefix, 'independent_test', output_type, model_dir)

Results saved at inst/extdata/model/eugr_hc_stack1_dnn_independent_test_prob.csv


In [12]:
# Compute SHAP values on the training split using the explainer mapped to this model.
# The recorded output shows a multi-minute progress bar for this cell.
prefix, model_name, model_dir = 'eugr_hc_stack1_dnn', 'DeepNeuralNetwork', 'model'
compute_shap_values(prefix, 'train', explainers[model_name], model_dir)

100%|█| 19950/19950 [08:05<00:00, 41.08it/


Results saved at inst/extdata/model/eugr_hc_stack1_dnn_train_shap_values.csv


In [34]:
# Train and save the model, then save predictions for the train/validation/test splits.
prefix, model_name, model_dir = 'eugr_hc_stack_rr', 'LogisticRegression', 'model'
train_and_save_model(prefix, models_and_params[model_name], model_dir)

output_type = 'probability'
for split_name in ('train', 'validation', 'test'):
    load_and_predict(prefix, split_name, output_type, model_dir)

Scaler saved at inst/extdata/model/eugr_hc_stack_rr_scaler.joblib
Model saved at inst/extdata/model/eugr_hc_stack_rr_best_model.joblib
Results saved at inst/extdata/model/eugr_hc_stack_rr_train_prob.csv
Results saved at inst/extdata/model/eugr_hc_stack_rr_validation_prob.csv
Results saved at inst/extdata/model/eugr_hc_stack_rr_test_prob.csv


In [28]:
# Save predictions of the stored model for the independent test set.
prefix, model_name, model_dir = 'eugr_hc_stack_rr', 'LogisticRegression', 'model'
output_type = 'probability'
load_and_predict(prefix, 'independent_test', output_type, model_dir)

Results saved at inst/extdata/model/eugr_hc_stack_rr_independent_test_prob.csv


In [9]:
# Compute SHAP values on the training split using the explainer mapped to this model.
prefix, model_name, model_dir = 'eugr_hc_stack_rr', 'LogisticRegression', 'model'
compute_shap_values(prefix, 'train', explainers[model_name], model_dir)

Results saved at inst/extdata/model/eugr_hc_stack_rr_train_shap_values.csv


In [35]:
# Train and save the model, then save predictions for the train/validation/test splits.
prefix, model_name, model_dir = 'eugr_hc_stack_rf', 'RandomForest', 'model'
train_and_save_model(prefix, models_and_params[model_name], model_dir)

output_type = 'probability'
for split_name in ('train', 'validation', 'test'):
    load_and_predict(prefix, split_name, output_type, model_dir)

Scaler saved at inst/extdata/model/eugr_hc_stack_rf_scaler.joblib
Model saved at inst/extdata/model/eugr_hc_stack_rf_best_model.joblib
Results saved at inst/extdata/model/eugr_hc_stack_rf_train_prob.csv
Results saved at inst/extdata/model/eugr_hc_stack_rf_validation_prob.csv
Results saved at inst/extdata/model/eugr_hc_stack_rf_test_prob.csv


In [29]:
# Save predictions of the stored model for the independent test set.
prefix, model_name, model_dir = 'eugr_hc_stack_rf', 'RandomForest', 'model'
output_type = 'probability'
load_and_predict(prefix, 'independent_test', output_type, model_dir)

Results saved at inst/extdata/model/eugr_hc_stack_rf_independent_test_prob.csv


In [36]:
# Train and save the model, then save predictions for the train/validation/test splits.
prefix, model_name, model_dir = 'eugr_hc_stack_gbm', 'GradientBoosting', 'model'
train_and_save_model(prefix, models_and_params[model_name], model_dir)

output_type = 'probability'
for split_name in ('train', 'validation', 'test'):
    load_and_predict(prefix, split_name, output_type, model_dir)

Scaler saved at inst/extdata/model/eugr_hc_stack_gbm_scaler.joblib
Model saved at inst/extdata/model/eugr_hc_stack_gbm_best_model.joblib
Results saved at inst/extdata/model/eugr_hc_stack_gbm_train_prob.csv
Results saved at inst/extdata/model/eugr_hc_stack_gbm_validation_prob.csv
Results saved at inst/extdata/model/eugr_hc_stack_gbm_test_prob.csv


In [30]:
# Save predictions of the stored model for the independent test set.
prefix, model_name, model_dir = 'eugr_hc_stack_gbm', 'GradientBoosting', 'model'
output_type = 'probability'
load_and_predict(prefix, 'independent_test', output_type, model_dir)

Results saved at inst/extdata/model/eugr_hc_stack_gbm_independent_test_prob.csv


In [37]:
# Train and save the model, then save predictions for the train/validation/test splits.
prefix, model_name, model_dir = 'eugr_hc_stack_dnn', 'DeepNeuralNetwork', 'model'

# Precision scorer passed as `scoring`; zero_division=0 yields a score of 0
# when precision is undefined (no positive predictions).
# NOTE(review): the eugr_hc_stack_rr/rf/gbm cells call train_and_save_model
# without a `scoring` argument -- confirm the different metric here is intentional.
custom_precision = make_scorer(precision_score, zero_division=0)
train_and_save_model(prefix, models_and_params[model_name], model_dir, scoring=custom_precision)

output_type = 'probability'
for split_name in ('train', 'validation', 'test'):
    load_and_predict(prefix, split_name, output_type, model_dir)

Scaler saved at inst/extdata/model/eugr_hc_stack_dnn_scaler.joblib
Model saved at inst/extdata/model/eugr_hc_stack_dnn_best_model.joblib
Results saved at inst/extdata/model/eugr_hc_stack_dnn_train_prob.csv
Results saved at inst/extdata/model/eugr_hc_stack_dnn_validation_prob.csv
Results saved at inst/extdata/model/eugr_hc_stack_dnn_test_prob.csv


In [31]:
# Save predictions of the stored model for the independent test set.
prefix, model_name, model_dir = 'eugr_hc_stack_dnn', 'DeepNeuralNetwork', 'model'
output_type = 'probability'
load_and_predict(prefix, 'independent_test', output_type, model_dir)

Results saved at inst/extdata/model/eugr_hc_stack_dnn_independent_test_prob.csv


## EUGR-BW prediction

In [39]:
# Train and save the model, then save predictions for the train/validation/test splits.
prefix, model_name, model_dir = 'eugr_bw_baseline2_rr', 'LogisticRegression', 'model'

# Precision scorer passed as `scoring`; zero_division=0 yields a score of 0
# when precision is undefined (no positive predictions).
custom_precision = make_scorer(precision_score, zero_division=0)
train_and_save_model(prefix, models_and_params[model_name], model_dir, scoring=custom_precision)

output_type = 'probability'
for split_name in ('train', 'validation', 'test'):
    load_and_predict(prefix, split_name, output_type, model_dir)

Scaler saved at inst/extdata/model/eugr_bw_baseline2_rr_scaler.joblib
Model saved at inst/extdata/model/eugr_bw_baseline2_rr_best_model.joblib
Results saved at inst/extdata/model/eugr_bw_baseline2_rr_train_prob.csv
Results saved at inst/extdata/model/eugr_bw_baseline2_rr_validation_prob.csv
Results saved at inst/extdata/model/eugr_bw_baseline2_rr_test_prob.csv


In [32]:
# Export predicted probabilities for the 'independent_test' split of
# eugr_bw_baseline2_rr. model_name is not read in this cell; it is still
# assigned so the notebook namespace ends up exactly as before.
prefix, model_name, model_dir = 'eugr_bw_baseline2_rr', 'LogisticRegression', 'model'
output_type = 'probability'

load_and_predict(prefix, 'independent_test', output_type, model_dir)

Results saved at inst/extdata/model/eugr_bw_baseline2_rr_independent_test_prob.csv


In [10]:
# Compute SHAP values on the 'train' split of eugr_bw_baseline2_rr, using the
# explainer registered under model_name (explainers comes from an earlier cell).
prefix, model_name, model_dir = 'eugr_bw_baseline2_rr', 'LogisticRegression', 'model'

compute_shap_values(
    prefix,
    'train',
    explainers[model_name],
    model_dir,
)

Results saved at inst/extdata/model/eugr_bw_baseline2_rr_train_shap_values.csv


In [41]:
# Train and save the 'LogisticRegression' configuration for eugr_bw_stack1_rr,
# then export probabilities for the train/validation/test splits.
prefix, model_name, model_dir = 'eugr_bw_stack1_rr', 'LogisticRegression', 'model'

# Precision scorer handed to the training helper; zero_division=0 scores a
# case with no positive predictions as 0 instead of emitting a warning.
custom_precision = make_scorer(precision_score, zero_division=0)
train_and_save_model(
    prefix,
    models_and_params[model_name],
    model_dir,
    scoring=custom_precision,
)

output_type = 'probability'
for split_name in ('train', 'validation', 'test'):
    load_and_predict(prefix, split_name, output_type, model_dir)

Scaler saved at inst/extdata/model/eugr_bw_stack1_rr_scaler.joblib
Model saved at inst/extdata/model/eugr_bw_stack1_rr_best_model.joblib
Results saved at inst/extdata/model/eugr_bw_stack1_rr_train_prob.csv
Results saved at inst/extdata/model/eugr_bw_stack1_rr_validation_prob.csv
Results saved at inst/extdata/model/eugr_bw_stack1_rr_test_prob.csv


In [33]:
# Export predicted probabilities for the 'independent_test' split of
# eugr_bw_stack1_rr. model_name is not read in this cell; it is still
# assigned so the notebook namespace ends up exactly as before.
prefix, model_name, model_dir = 'eugr_bw_stack1_rr', 'LogisticRegression', 'model'
output_type = 'probability'

load_and_predict(prefix, 'independent_test', output_type, model_dir)

Results saved at inst/extdata/model/eugr_bw_stack1_rr_independent_test_prob.csv


In [42]:
# Train and save the 'RandomForest' configuration for eugr_bw_stack1_rf,
# then export probabilities for the train/validation/test splits.
prefix, model_name, model_dir = 'eugr_bw_stack1_rf', 'RandomForest', 'model'

# Precision scorer handed to the training helper; zero_division=0 scores a
# case with no positive predictions as 0 instead of emitting a warning.
custom_precision = make_scorer(precision_score, zero_division=0)
train_and_save_model(
    prefix,
    models_and_params[model_name],
    model_dir,
    scoring=custom_precision,
)

output_type = 'probability'
for split_name in ('train', 'validation', 'test'):
    load_and_predict(prefix, split_name, output_type, model_dir)

Scaler saved at inst/extdata/model/eugr_bw_stack1_rf_scaler.joblib
Model saved at inst/extdata/model/eugr_bw_stack1_rf_best_model.joblib
Results saved at inst/extdata/model/eugr_bw_stack1_rf_train_prob.csv
Results saved at inst/extdata/model/eugr_bw_stack1_rf_validation_prob.csv
Results saved at inst/extdata/model/eugr_bw_stack1_rf_test_prob.csv


In [34]:
# Export predicted probabilities for the 'independent_test' split of
# eugr_bw_stack1_rf. model_name is not read in this cell; it is still
# assigned so the notebook namespace ends up exactly as before.
prefix, model_name, model_dir = 'eugr_bw_stack1_rf', 'RandomForest', 'model'
output_type = 'probability'

load_and_predict(prefix, 'independent_test', output_type, model_dir)

Results saved at inst/extdata/model/eugr_bw_stack1_rf_independent_test_prob.csv


In [43]:
# Train and save the 'GradientBoosting' configuration for eugr_bw_stack1_gbm,
# then export probabilities for the train/validation/test splits.
prefix, model_name, model_dir = 'eugr_bw_stack1_gbm', 'GradientBoosting', 'model'

# Precision scorer handed to the training helper; zero_division=0 scores a
# case with no positive predictions as 0 instead of emitting a warning.
custom_precision = make_scorer(precision_score, zero_division=0)
train_and_save_model(
    prefix,
    models_and_params[model_name],
    model_dir,
    scoring=custom_precision,
)

output_type = 'probability'
for split_name in ('train', 'validation', 'test'):
    load_and_predict(prefix, split_name, output_type, model_dir)

Scaler saved at inst/extdata/model/eugr_bw_stack1_gbm_scaler.joblib
Model saved at inst/extdata/model/eugr_bw_stack1_gbm_best_model.joblib
Results saved at inst/extdata/model/eugr_bw_stack1_gbm_train_prob.csv
Results saved at inst/extdata/model/eugr_bw_stack1_gbm_validation_prob.csv
Results saved at inst/extdata/model/eugr_bw_stack1_gbm_test_prob.csv


In [35]:
# Export predicted probabilities for the 'independent_test' split of
# eugr_bw_stack1_gbm. model_name is not read in this cell; it is still
# assigned so the notebook namespace ends up exactly as before.
prefix, model_name, model_dir = 'eugr_bw_stack1_gbm', 'GradientBoosting', 'model'
output_type = 'probability'

load_and_predict(prefix, 'independent_test', output_type, model_dir)

Results saved at inst/extdata/model/eugr_bw_stack1_gbm_independent_test_prob.csv


In [44]:
# Train and save the 'DeepNeuralNetwork' configuration for eugr_bw_stack1_dnn,
# then export probabilities for the train/validation/test splits.
prefix, model_name, model_dir = 'eugr_bw_stack1_dnn', 'DeepNeuralNetwork', 'model'

# Precision scorer handed to the training helper; zero_division=0 scores a
# case with no positive predictions as 0 instead of emitting a warning.
custom_precision = make_scorer(precision_score, zero_division=0)
train_and_save_model(
    prefix,
    models_and_params[model_name],
    model_dir,
    scoring=custom_precision,
)

output_type = 'probability'
for split_name in ('train', 'validation', 'test'):
    load_and_predict(prefix, split_name, output_type, model_dir)

Scaler saved at inst/extdata/model/eugr_bw_stack1_dnn_scaler.joblib
Model saved at inst/extdata/model/eugr_bw_stack1_dnn_best_model.joblib
Results saved at inst/extdata/model/eugr_bw_stack1_dnn_train_prob.csv
Results saved at inst/extdata/model/eugr_bw_stack1_dnn_validation_prob.csv
Results saved at inst/extdata/model/eugr_bw_stack1_dnn_test_prob.csv


In [36]:
# Export predicted probabilities for the 'independent_test' split of
# eugr_bw_stack1_dnn. model_name is not read in this cell; it is still
# assigned so the notebook namespace ends up exactly as before.
prefix, model_name, model_dir = 'eugr_bw_stack1_dnn', 'DeepNeuralNetwork', 'model'
output_type = 'probability'

load_and_predict(prefix, 'independent_test', output_type, model_dir)

Results saved at inst/extdata/model/eugr_bw_stack1_dnn_independent_test_prob.csv


In [18]:
# Compute SHAP values on the 'train' split of eugr_bw_stack1_dnn, using the
# explainer registered under model_name (explainers comes from an earlier cell).
# The recorded progress bar shows this run took roughly eight minutes.
prefix, model_name, model_dir = 'eugr_bw_stack1_dnn', 'DeepNeuralNetwork', 'model'

compute_shap_values(
    prefix,
    'train',
    explainers[model_name],
    model_dir,
)

100%|█| 19950/19950 [08:12<00:00, 40.50it/


Results saved at inst/extdata/model/eugr_bw_stack1_dnn_train_shap_values.csv


In [46]:
# Train and save the 'LogisticRegression' configuration for eugr_bw_stack_rr,
# then export probabilities for the train/validation/test splits.
prefix, model_name, model_dir = 'eugr_bw_stack_rr', 'LogisticRegression', 'model'

# Precision scorer handed to the training helper; zero_division=0 scores a
# case with no positive predictions as 0 instead of emitting a warning.
custom_precision = make_scorer(precision_score, zero_division=0)
train_and_save_model(
    prefix,
    models_and_params[model_name],
    model_dir,
    scoring=custom_precision,
)

output_type = 'probability'
for split_name in ('train', 'validation', 'test'):
    load_and_predict(prefix, split_name, output_type, model_dir)

Scaler saved at inst/extdata/model/eugr_bw_stack_rr_scaler.joblib
Model saved at inst/extdata/model/eugr_bw_stack_rr_best_model.joblib
Results saved at inst/extdata/model/eugr_bw_stack_rr_train_prob.csv
Results saved at inst/extdata/model/eugr_bw_stack_rr_validation_prob.csv
Results saved at inst/extdata/model/eugr_bw_stack_rr_test_prob.csv


In [37]:
# Export predicted probabilities for the 'independent_test' split of
# eugr_bw_stack_rr. model_name is not read in this cell; it is still
# assigned so the notebook namespace ends up exactly as before.
prefix, model_name, model_dir = 'eugr_bw_stack_rr', 'LogisticRegression', 'model'
output_type = 'probability'

load_and_predict(prefix, 'independent_test', output_type, model_dir)

Results saved at inst/extdata/model/eugr_bw_stack_rr_independent_test_prob.csv


In [11]:
# Compute SHAP values on the 'train' split of eugr_bw_stack_rr, using the
# explainer registered under model_name (explainers comes from an earlier cell).
prefix, model_name, model_dir = 'eugr_bw_stack_rr', 'LogisticRegression', 'model'

compute_shap_values(
    prefix,
    'train',
    explainers[model_name],
    model_dir,
)

Results saved at inst/extdata/model/eugr_bw_stack_rr_train_shap_values.csv


In [47]:
# Train and save the 'RandomForest' configuration for eugr_bw_stack_rf,
# then export probabilities for the train/validation/test splits.
prefix, model_name, model_dir = 'eugr_bw_stack_rf', 'RandomForest', 'model'

# Precision scorer handed to the training helper; zero_division=0 scores a
# case with no positive predictions as 0 instead of emitting a warning.
custom_precision = make_scorer(precision_score, zero_division=0)
train_and_save_model(
    prefix,
    models_and_params[model_name],
    model_dir,
    scoring=custom_precision,
)

output_type = 'probability'
for split_name in ('train', 'validation', 'test'):
    load_and_predict(prefix, split_name, output_type, model_dir)

Scaler saved at inst/extdata/model/eugr_bw_stack_rf_scaler.joblib
Model saved at inst/extdata/model/eugr_bw_stack_rf_best_model.joblib
Results saved at inst/extdata/model/eugr_bw_stack_rf_train_prob.csv
Results saved at inst/extdata/model/eugr_bw_stack_rf_validation_prob.csv
Results saved at inst/extdata/model/eugr_bw_stack_rf_test_prob.csv


In [38]:
# Export predicted probabilities for the 'independent_test' split of
# eugr_bw_stack_rf. model_name is not read in this cell; it is still
# assigned so the notebook namespace ends up exactly as before.
prefix, model_name, model_dir = 'eugr_bw_stack_rf', 'RandomForest', 'model'
output_type = 'probability'

load_and_predict(prefix, 'independent_test', output_type, model_dir)

Results saved at inst/extdata/model/eugr_bw_stack_rf_independent_test_prob.csv


In [48]:
# Train and save the 'GradientBoosting' configuration for eugr_bw_stack_gbm,
# then export probabilities for the train/validation/test splits.
prefix, model_name, model_dir = 'eugr_bw_stack_gbm', 'GradientBoosting', 'model'

# Precision scorer handed to the training helper; zero_division=0 scores a
# case with no positive predictions as 0 instead of emitting a warning.
custom_precision = make_scorer(precision_score, zero_division=0)
train_and_save_model(
    prefix,
    models_and_params[model_name],
    model_dir,
    scoring=custom_precision,
)

output_type = 'probability'
for split_name in ('train', 'validation', 'test'):
    load_and_predict(prefix, split_name, output_type, model_dir)

Scaler saved at inst/extdata/model/eugr_bw_stack_gbm_scaler.joblib
Model saved at inst/extdata/model/eugr_bw_stack_gbm_best_model.joblib
Results saved at inst/extdata/model/eugr_bw_stack_gbm_train_prob.csv
Results saved at inst/extdata/model/eugr_bw_stack_gbm_validation_prob.csv
Results saved at inst/extdata/model/eugr_bw_stack_gbm_test_prob.csv


In [39]:
# Export predicted probabilities for the 'independent_test' split of
# eugr_bw_stack_gbm. model_name is not read in this cell; it is still
# assigned so the notebook namespace ends up exactly as before.
prefix, model_name, model_dir = 'eugr_bw_stack_gbm', 'GradientBoosting', 'model'
output_type = 'probability'

load_and_predict(prefix, 'independent_test', output_type, model_dir)

Results saved at inst/extdata/model/eugr_bw_stack_gbm_independent_test_prob.csv


In [49]:
# Train and save the 'DeepNeuralNetwork' configuration for eugr_bw_stack_dnn,
# then export probabilities for the train/validation/test splits.
prefix, model_name, model_dir = 'eugr_bw_stack_dnn', 'DeepNeuralNetwork', 'model'

# Precision scorer handed to the training helper; zero_division=0 scores a
# case with no positive predictions as 0 instead of emitting a warning.
custom_precision = make_scorer(precision_score, zero_division=0)
train_and_save_model(
    prefix,
    models_and_params[model_name],
    model_dir,
    scoring=custom_precision,
)

output_type = 'probability'
for split_name in ('train', 'validation', 'test'):
    load_and_predict(prefix, split_name, output_type, model_dir)

Scaler saved at inst/extdata/model/eugr_bw_stack_dnn_scaler.joblib
Model saved at inst/extdata/model/eugr_bw_stack_dnn_best_model.joblib
Results saved at inst/extdata/model/eugr_bw_stack_dnn_train_prob.csv
Results saved at inst/extdata/model/eugr_bw_stack_dnn_validation_prob.csv
Results saved at inst/extdata/model/eugr_bw_stack_dnn_test_prob.csv


In [40]:
# Export predicted probabilities for the 'independent_test' split of
# eugr_bw_stack_dnn. model_name is not read in this cell; it is still
# assigned so the notebook namespace ends up exactly as before.
prefix, model_name, model_dir = 'eugr_bw_stack_dnn', 'DeepNeuralNetwork', 'model'
output_type = 'probability'

load_and_predict(prefix, 'independent_test', output_type, model_dir)

Results saved at inst/extdata/model/eugr_bw_stack_dnn_independent_test_prob.csv


## Failed hearing test prediction

In [51]:
# Train and save the 'LogisticRegression' configuration for hearing_stack_rr,
# then export probabilities for the train/validation/test splits.
prefix, model_name, model_dir = 'hearing_stack_rr', 'LogisticRegression', 'model'

# Precision scorer handed to the training helper; zero_division=0 scores a
# case with no positive predictions as 0 instead of emitting a warning.
custom_precision = make_scorer(precision_score, zero_division=0)
train_and_save_model(
    prefix,
    models_and_params[model_name],
    model_dir,
    scoring=custom_precision,
)

output_type = 'probability'
for split_name in ('train', 'validation', 'test'):
    load_and_predict(prefix, split_name, output_type, model_dir)

Scaler saved at inst/extdata/model/hearing_stack_rr_scaler.joblib
Model saved at inst/extdata/model/hearing_stack_rr_best_model.joblib
Results saved at inst/extdata/model/hearing_stack_rr_train_prob.csv
Results saved at inst/extdata/model/hearing_stack_rr_validation_prob.csv
Results saved at inst/extdata/model/hearing_stack_rr_test_prob.csv


In [41]:
# Export predicted probabilities for the 'independent_test' split of
# hearing_stack_rr. model_name is not read in this cell; it is still
# assigned so the notebook namespace ends up exactly as before.
prefix, model_name, model_dir = 'hearing_stack_rr', 'LogisticRegression', 'model'
output_type = 'probability'

load_and_predict(prefix, 'independent_test', output_type, model_dir)

Results saved at inst/extdata/model/hearing_stack_rr_independent_test_prob.csv


In [12]:
# Compute SHAP values on the 'train' split of hearing_stack_rr, using the
# explainer registered under model_name (explainers comes from an earlier cell).
prefix, model_name, model_dir = 'hearing_stack_rr', 'LogisticRegression', 'model'

compute_shap_values(
    prefix,
    'train',
    explainers[model_name],
    model_dir,
)

Results saved at inst/extdata/model/hearing_stack_rr_train_shap_values.csv


In [52]:
# Train and save the 'RandomForest' configuration for hearing_stack_rf,
# then export probabilities for the train/validation/test splits.
prefix, model_name, model_dir = 'hearing_stack_rf', 'RandomForest', 'model'

# Precision scorer handed to the training helper; zero_division=0 scores a
# case with no positive predictions as 0 instead of emitting a warning.
custom_precision = make_scorer(precision_score, zero_division=0)
train_and_save_model(
    prefix,
    models_and_params[model_name],
    model_dir,
    scoring=custom_precision,
)

output_type = 'probability'
for split_name in ('train', 'validation', 'test'):
    load_and_predict(prefix, split_name, output_type, model_dir)

Scaler saved at inst/extdata/model/hearing_stack_rf_scaler.joblib
Model saved at inst/extdata/model/hearing_stack_rf_best_model.joblib
Results saved at inst/extdata/model/hearing_stack_rf_train_prob.csv
Results saved at inst/extdata/model/hearing_stack_rf_validation_prob.csv
Results saved at inst/extdata/model/hearing_stack_rf_test_prob.csv


In [42]:
# Export predicted probabilities for the 'independent_test' split of
# hearing_stack_rf. model_name is not read in this cell; it is still
# assigned so the notebook namespace ends up exactly as before.
prefix, model_name, model_dir = 'hearing_stack_rf', 'RandomForest', 'model'
output_type = 'probability'

load_and_predict(prefix, 'independent_test', output_type, model_dir)

Results saved at inst/extdata/model/hearing_stack_rf_independent_test_prob.csv


In [53]:
# Train and save the 'GradientBoosting' configuration for hearing_stack_gbm,
# then export probabilities for the train/validation/test splits.
prefix, model_name, model_dir = 'hearing_stack_gbm', 'GradientBoosting', 'model'

# Precision scorer handed to the training helper; zero_division=0 scores a
# case with no positive predictions as 0 instead of emitting a warning.
custom_precision = make_scorer(precision_score, zero_division=0)
train_and_save_model(
    prefix,
    models_and_params[model_name],
    model_dir,
    scoring=custom_precision,
)

output_type = 'probability'
for split_name in ('train', 'validation', 'test'):
    load_and_predict(prefix, split_name, output_type, model_dir)

Scaler saved at inst/extdata/model/hearing_stack_gbm_scaler.joblib
Model saved at inst/extdata/model/hearing_stack_gbm_best_model.joblib
Results saved at inst/extdata/model/hearing_stack_gbm_train_prob.csv
Results saved at inst/extdata/model/hearing_stack_gbm_validation_prob.csv
Results saved at inst/extdata/model/hearing_stack_gbm_test_prob.csv


In [43]:
# Export predicted probabilities for the 'independent_test' split of
# hearing_stack_gbm. model_name is not read in this cell; it is still
# assigned so the notebook namespace ends up exactly as before.
prefix, model_name, model_dir = 'hearing_stack_gbm', 'GradientBoosting', 'model'
output_type = 'probability'

load_and_predict(prefix, 'independent_test', output_type, model_dir)

Results saved at inst/extdata/model/hearing_stack_gbm_independent_test_prob.csv


In [54]:
# Train and save the 'DeepNeuralNetwork' configuration for hearing_stack_dnn,
# then export probabilities for the train/validation/test splits.
prefix, model_name, model_dir = 'hearing_stack_dnn', 'DeepNeuralNetwork', 'model'

# Precision scorer handed to the training helper; zero_division=0 scores a
# case with no positive predictions as 0 instead of emitting a warning.
custom_precision = make_scorer(precision_score, zero_division=0)
train_and_save_model(
    prefix,
    models_and_params[model_name],
    model_dir,
    scoring=custom_precision,
)

output_type = 'probability'
for split_name in ('train', 'validation', 'test'):
    load_and_predict(prefix, split_name, output_type, model_dir)

Scaler saved at inst/extdata/model/hearing_stack_dnn_scaler.joblib
Model saved at inst/extdata/model/hearing_stack_dnn_best_model.joblib
Results saved at inst/extdata/model/hearing_stack_dnn_train_prob.csv
Results saved at inst/extdata/model/hearing_stack_dnn_validation_prob.csv
Results saved at inst/extdata/model/hearing_stack_dnn_test_prob.csv


In [44]:
# Export predicted probabilities for the 'independent_test' split of
# hearing_stack_dnn. model_name is not read in this cell; it is still
# assigned so the notebook namespace ends up exactly as before.
prefix, model_name, model_dir = 'hearing_stack_dnn', 'DeepNeuralNetwork', 'model'
output_type = 'probability'

load_and_predict(prefix, 'independent_test', output_type, model_dir)

Results saved at inst/extdata/model/hearing_stack_dnn_independent_test_prob.csv
