# Programming environment

In [1]:
# Seed kept for reproducibility.
# NOTE(review): the value equals 2024 - 9 - 10. The date-like spelling `2024-9-10`
# is plain integer subtraction in Python, not a date, so it is written out here
# as the number it actually produces.
# NOTE(review): no cell visible in this notebook passes `seed` to anything;
# TODO confirm it is consumed wherever randomness is involved.
seed = 2005

In [2]:
# Load existing functions from libraries
from sklearn.metrics import mean_squared_error, make_scorer, precision_score

In [3]:
# Load custom functions from utils.py
from utils import train_and_save_model, load_and_predict

In [4]:
from sklearn.linear_model import LogisticRegression, Ridge
import numpy as np

# Candidate estimators and the hyper-parameter grid attached to each one.
# Both entries are L2-penalised linear models: a logistic-regression classifier
# and a ridge regressor. An entry is looked up by name and handed unchanged to
# train_and_save_model in the modelling cells.
models_and_params = dict(
    LogisticRegression=dict(
        model=LogisticRegression(penalty='l2', solver='lbfgs', max_iter=1000),
        # 10 log-spaced candidates for C, from 1e-4 to 1e4
        param_grid=dict(C=np.logspace(-4, 4, 10)),
    ),
    RidgeRegression=dict(
        model=Ridge(),
        # 10 log-spaced candidates for alpha, from 1e-4 to 1e4
        param_grid=dict(alpha=np.logspace(-4, 4, 10)),
    ),
)

# Predictive modeling

## Survival prediction

In [5]:
# Baseline survival model: train the logistic-regression entry of
# models_and_params, then write predictions for every data split.
model_dir = 'model'
model_name = 'LogisticRegression'
prefix = 'survive_baseline1'

# Per the recorded cell output, this step reports a saved scaler and a saved
# best model under the given prefix.
train_and_save_model(prefix, models_and_params[model_name], model_dir)

# 'probability' output; the recorded cell output lists files ending in "_prob.csv".
output_type = 'probability'
for split in ('train', 'validation', 'test'):
    load_and_predict(prefix, split, output_type, model_dir)

Scaler saved at inst/extdata/model/survive_baseline1_scaler.joblib
Model saved at inst/extdata/model/survive_baseline1_best_model.joblib
Results saved at inst/extdata/model/survive_baseline1_train_prob.csv
Results saved at inst/extdata/model/survive_baseline1_validation_prob.csv
Results saved at inst/extdata/model/survive_baseline1_test_prob.csv


In [6]:
# Model stored under the 'survive_residual1' prefix: train the ridge-regression
# entry of models_and_params as a regression task, then write predictions for
# every data split.
model_dir = 'model'
model_name = 'RidgeRegression'
prefix = 'survive_residual1'

# mean_squared_error is a loss; greater_is_better=False makes the scorer negate
# it, so a higher score corresponds to a lower error.
neg_mse_scorer = make_scorer(mean_squared_error, greater_is_better=False)
train_and_save_model(
    prefix,
    models_and_params[model_name],
    model_dir,
    scoring=neg_mse_scorer,
    task='regression',
)

# 'label' output; the recorded cell output lists files ending in "_predictions.csv".
output_type = 'label'
for split in ('train', 'validation', 'test'):
    load_and_predict(prefix, split, output_type, model_dir)

Scaler saved at inst/extdata/model/survive_residual1_scaler.joblib
Model saved at inst/extdata/model/survive_residual1_best_model.joblib
Results saved at inst/extdata/model/survive_residual1_train_predictions.csv
Results saved at inst/extdata/model/survive_residual1_validation_predictions.csv
Results saved at inst/extdata/model/survive_residual1_test_predictions.csv
