# Tune "train-smaller" convergent-clustering model decision thresholds on validation set, and report performance (with and without tuning) on test set

This notebook runs on the train-smaller + validation + test splits, not on the train + test splits.

Use trained model APIs to do this.

In [1]:
from malid import config
from malid.train.training_utils import (
    evaluate_original_and_tuned_on_test_set,
    tune_on_validation_set,
)
from malid.trained_model_wrappers import ConvergentClusterClassifier
from malid.datamodels import (
    combine_classification_option_names,
)

In [2]:
# For each gene locus: tune on the validation set via tune_on_validation_set,
# then evaluate the original and tuned classifiers on the test set.
for gene_locus in config.gene_loci_used:
    # One output directory per classification target, nested under this locus.
    # Output base dir should already exist.
    locus_output_dir = config.paths.convergent_clusters_output_dir / gene_locus.name
    map_targets_to_output_dir = {
        target_obs_column: locus_output_dir
        / combine_classification_option_names(target_obs_column)
        for target_obs_column in config.classification_targets
    }
    print(gene_locus)

    # Names of the models to tune; a fresh list is built on every iteration.
    model_names = [
        "lasso_multiclass",
        "lasso_cv",
        "ridge_cv",
        "elasticnet_cv",
        "rf_multiclass",
        "xgboost",
        "linearsvm_ovr",
    ]
    clfs = tune_on_validation_set(
        gene_locus=gene_locus,
        targets=map_targets_to_output_dir,
        model_names=model_names,
        model_class=ConvergentClusterClassifier,
    )

    # Evaluate on the test set, using the same target -> output dir mapping.
    evaluate_original_and_tuned_on_test_set(
        clfs=clfs,
        gene_locus=gene_locus,
        targets=map_targets_to_output_dir,
    )

2022-12-30 23:41:21,159 - malid.external.scratch_cache - INFO - Reading network file from local machine cache: /users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/embedded/unirep_fine_tuned/anndatas_scaled/BCR/fold.0.validation.h5ad -> /srv/scratch/maximz/cache/1a7cd102c4a71eb472da3636203a91984ec407adbc0812ffba2c07c5.0.validation.h5ad


GeneLocus.BCR
Only considering the two last: ['.validation', '.h5ad'].


Only considering the two last: ['.validation', '.h5ad'].








2022-12-31 00:16:22,834 - malid.helpers - INFO - Target TargetObsColumnEnum.covid_vs_healthy: filtering to specimens from diseases ['Covid19', 'Healthy/Background'] only; removed 46 specimens




2022-12-31 00:26:16,727 - malid.helpers - INFO - Target TargetObsColumnEnum.hiv_vs_healthy: filtering to specimens from diseases ['HIV', 'Healthy/Background'] only; removed 40 specimens




2022-12-31 00:37:59,372 - malid.helpers - INFO - Target TargetObsColumnEnum.lupus_vs_healthy: filtering to specimens from diseases ['Lupus', 'Healthy/Background'] only; removed 36 specimens




2022-12-31 00:50:54,483 - malid.helpers - INFO - Target TargetObsColumnEnum.ethnicity_condensed_healthy_only: filtered to specimens with defined ethnicity_condensed column - removed 12 specimens (365758 rows)


2022-12-31 00:51:03,725 - malid.helpers - INFO - Target TargetObsColumnEnum.ethnicity_condensed_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 56 specimens




2022-12-31 00:58:52,464 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_healthy_only: filtered to specimens with defined age_group column - removed 2 specimens (20035 rows)


2022-12-31 00:59:02,845 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 60 specimens




2022-12-31 01:08:37,460 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_binary_healthy_only: filtered to specimens with defined age_group_binary column - removed 2 specimens (20035 rows)


2022-12-31 01:08:47,838 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_binary_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 60 specimens




2022-12-31 01:16:25,444 - malid.helpers - INFO - Target TargetObsColumnEnum.sex_healthy_only: filtered to specimens with defined sex column - removed 1 specimens (13078 rows)


2022-12-31 01:16:35,928 - malid.helpers - INFO - Target TargetObsColumnEnum.sex_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 61 specimens


2022-12-31 01:23:24,807 - malid.external.scratch_cache - INFO - Reading network file from local machine cache: /users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/embedded/unirep_fine_tuned/anndatas_scaled/BCR/fold.1.validation.h5ad -> /srv/scratch/maximz/cache/9c85c2a266a883a684e8c5d509b8321d4689380ae1339b1d3a20c9e8.1.validation.h5ad


Only considering the two last: ['.validation', '.h5ad'].


Only considering the two last: ['.validation', '.h5ad'].








2022-12-31 01:55:50,855 - malid.helpers - INFO - Target TargetObsColumnEnum.covid_vs_healthy: filtering to specimens from diseases ['Covid19', 'Healthy/Background'] only; removed 42 specimens




2022-12-31 02:05:26,344 - malid.helpers - INFO - Target TargetObsColumnEnum.hiv_vs_healthy: filtering to specimens from diseases ['HIV', 'Healthy/Background'] only; removed 33 specimens




2022-12-31 02:17:08,378 - malid.helpers - INFO - Target TargetObsColumnEnum.lupus_vs_healthy: filtering to specimens from diseases ['Lupus', 'Healthy/Background'] only; removed 35 specimens




2022-12-31 02:29:24,893 - malid.helpers - INFO - Target TargetObsColumnEnum.ethnicity_condensed_healthy_only: filtered to specimens with defined ethnicity_condensed column - removed 11 specimens (332120 rows)


2022-12-31 02:29:35,235 - malid.helpers - INFO - Target TargetObsColumnEnum.ethnicity_condensed_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 48 specimens




2022-12-31 02:40:13,224 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_healthy_only: filtered to specimens with defined age_group column - removed 1 specimens (5035 rows)


2022-12-31 02:40:25,015 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 54 specimens




2022-12-31 02:50:04,335 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_binary_healthy_only: filtered to specimens with defined age_group_binary column - removed 1 specimens (5035 rows)


2022-12-31 02:50:15,298 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_binary_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 54 specimens




2022-12-31 02:58:36,624 - malid.helpers - INFO - Target TargetObsColumnEnum.sex_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 55 specimens


2022-12-31 03:06:03,066 - malid.external.scratch_cache - INFO - Reading network file from local machine cache: /users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/embedded/unirep_fine_tuned/anndatas_scaled/BCR/fold.2.validation.h5ad -> /srv/scratch/maximz/cache/08c1068072d49c0e446bca7b2515cc6904c1583e869886f65b95c2db.2.validation.h5ad


Only considering the two last: ['.validation', '.h5ad'].


Only considering the two last: ['.validation', '.h5ad'].








2022-12-31 03:47:41,751 - malid.helpers - INFO - Target TargetObsColumnEnum.covid_vs_healthy: filtering to specimens from diseases ['Covid19', 'Healthy/Background'] only; removed 44 specimens




2022-12-31 04:00:01,615 - malid.helpers - INFO - Target TargetObsColumnEnum.hiv_vs_healthy: filtering to specimens from diseases ['HIV', 'Healthy/Background'] only; removed 37 specimens




2022-12-31 04:14:07,961 - malid.helpers - INFO - Target TargetObsColumnEnum.lupus_vs_healthy: filtering to specimens from diseases ['Lupus', 'Healthy/Background'] only; removed 35 specimens




2022-12-31 04:30:06,811 - malid.helpers - INFO - Target TargetObsColumnEnum.ethnicity_condensed_healthy_only: filtered to specimens with defined ethnicity_condensed column - removed 13 specimens (345033 rows)


2022-12-31 04:30:22,920 - malid.helpers - INFO - Target TargetObsColumnEnum.ethnicity_condensed_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 51 specimens




2022-12-31 04:42:28,644 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_healthy_only: filtered to specimens with defined age_group column - removed 3 specimens (59403 rows)


2022-12-31 04:42:45,898 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 56 specimens




2022-12-31 04:53:49,663 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_binary_healthy_only: filtered to specimens with defined age_group_binary column - removed 3 specimens (59403 rows)


2022-12-31 04:54:05,415 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_binary_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 56 specimens




2022-12-31 05:04:13,267 - malid.helpers - INFO - Target TargetObsColumnEnum.sex_healthy_only: filtered to specimens with defined sex column - removed 2 specimens (35834 rows)


2022-12-31 05:04:30,340 - malid.helpers - INFO - Target TargetObsColumnEnum.sex_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 57 specimens


2022-12-31 05:13:44,908 - malid.external.scratch_cache - INFO - Reading network file from local machine cache: /users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/embedded/unirep_fine_tuned/anndatas_scaled/BCR/fold.-1.validation.h5ad -> /srv/scratch/maximz/cache/d12efe0f72cdefa66ff3f9089960fc16b89c64c2837b4b81d55fb8ed.-1.validation.h5ad


Only considering the two last: ['.validation', '.h5ad'].


Only considering the two last: ['.validation', '.h5ad'].




2022-12-31 05:16:58,614 - malid.train.training_utils - INFO - Skipping lasso_multiclass from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/BCR/disease/train_smaller_model.lasso_multiclass.-1.joblib'


2022-12-31 05:16:58,617 - malid.train.training_utils - INFO - Skipping lasso_cv from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/BCR/disease/train_smaller_model.lasso_cv.-1.joblib'


2022-12-31 05:16:58,618 - malid.train.training_utils - INFO - Skipping ridge_cv from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/BCR/disease/train_smaller_model.ridge_cv.-1.joblib'


2022-12-31 05:16:58,619 - malid.train.training_utils - INFO - Skipping elasticnet_cv from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/BCR/disease/train_smaller_model.elasticnet_cv.-1.joblib'


2022-12-31 05:16:58,620 - malid.train.training_utils - INFO - Skipping rf_multiclass from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/BCR/disease/train_smaller_model.rf_multiclass.-1.joblib'


2022-12-31 05:16:58,621 - malid.train.training_utils - INFO - Skipping xgboost from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/BCR/disease/train_smaller_model.xgboost.-1.joblib'


2022-12-31 05:16:58,622 - malid.train.training_utils - INFO - Skipping linearsvm_ovr from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/BCR/disease/train_smaller_model.linearsvm_ovr.-1.joblib'




2022-12-31 05:19:13,348 - malid.train.training_utils - INFO - Skipping lasso_multiclass from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/BCR/disease_all_demographics_present/train_smaller_model.lasso_multiclass.-1.joblib'


2022-12-31 05:19:13,351 - malid.train.training_utils - INFO - Skipping lasso_cv from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/BCR/disease_all_demographics_present/train_smaller_model.lasso_cv.-1.joblib'


2022-12-31 05:19:13,352 - malid.train.training_utils - INFO - Skipping ridge_cv from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/BCR/disease_all_demographics_present/train_smaller_model.ridge_cv.-1.joblib'


2022-12-31 05:19:13,353 - malid.train.training_utils - INFO - Skipping elasticnet_cv from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/BCR/disease_all_demographics_present/train_smaller_model.elasticnet_cv.-1.joblib'


2022-12-31 05:19:13,354 - malid.train.training_utils - INFO - Skipping rf_multiclass from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/BCR/disease_all_demographics_present/train_smaller_model.rf_multiclass.-1.joblib'


2022-12-31 05:19:13,356 - malid.train.training_utils - INFO - Skipping xgboost from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/BCR/disease_all_demographics_present/train_smaller_model.xgboost.-1.joblib'


2022-12-31 05:19:13,357 - malid.train.training_utils - INFO - Skipping linearsvm_ovr from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/BCR/disease_all_demographics_present/train_smaller_model.linearsvm_ovr.-1.joblib'




2022-12-31 05:21:08,188 - malid.helpers - INFO - Target TargetObsColumnEnum.covid_vs_healthy: filtering to specimens from diseases ['Covid19', 'Healthy/Background'] only; removed 66 specimens


2022-12-31 05:21:10,150 - malid.train.training_utils - INFO - Skipping lasso_multiclass from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/BCR/covid_vs_healthy/train_smaller_model.lasso_multiclass.-1.joblib'


2022-12-31 05:21:10,151 - malid.train.training_utils - INFO - Skipping lasso_cv from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/BCR/covid_vs_healthy/train_smaller_model.lasso_cv.-1.joblib'


2022-12-31 05:21:10,152 - malid.train.training_utils - INFO - Skipping ridge_cv from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/BCR/covid_vs_healthy/train_smaller_model.ridge_cv.-1.joblib'


2022-12-31 05:21:10,153 - malid.train.training_utils - INFO - Skipping elasticnet_cv from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/BCR/covid_vs_healthy/train_smaller_model.elasticnet_cv.-1.joblib'


2022-12-31 05:21:10,154 - malid.train.training_utils - INFO - Skipping rf_multiclass from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/BCR/covid_vs_healthy/train_smaller_model.rf_multiclass.-1.joblib'


2022-12-31 05:21:10,155 - malid.train.training_utils - INFO - Skipping xgboost from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/BCR/covid_vs_healthy/train_smaller_model.xgboost.-1.joblib'


2022-12-31 05:21:10,156 - malid.train.training_utils - INFO - Skipping linearsvm_ovr from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/BCR/covid_vs_healthy/train_smaller_model.linearsvm_ovr.-1.joblib'




2022-12-31 05:23:05,329 - malid.helpers - INFO - Target TargetObsColumnEnum.hiv_vs_healthy: filtering to specimens from diseases ['HIV', 'Healthy/Background'] only; removed 53 specimens


2022-12-31 05:23:07,400 - malid.train.training_utils - INFO - Skipping lasso_multiclass from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/BCR/hiv_vs_healthy/train_smaller_model.lasso_multiclass.-1.joblib'


2022-12-31 05:23:07,401 - malid.train.training_utils - INFO - Skipping lasso_cv from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/BCR/hiv_vs_healthy/train_smaller_model.lasso_cv.-1.joblib'


2022-12-31 05:23:07,402 - malid.train.training_utils - INFO - Skipping ridge_cv from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/BCR/hiv_vs_healthy/train_smaller_model.ridge_cv.-1.joblib'


2022-12-31 05:23:07,403 - malid.train.training_utils - INFO - Skipping elasticnet_cv from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/BCR/hiv_vs_healthy/train_smaller_model.elasticnet_cv.-1.joblib'


2022-12-31 05:23:07,404 - malid.train.training_utils - INFO - Skipping rf_multiclass from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/BCR/hiv_vs_healthy/train_smaller_model.rf_multiclass.-1.joblib'


2022-12-31 05:23:07,405 - malid.train.training_utils - INFO - Skipping xgboost from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/BCR/hiv_vs_healthy/train_smaller_model.xgboost.-1.joblib'


2022-12-31 05:23:07,406 - malid.train.training_utils - INFO - Skipping linearsvm_ovr from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/BCR/hiv_vs_healthy/train_smaller_model.linearsvm_ovr.-1.joblib'




2022-12-31 05:24:40,285 - malid.helpers - INFO - Target TargetObsColumnEnum.lupus_vs_healthy: filtering to specimens from diseases ['Lupus', 'Healthy/Background'] only; removed 53 specimens


2022-12-31 05:24:42,092 - malid.train.training_utils - INFO - Skipping lasso_multiclass from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/BCR/lupus_vs_healthy/train_smaller_model.lasso_multiclass.-1.joblib'


2022-12-31 05:24:42,094 - malid.train.training_utils - INFO - Skipping lasso_cv from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/BCR/lupus_vs_healthy/train_smaller_model.lasso_cv.-1.joblib'


2022-12-31 05:24:42,095 - malid.train.training_utils - INFO - Skipping ridge_cv from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/BCR/lupus_vs_healthy/train_smaller_model.ridge_cv.-1.joblib'


2022-12-31 05:24:42,095 - malid.train.training_utils - INFO - Skipping elasticnet_cv from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/BCR/lupus_vs_healthy/train_smaller_model.elasticnet_cv.-1.joblib'


2022-12-31 05:24:42,096 - malid.train.training_utils - INFO - Skipping rf_multiclass from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/BCR/lupus_vs_healthy/train_smaller_model.rf_multiclass.-1.joblib'


2022-12-31 05:24:42,097 - malid.train.training_utils - INFO - Skipping xgboost from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/BCR/lupus_vs_healthy/train_smaller_model.xgboost.-1.joblib'


2022-12-31 05:24:42,098 - malid.train.training_utils - INFO - Skipping linearsvm_ovr from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/BCR/lupus_vs_healthy/train_smaller_model.linearsvm_ovr.-1.joblib'




2022-12-31 05:27:11,059 - malid.helpers - INFO - Target TargetObsColumnEnum.ethnicity_condensed_healthy_only: filtered to specimens with defined ethnicity_condensed column - removed 20 specimens (485965 rows)


2022-12-31 05:28:47,547 - malid.helpers - INFO - Target TargetObsColumnEnum.ethnicity_condensed_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 75 specimens


2022-12-31 05:30:35,006 - malid.train.training_utils - INFO - Skipping lasso_multiclass from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/BCR/ethnicity_condensed_healthy_only/train_smaller_model.lasso_multiclass.-1.joblib'


2022-12-31 05:30:35,013 - malid.train.training_utils - INFO - Skipping lasso_cv from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/BCR/ethnicity_condensed_healthy_only/train_smaller_model.lasso_cv.-1.joblib'


2022-12-31 05:30:35,015 - malid.train.training_utils - INFO - Skipping ridge_cv from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/BCR/ethnicity_condensed_healthy_only/train_smaller_model.ridge_cv.-1.joblib'


2022-12-31 05:30:35,016 - malid.train.training_utils - INFO - Skipping elasticnet_cv from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/BCR/ethnicity_condensed_healthy_only/train_smaller_model.elasticnet_cv.-1.joblib'


2022-12-31 05:30:35,017 - malid.train.training_utils - INFO - Skipping rf_multiclass from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/BCR/ethnicity_condensed_healthy_only/train_smaller_model.rf_multiclass.-1.joblib'


2022-12-31 05:30:35,018 - malid.train.training_utils - INFO - Skipping xgboost from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/BCR/ethnicity_condensed_healthy_only/train_smaller_model.xgboost.-1.joblib'


2022-12-31 05:30:35,019 - malid.train.training_utils - INFO - Skipping linearsvm_ovr from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/BCR/ethnicity_condensed_healthy_only/train_smaller_model.linearsvm_ovr.-1.joblib'




2022-12-31 05:32:18,879 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_healthy_only: filtered to specimens with defined age_group column - removed 2 specimens (35185 rows)


2022-12-31 05:32:46,037 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 84 specimens


2022-12-31 05:33:15,205 - malid.train.training_utils - INFO - Skipping lasso_multiclass from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/BCR/age_group_healthy_only/train_smaller_model.lasso_multiclass.-1.joblib'


2022-12-31 05:33:15,207 - malid.train.training_utils - INFO - Skipping lasso_cv from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/BCR/age_group_healthy_only/train_smaller_model.lasso_cv.-1.joblib'


2022-12-31 05:33:15,208 - malid.train.training_utils - INFO - Skipping ridge_cv from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/BCR/age_group_healthy_only/train_smaller_model.ridge_cv.-1.joblib'


2022-12-31 05:33:15,209 - malid.train.training_utils - INFO - Skipping elasticnet_cv from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/BCR/age_group_healthy_only/train_smaller_model.elasticnet_cv.-1.joblib'


2022-12-31 05:33:15,211 - malid.train.training_utils - INFO - Skipping rf_multiclass from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/BCR/age_group_healthy_only/train_smaller_model.rf_multiclass.-1.joblib'


2022-12-31 05:33:15,212 - malid.train.training_utils - INFO - Skipping xgboost from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/BCR/age_group_healthy_only/train_smaller_model.xgboost.-1.joblib'


2022-12-31 05:33:15,213 - malid.train.training_utils - INFO - Skipping linearsvm_ovr from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/BCR/age_group_healthy_only/train_smaller_model.linearsvm_ovr.-1.joblib'




2022-12-31 05:35:08,781 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_binary_healthy_only: filtered to specimens with defined age_group_binary column - removed 2 specimens (35185 rows)


2022-12-31 05:35:33,729 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_binary_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 84 specimens


2022-12-31 05:36:00,079 - malid.train.training_utils - INFO - Skipping lasso_multiclass from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/BCR/age_group_binary_healthy_only/train_smaller_model.lasso_multiclass.-1.joblib'


2022-12-31 05:36:00,081 - malid.train.training_utils - INFO - Skipping lasso_cv from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/BCR/age_group_binary_healthy_only/train_smaller_model.lasso_cv.-1.joblib'


2022-12-31 05:36:00,082 - malid.train.training_utils - INFO - Skipping ridge_cv from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/BCR/age_group_binary_healthy_only/train_smaller_model.ridge_cv.-1.joblib'


2022-12-31 05:36:00,083 - malid.train.training_utils - INFO - Skipping elasticnet_cv from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/BCR/age_group_binary_healthy_only/train_smaller_model.elasticnet_cv.-1.joblib'


2022-12-31 05:36:00,084 - malid.train.training_utils - INFO - Skipping rf_multiclass from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/BCR/age_group_binary_healthy_only/train_smaller_model.rf_multiclass.-1.joblib'


2022-12-31 05:36:00,085 - malid.train.training_utils - INFO - Skipping xgboost from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/BCR/age_group_binary_healthy_only/train_smaller_model.xgboost.-1.joblib'


2022-12-31 05:36:00,086 - malid.train.training_utils - INFO - Skipping linearsvm_ovr from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/BCR/age_group_binary_healthy_only/train_smaller_model.linearsvm_ovr.-1.joblib'




2022-12-31 05:37:30,054 - malid.helpers - INFO - Target TargetObsColumnEnum.sex_healthy_only: filtered to specimens with defined sex column - removed 1 specimens (11616 rows)


2022-12-31 05:37:54,677 - malid.helpers - INFO - Target TargetObsColumnEnum.sex_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 85 specimens


2022-12-31 05:38:20,775 - malid.train.training_utils - INFO - Skipping lasso_multiclass from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/BCR/sex_healthy_only/train_smaller_model.lasso_multiclass.-1.joblib'


2022-12-31 05:38:20,777 - malid.train.training_utils - INFO - Skipping lasso_cv from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/BCR/sex_healthy_only/train_smaller_model.lasso_cv.-1.joblib'


2022-12-31 05:38:20,779 - malid.train.training_utils - INFO - Skipping ridge_cv from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/BCR/sex_healthy_only/train_smaller_model.ridge_cv.-1.joblib'


2022-12-31 05:38:20,780 - malid.train.training_utils - INFO - Skipping elasticnet_cv from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/BCR/sex_healthy_only/train_smaller_model.elasticnet_cv.-1.joblib'


2022-12-31 05:38:20,781 - malid.train.training_utils - INFO - Skipping rf_multiclass from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/BCR/sex_healthy_only/train_smaller_model.rf_multiclass.-1.joblib'


2022-12-31 05:38:20,782 - malid.train.training_utils - INFO - Skipping xgboost from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/BCR/sex_healthy_only/train_smaller_model.xgboost.-1.joblib'


2022-12-31 05:38:20,783 - malid.train.training_utils - INFO - Skipping linearsvm_ovr from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/BCR/sex_healthy_only/train_smaller_model.linearsvm_ovr.-1.joblib'


GeneLocus.BCR TargetObsColumnEnum.disease


Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,Accuracy per fold with abstention,MCC per fold with abstention,...,au-PRC (macro OvO) per fold with abstention,Accuracy global with abstention,MCC global with abstention,Unknown/abstention proportion global with abstention,Abstention label global with abstention,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
lasso_multiclass,0.912 +/- 0.010 (in 3 folds),0.923 +/- 0.009 (in 3 folds),0.917 +/- 0.004 (in 3 folds),0.930 +/- 0.004 (in 3 folds),0.750 +/- 0.010 (in 3 folds),0.641 +/- 0.021 (in 3 folds),0.75,0.637,0.743 +/- 0.019 (in 3 folds),0.633 +/- 0.027 (in 3 folds),...,0.931 +/- 0.005 (in 2 folds),0.743,0.628,0.009,Unknown,320,3,323,0.009288,False
lasso_multiclass.decision_thresholds_tuned,0.912 +/- 0.010 (in 3 folds),0.923 +/- 0.009 (in 3 folds),0.917 +/- 0.004 (in 3 folds),0.930 +/- 0.004 (in 3 folds),0.775 +/- 0.018 (in 3 folds),0.676 +/- 0.010 (in 3 folds),0.775,0.669,0.768 +/- 0.030 (in 3 folds),0.666 +/- 0.024 (in 3 folds),...,0.931 +/- 0.005 (in 2 folds),0.768,0.659,0.009,Unknown,320,3,323,0.009288,False
linearsvm_ovr,0.912 +/- 0.004 (in 3 folds),0.922 +/- 0.004 (in 3 folds),0.919 +/- 0.007 (in 3 folds),0.931 +/- 0.006 (in 3 folds),0.754 +/- 0.012 (in 3 folds),0.647 +/- 0.017 (in 3 folds),0.754,0.643,0.749 +/- 0.005 (in 3 folds),0.642 +/- 0.008 (in 3 folds),...,0.934 +/- 0.004 (in 2 folds),0.749,0.638,0.006,Unknown,321,2,323,0.006192,False
linearsvm_ovr.decision_thresholds_tuned,0.912 +/- 0.004 (in 3 folds),0.922 +/- 0.004 (in 3 folds),0.919 +/- 0.007 (in 3 folds),0.931 +/- 0.006 (in 3 folds),0.776 +/- 0.004 (in 3 folds),0.686 +/- 0.003 (in 3 folds),0.776,0.676,0.771 +/- 0.009 (in 3 folds),0.681 +/- 0.008 (in 3 folds),...,0.934 +/- 0.004 (in 2 folds),0.771,0.67,0.006,Unknown,321,2,323,0.006192,False
ridge_cv,0.903 +/- 0.002 (in 3 folds),0.915 +/- 0.003 (in 3 folds),0.905 +/- 0.006 (in 3 folds),0.920 +/- 0.002 (in 3 folds),0.563 +/- 0.077 (in 3 folds),0.337 +/- 0.138 (in 3 folds),0.562,0.344,0.561 +/- 0.078 (in 3 folds),0.335 +/- 0.138 (in 3 folds),...,0.920 +/- 0.003 (in 2 folds),0.56,0.342,0.003,Unknown,322,1,323,0.003096,False
ridge_cv.decision_thresholds_tuned,0.903 +/- 0.002 (in 3 folds),0.915 +/- 0.003 (in 3 folds),0.905 +/- 0.006 (in 3 folds),0.920 +/- 0.002 (in 3 folds),0.786 +/- 0.015 (in 3 folds),0.691 +/- 0.018 (in 3 folds),0.786,0.691,0.783 +/- 0.019 (in 3 folds),0.688 +/- 0.022 (in 3 folds),...,0.920 +/- 0.003 (in 2 folds),0.783,0.688,0.003,Unknown,322,1,323,0.003096,False
lasso_cv,0.897 +/- 0.017 (in 3 folds),0.907 +/- 0.018 (in 3 folds),0.903 +/- 0.012 (in 3 folds),0.916 +/- 0.012 (in 3 folds),0.532 +/- 0.035 (in 3 folds),0.284 +/- 0.068 (in 3 folds),0.531,0.287,0.524 +/- 0.041 (in 3 folds),0.266 +/- 0.089 (in 3 folds),...,0.921 +/- 0.000 (in 1 folds),0.523,0.268,0.015,Unknown,318,5,323,0.01548,True
lasso_cv.decision_thresholds_tuned,0.897 +/- 0.017 (in 3 folds),0.907 +/- 0.018 (in 3 folds),0.903 +/- 0.012 (in 3 folds),0.916 +/- 0.012 (in 3 folds),0.789 +/- 0.012 (in 3 folds),0.695 +/- 0.011 (in 3 folds),0.789,0.693,0.777 +/- 0.020 (in 3 folds),0.679 +/- 0.018 (in 3 folds),...,0.921 +/- 0.000 (in 1 folds),0.777,0.677,0.015,Unknown,318,5,323,0.01548,False
rf_multiclass,0.889 +/- 0.024 (in 3 folds),0.896 +/- 0.025 (in 3 folds),0.885 +/- 0.024 (in 3 folds),0.894 +/- 0.023 (in 3 folds),0.740 +/- 0.022 (in 3 folds),0.616 +/- 0.034 (in 3 folds),0.74,0.613,0.731 +/- 0.032 (in 3 folds),0.606 +/- 0.046 (in 3 folds),...,0.888 +/- 0.000 (in 1 folds),0.731,0.602,0.012,Unknown,319,4,323,0.012384,False
rf_multiclass.decision_thresholds_tuned,0.889 +/- 0.024 (in 3 folds),0.896 +/- 0.025 (in 3 folds),0.885 +/- 0.024 (in 3 folds),0.894 +/- 0.023 (in 3 folds),0.771 +/- 0.014 (in 3 folds),0.669 +/- 0.017 (in 3 folds),0.771,0.665,0.762 +/- 0.025 (in 3 folds),0.658 +/- 0.029 (in 3 folds),...,0.888 +/- 0.000 (in 1 folds),0.762,0.654,0.012,Unknown,319,4,323,0.012384,False


GeneLocus.BCR TargetObsColumnEnum.disease_all_demographics_present


Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,Accuracy per fold with abstention,MCC per fold with abstention,...,Abstention label global with abstention,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes,ROC-AUC (weighted OvO) per fold with abstention,ROC-AUC (macro OvO) per fold with abstention,au-PRC (weighted OvO) per fold with abstention,au-PRC (macro OvO) per fold with abstention
linearsvm_ovr,0.914 +/- 0.004 (in 3 folds),0.924 +/- 0.006 (in 3 folds),0.921 +/- 0.006 (in 3 folds),0.931 +/- 0.009 (in 3 folds),0.746 +/- 0.026 (in 3 folds),0.620 +/- 0.030 (in 3 folds),0.746,0.62,0.741 +/- 0.029 (in 3 folds),0.614 +/- 0.030 (in 3 folds),...,Unknown,283,2,285,0.007018,False,0.910 +/- 0.000 (in 1 folds),0.916 +/- 0.000 (in 1 folds),0.916 +/- 0.000 (in 1 folds),0.923 +/- 0.000 (in 1 folds)
linearsvm_ovr.decision_thresholds_tuned,0.914 +/- 0.004 (in 3 folds),0.924 +/- 0.006 (in 3 folds),0.921 +/- 0.006 (in 3 folds),0.931 +/- 0.009 (in 3 folds),0.756 +/- 0.044 (in 3 folds),0.666 +/- 0.014 (in 3 folds),0.756,0.647,0.751 +/- 0.047 (in 3 folds),0.659 +/- 0.016 (in 3 folds),...,Unknown,283,2,285,0.007018,False,0.910 +/- 0.000 (in 1 folds),0.916 +/- 0.000 (in 1 folds),0.916 +/- 0.000 (in 1 folds),0.923 +/- 0.000 (in 1 folds)
lasso_multiclass,0.911 +/- 0.014 (in 3 folds),0.921 +/- 0.013 (in 3 folds),0.920 +/- 0.014 (in 3 folds),0.930 +/- 0.014 (in 3 folds),0.738 +/- 0.028 (in 3 folds),0.622 +/- 0.043 (in 3 folds),0.738,0.618,0.730 +/- 0.028 (in 3 folds),0.613 +/- 0.042 (in 3 folds),...,Unknown,282,3,285,0.010526,False,,,,
lasso_multiclass.decision_thresholds_tuned,0.911 +/- 0.014 (in 3 folds),0.921 +/- 0.013 (in 3 folds),0.920 +/- 0.014 (in 3 folds),0.930 +/- 0.014 (in 3 folds),0.773 +/- 0.060 (in 3 folds),0.694 +/- 0.038 (in 3 folds),0.773,0.685,0.765 +/- 0.059 (in 3 folds),0.683 +/- 0.037 (in 3 folds),...,Unknown,282,3,285,0.010526,False,,,,
ridge_cv,0.900 +/- 0.015 (in 3 folds),0.912 +/- 0.017 (in 3 folds),0.902 +/- 0.025 (in 3 folds),0.916 +/- 0.027 (in 3 folds),0.534 +/- 0.111 (in 3 folds),0.171 +/- 0.296 (in 3 folds),0.535,0.292,0.508 +/- 0.120 (in 3 folds),0.193 +/- 0.256 (in 3 folds),...,Unknown,271,14,285,0.049123,False,,,,
ridge_cv.decision_thresholds_tuned,0.900 +/- 0.015 (in 3 folds),0.912 +/- 0.017 (in 3 folds),0.902 +/- 0.025 (in 3 folds),0.916 +/- 0.027 (in 3 folds),0.478 +/- 0.354 (in 3 folds),0.241 +/- 0.417 (in 3 folds),0.476,0.277,0.453 +/- 0.349 (in 3 folds),0.228 +/- 0.421 (in 3 folds),...,Unknown,271,14,285,0.049123,False,,,,
xgboost,0.890 +/- 0.015 (in 3 folds),0.894 +/- 0.021 (in 3 folds),0.899 +/- 0.017 (in 3 folds),0.907 +/- 0.024 (in 3 folds),0.728 +/- 0.016 (in 3 folds),0.593 +/- 0.040 (in 3 folds),0.728,0.592,0.712 +/- 0.006 (in 3 folds),0.574 +/- 0.022 (in 3 folds),...,Unknown,279,6,285,0.021053,False,0.874 +/- 0.000 (in 1 folds),0.870 +/- 0.000 (in 1 folds),0.880 +/- 0.000 (in 1 folds),0.880 +/- 0.000 (in 1 folds)
xgboost.decision_thresholds_tuned,0.890 +/- 0.015 (in 3 folds),0.894 +/- 0.021 (in 3 folds),0.899 +/- 0.017 (in 3 folds),0.907 +/- 0.024 (in 3 folds),0.771 +/- 0.008 (in 3 folds),0.666 +/- 0.014 (in 3 folds),0.771,0.661,0.755 +/- 0.023 (in 3 folds),0.645 +/- 0.022 (in 3 folds),...,Unknown,279,6,285,0.021053,False,0.874 +/- 0.000 (in 1 folds),0.870 +/- 0.000 (in 1 folds),0.880 +/- 0.000 (in 1 folds),0.880 +/- 0.000 (in 1 folds)
lasso_cv,0.884 +/- 0.031 (in 3 folds),0.898 +/- 0.030 (in 3 folds),0.888 +/- 0.032 (in 3 folds),0.905 +/- 0.032 (in 3 folds),0.588 +/- 0.142 (in 3 folds),0.380 +/- 0.206 (in 3 folds),0.587,0.376,0.584 +/- 0.144 (in 3 folds),0.367 +/- 0.212 (in 3 folds),...,Unknown,283,2,285,0.007018,False,0.850 +/- 0.000 (in 1 folds),0.867 +/- 0.000 (in 1 folds),0.851 +/- 0.000 (in 1 folds),0.868 +/- 0.000 (in 1 folds)
lasso_cv.decision_thresholds_tuned,0.884 +/- 0.031 (in 3 folds),0.898 +/- 0.030 (in 3 folds),0.888 +/- 0.032 (in 3 folds),0.905 +/- 0.032 (in 3 folds),0.760 +/- 0.015 (in 3 folds),0.653 +/- 0.047 (in 3 folds),0.76,0.651,0.754 +/- 0.011 (in 3 folds),0.644 +/- 0.040 (in 3 folds),...,Unknown,283,2,285,0.007018,False,0.850 +/- 0.000 (in 1 folds),0.867 +/- 0.000 (in 1 folds),0.851 +/- 0.000 (in 1 folds),0.868 +/- 0.000 (in 1 folds)


GeneLocus.BCR TargetObsColumnEnum.covid_vs_healthy


Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,Accuracy per fold with abstention,MCC per fold with abstention,...,au-PRC (macro OvO) per fold with abstention,Accuracy global with abstention,MCC global with abstention,Unknown/abstention proportion global with abstention,Abstention label global with abstention,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
linearsvm_ovr,0.994 +/- 0.001 (in 3 folds),0.994 +/- 0.001 (in 3 folds),0.998 +/- 0.000 (in 3 folds),0.998 +/- 0.000 (in 3 folds),0.963 +/- 0.018 (in 3 folds),0.903 +/- 0.041 (in 3 folds),0.963,0.898,0.953 +/- 0.016 (in 3 folds),0.876 +/- 0.031 (in 3 folds),...,0.998 +/- 0.000 (in 1 folds),0.953,0.873,0.01,Unknown,189,2,191,0.010471,False
linearsvm_ovr.decision_thresholds_tuned,0.994 +/- 0.001 (in 3 folds),0.994 +/- 0.001 (in 3 folds),0.998 +/- 0.000 (in 3 folds),0.998 +/- 0.000 (in 3 folds),0.974 +/- 0.009 (in 3 folds),0.923 +/- 0.025 (in 3 folds),0.974,0.922,0.963 +/- 0.009 (in 3 folds),0.895 +/- 0.021 (in 3 folds),...,0.998 +/- 0.000 (in 1 folds),0.963,0.894,0.01,Unknown,189,2,191,0.010471,False
ridge_cv,0.992 +/- 0.004 (in 3 folds),0.992 +/- 0.004 (in 3 folds),0.998 +/- 0.001 (in 3 folds),0.998 +/- 0.001 (in 3 folds),0.789 +/- 0.013 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.789,0.0,0.764 +/- 0.004 (in 3 folds),0.070 +/- 0.040 (in 3 folds),...,,0.764,0.061,0.031,Unknown,185,6,191,0.031414,True
ridge_cv.decision_thresholds_tuned,0.992 +/- 0.004 (in 3 folds),0.992 +/- 0.004 (in 3 folds),0.998 +/- 0.001 (in 3 folds),0.998 +/- 0.001 (in 3 folds),0.789 +/- 0.013 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.789,0.0,0.764 +/- 0.004 (in 3 folds),0.070 +/- 0.040 (in 3 folds),...,,0.764,0.061,0.031,Unknown,185,6,191,0.031414,True
lasso_multiclass,0.992 +/- 0.003 (in 3 folds),0.992 +/- 0.003 (in 3 folds),0.998 +/- 0.000 (in 3 folds),0.998 +/- 0.000 (in 3 folds),0.963 +/- 0.018 (in 3 folds),0.897 +/- 0.048 (in 3 folds),0.963,0.892,0.953 +/- 0.016 (in 3 folds),0.870 +/- 0.041 (in 3 folds),...,0.998 +/- 0.000 (in 1 folds),0.953,0.866,0.01,Unknown,189,2,191,0.010471,False
lasso_multiclass.decision_thresholds_tuned,0.992 +/- 0.003 (in 3 folds),0.992 +/- 0.003 (in 3 folds),0.998 +/- 0.000 (in 3 folds),0.998 +/- 0.000 (in 3 folds),0.968 +/- 0.016 (in 3 folds),0.913 +/- 0.036 (in 3 folds),0.968,0.909,0.958 +/- 0.019 (in 3 folds),0.886 +/- 0.037 (in 3 folds),...,0.998 +/- 0.000 (in 1 folds),0.958,0.883,0.01,Unknown,189,2,191,0.010471,False
elasticnet_cv,0.990 +/- 0.008 (in 3 folds),0.990 +/- 0.008 (in 3 folds),0.997 +/- 0.002 (in 3 folds),0.997 +/- 0.002 (in 3 folds),0.803 +/- 0.017 (in 3 folds),0.275 +/- 0.057 (in 3 folds),0.803,0.279,0.790 +/- 0.038 (in 3 folds),0.242 +/- 0.102 (in 3 folds),...,0.996 +/- 0.001 (in 2 folds),0.791,0.22,0.016,Unknown,188,3,191,0.015707,False
elasticnet_cv.decision_thresholds_tuned,0.990 +/- 0.008 (in 3 folds),0.990 +/- 0.008 (in 3 folds),0.997 +/- 0.002 (in 3 folds),0.997 +/- 0.002 (in 3 folds),0.963 +/- 0.017 (in 3 folds),0.890 +/- 0.057 (in 3 folds),0.963,0.889,0.948 +/- 0.010 (in 3 folds),0.854 +/- 0.007 (in 3 folds),...,0.996 +/- 0.001 (in 2 folds),0.948,0.847,0.016,Unknown,188,3,191,0.015707,False
rf_multiclass,0.989 +/- 0.004 (in 3 folds),0.989 +/- 0.004 (in 3 folds),0.997 +/- 0.001 (in 3 folds),0.997 +/- 0.001 (in 3 folds),0.947 +/- 0.025 (in 3 folds),0.853 +/- 0.064 (in 3 folds),0.947,0.851,0.937 +/- 0.032 (in 3 folds),0.831 +/- 0.079 (in 3 folds),...,0.997 +/- 0.000 (in 1 folds),0.937,0.828,0.01,Unknown,189,2,191,0.010471,False
rf_multiclass.decision_thresholds_tuned,0.989 +/- 0.004 (in 3 folds),0.989 +/- 0.004 (in 3 folds),0.997 +/- 0.001 (in 3 folds),0.997 +/- 0.001 (in 3 folds),0.968 +/- 0.001 (in 3 folds),0.906 +/- 0.004 (in 3 folds),0.968,0.905,0.958 +/- 0.010 (in 3 folds),0.878 +/- 0.028 (in 3 folds),...,0.997 +/- 0.000 (in 1 folds),0.958,0.878,0.01,Unknown,189,2,191,0.010471,False


GeneLocus.BCR TargetObsColumnEnum.hiv_vs_healthy


Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,Accuracy per fold with abstention,MCC per fold with abstention,...,Abstention label global with abstention,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes,ROC-AUC (weighted OvO) per fold with abstention,ROC-AUC (macro OvO) per fold with abstention,au-PRC (weighted OvO) per fold with abstention,au-PRC (macro OvO) per fold with abstention
elasticnet_cv,0.975 +/- 0.008 (in 3 folds),0.975 +/- 0.008 (in 3 folds),0.987 +/- 0.006 (in 3 folds),0.987 +/- 0.006 (in 3 folds),0.811 +/- 0.087 (in 3 folds),0.539 +/- 0.236 (in 3 folds),0.808,0.556,0.752 +/- 0.066 (in 3 folds),0.386 +/- 0.237 (in 3 folds),...,Unknown,198,15,213,0.070423,False,,,,
elasticnet_cv.decision_thresholds_tuned,0.975 +/- 0.008 (in 3 folds),0.975 +/- 0.008 (in 3 folds),0.987 +/- 0.006 (in 3 folds),0.987 +/- 0.006 (in 3 folds),0.929 +/- 0.023 (in 3 folds),0.843 +/- 0.054 (in 3 folds),0.929,0.843,0.863 +/- 0.033 (in 3 folds),0.732 +/- 0.058 (in 3 folds),...,Unknown,198,15,213,0.070423,False,,,,
ridge_cv,0.973 +/- 0.005 (in 3 folds),0.973 +/- 0.005 (in 3 folds),0.988 +/- 0.003 (in 3 folds),0.988 +/- 0.003 (in 3 folds),0.701 +/- 0.006 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.701,0.0,0.695 +/- 0.014 (in 3 folds),0.012 +/- 0.021 (in 3 folds),...,Unknown,211,2,213,0.00939,True,0.972 +/- 0.007 (in 2 folds),0.972 +/- 0.007 (in 2 folds),0.988 +/- 0.004 (in 2 folds),0.988 +/- 0.004 (in 2 folds)
ridge_cv.decision_thresholds_tuned,0.973 +/- 0.005 (in 3 folds),0.973 +/- 0.005 (in 3 folds),0.988 +/- 0.003 (in 3 folds),0.988 +/- 0.003 (in 3 folds),0.701 +/- 0.006 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.701,0.0,0.695 +/- 0.014 (in 3 folds),0.012 +/- 0.021 (in 3 folds),...,Unknown,211,2,213,0.00939,True,0.972 +/- 0.007 (in 2 folds),0.972 +/- 0.007 (in 2 folds),0.988 +/- 0.004 (in 2 folds),0.988 +/- 0.004 (in 2 folds)
linearsvm_ovr,0.971 +/- 0.009 (in 3 folds),0.971 +/- 0.009 (in 3 folds),0.986 +/- 0.006 (in 3 folds),0.986 +/- 0.006 (in 3 folds),0.924 +/- 0.015 (in 3 folds),0.821 +/- 0.034 (in 3 folds),0.924,0.816,0.911 +/- 0.020 (in 3 folds),0.795 +/- 0.037 (in 3 folds),...,Unknown,210,3,213,0.014085,False,0.979 +/- 0.000 (in 1 folds),0.979 +/- 0.000 (in 1 folds),0.991 +/- 0.000 (in 1 folds),0.991 +/- 0.000 (in 1 folds)
linearsvm_ovr.decision_thresholds_tuned,0.971 +/- 0.009 (in 3 folds),0.971 +/- 0.009 (in 3 folds),0.986 +/- 0.006 (in 3 folds),0.986 +/- 0.006 (in 3 folds),0.943 +/- 0.002 (in 3 folds),0.863 +/- 0.003 (in 3 folds),0.943,0.863,0.930 +/- 0.014 (in 3 folds),0.835 +/- 0.028 (in 3 folds),...,Unknown,210,3,213,0.014085,False,0.979 +/- 0.000 (in 1 folds),0.979 +/- 0.000 (in 1 folds),0.991 +/- 0.000 (in 1 folds),0.991 +/- 0.000 (in 1 folds)
lasso_cv,0.969 +/- 0.015 (in 3 folds),0.969 +/- 0.015 (in 3 folds),0.985 +/- 0.009 (in 3 folds),0.985 +/- 0.009 (in 3 folds),0.887 +/- 0.009 (in 3 folds),0.736 +/- 0.016 (in 3 folds),0.887,0.735,0.850 +/- 0.032 (in 3 folds),0.649 +/- 0.072 (in 3 folds),...,Unknown,204,9,213,0.042254,False,,,,
lasso_cv.decision_thresholds_tuned,0.969 +/- 0.015 (in 3 folds),0.969 +/- 0.015 (in 3 folds),0.985 +/- 0.009 (in 3 folds),0.985 +/- 0.009 (in 3 folds),0.932 +/- 0.022 (in 3 folds),0.844 +/- 0.054 (in 3 folds),0.931,0.841,0.892 +/- 0.019 (in 3 folds),0.772 +/- 0.034 (in 3 folds),...,Unknown,204,9,213,0.042254,False,,,,
lasso_multiclass,0.969 +/- 0.006 (in 3 folds),0.969 +/- 0.006 (in 3 folds),0.985 +/- 0.005 (in 3 folds),0.985 +/- 0.005 (in 3 folds),0.933 +/- 0.016 (in 3 folds),0.839 +/- 0.041 (in 3 folds),0.933,0.839,0.911 +/- 0.020 (in 3 folds),0.793 +/- 0.049 (in 3 folds),...,Unknown,208,5,213,0.023474,False,,,,
lasso_multiclass.decision_thresholds_tuned,0.969 +/- 0.006 (in 3 folds),0.969 +/- 0.006 (in 3 folds),0.985 +/- 0.005 (in 3 folds),0.985 +/- 0.005 (in 3 folds),0.942 +/- 0.001 (in 3 folds),0.863 +/- 0.002 (in 3 folds),0.942,0.862,0.920 +/- 0.006 (in 3 folds),0.817 +/- 0.011 (in 3 folds),...,Unknown,208,5,213,0.023474,False,,,,


GeneLocus.BCR TargetObsColumnEnum.lupus_vs_healthy


Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,ROC-AUC (weighted OvO) per fold with abstention,ROC-AUC (macro OvO) per fold with abstention,...,Unknown/abstention proportion per fold with abstention,Accuracy global with abstention,MCC global with abstention,Unknown/abstention proportion global with abstention,Abstention label global with abstention,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
elasticnet_cv,0.863 +/- 0.029 (in 3 folds),0.863 +/- 0.029 (in 3 folds),0.739 +/- 0.118 (in 3 folds),0.739 +/- 0.118 (in 3 folds),0.747 +/- 0.046 (in 3 folds),0.389 +/- 0.152 (in 3 folds),0.747,0.387,,,...,0.275 +/- 0.183 (in 3 folds),0.544,0.206,0.272,Unknown,158,59,217,0.271889,False
elasticnet_cv.decision_thresholds_tuned,0.863 +/- 0.029 (in 3 folds),0.863 +/- 0.029 (in 3 folds),0.739 +/- 0.118 (in 3 folds),0.739 +/- 0.118 (in 3 folds),0.814 +/- 0.050 (in 3 folds),0.618 +/- 0.061 (in 3 folds),0.823,0.603,,,...,0.275 +/- 0.183 (in 3 folds),0.599,0.367,0.272,Unknown,158,59,217,0.271889,False
linearsvm_ovr,0.863 +/- 0.016 (in 3 folds),0.863 +/- 0.016 (in 3 folds),0.780 +/- 0.027 (in 3 folds),0.780 +/- 0.027 (in 3 folds),0.821 +/- 0.060 (in 3 folds),0.581 +/- 0.141 (in 3 folds),0.821,0.576,0.853 +/- 0.000 (in 1 folds),0.853 +/- 0.000 (in 1 folds),...,0.034 +/- 0.028 (in 2 folds),0.802,0.545,0.023,Unknown,212,5,217,0.023041,False
linearsvm_ovr.decision_thresholds_tuned,0.863 +/- 0.016 (in 3 folds),0.863 +/- 0.016 (in 3 folds),0.780 +/- 0.027 (in 3 folds),0.780 +/- 0.027 (in 3 folds),0.835 +/- 0.044 (in 3 folds),0.618 +/- 0.102 (in 3 folds),0.835,0.605,0.853 +/- 0.000 (in 1 folds),0.853 +/- 0.000 (in 1 folds),...,0.034 +/- 0.028 (in 2 folds),0.816,0.57,0.023,Unknown,212,5,217,0.023041,False
lasso_cv,0.862 +/- 0.035 (in 3 folds),0.862 +/- 0.035 (in 3 folds),0.766 +/- 0.075 (in 3 folds),0.766 +/- 0.075 (in 3 folds),0.764 +/- 0.031 (in 3 folds),0.436 +/- 0.111 (in 3 folds),0.762,0.424,,,...,0.147 +/- 0.087 (in 3 folds),0.65,0.271,0.147,Unknown,185,32,217,0.147465,False
lasso_cv.decision_thresholds_tuned,0.862 +/- 0.035 (in 3 folds),0.862 +/- 0.035 (in 3 folds),0.766 +/- 0.075 (in 3 folds),0.766 +/- 0.075 (in 3 folds),0.838 +/- 0.026 (in 3 folds),0.628 +/- 0.072 (in 3 folds),0.838,0.624,,,...,0.147 +/- 0.087 (in 3 folds),0.714,0.453,0.147,Unknown,185,32,217,0.147465,False
lasso_multiclass,0.859 +/- 0.022 (in 3 folds),0.859 +/- 0.022 (in 3 folds),0.771 +/- 0.036 (in 3 folds),0.771 +/- 0.036 (in 3 folds),0.821 +/- 0.060 (in 3 folds),0.581 +/- 0.141 (in 3 folds),0.821,0.576,0.849 +/- 0.000 (in 1 folds),0.849 +/- 0.000 (in 1 folds),...,0.034 +/- 0.028 (in 2 folds),0.802,0.545,0.023,Unknown,212,5,217,0.023041,False
lasso_multiclass.decision_thresholds_tuned,0.859 +/- 0.022 (in 3 folds),0.859 +/- 0.022 (in 3 folds),0.771 +/- 0.036 (in 3 folds),0.771 +/- 0.036 (in 3 folds),0.808 +/- 0.080 (in 3 folds),0.609 +/- 0.109 (in 3 folds),0.807,0.596,0.849 +/- 0.000 (in 1 folds),0.849 +/- 0.000 (in 1 folds),...,0.034 +/- 0.028 (in 2 folds),0.788,0.569,0.023,Unknown,212,5,217,0.023041,False
rf_multiclass,0.829 +/- 0.034 (in 3 folds),0.829 +/- 0.034 (in 3 folds),0.759 +/- 0.071 (in 3 folds),0.759 +/- 0.071 (in 3 folds),0.808 +/- 0.059 (in 3 folds),0.557 +/- 0.143 (in 3 folds),0.809,0.549,,,...,0.105 +/- 0.124 (in 3 folds),0.724,0.436,0.106,Unknown,194,23,217,0.105991,False
rf_multiclass.decision_thresholds_tuned,0.829 +/- 0.034 (in 3 folds),0.829 +/- 0.034 (in 3 folds),0.759 +/- 0.071 (in 3 folds),0.759 +/- 0.071 (in 3 folds),0.846 +/- 0.031 (in 3 folds),0.637 +/- 0.096 (in 3 folds),0.845,0.639,,,...,0.105 +/- 0.124 (in 3 folds),0.756,0.47,0.106,Unknown,194,23,217,0.105991,False


GeneLocus.BCR TargetObsColumnEnum.ethnicity_condensed_healthy_only


Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,Accuracy per fold with abstention,MCC per fold with abstention,...,Abstention label global with abstention,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes,ROC-AUC (weighted OvO) per fold with abstention,ROC-AUC (macro OvO) per fold with abstention,au-PRC (weighted OvO) per fold with abstention,au-PRC (macro OvO) per fold with abstention
elasticnet_cv,0.654 +/- 0.053 (in 3 folds),0.654 +/- 0.033 (in 3 folds),0.671 +/- 0.069 (in 3 folds),0.683 +/- 0.041 (in 3 folds),0.568 +/- 0.108 (in 3 folds),0.148 +/- 0.257 (in 3 folds),0.565,0.261,0.463 +/- 0.074 (in 3 folds),0.194 +/- 0.115 (in 3 folds),...,Unknown,108,24,132,0.181818,True,,,,
elasticnet_cv.decision_thresholds_tuned,0.654 +/- 0.053 (in 3 folds),0.654 +/- 0.033 (in 3 folds),0.671 +/- 0.069 (in 3 folds),0.683 +/- 0.041 (in 3 folds),0.583 +/- 0.043 (in 3 folds),0.439 +/- 0.079 (in 3 folds),0.583,0.372,0.480 +/- 0.062 (in 3 folds),0.318 +/- 0.076 (in 3 folds),...,Unknown,108,24,132,0.181818,False,,,,
lasso_cv,0.633 +/- 0.068 (in 3 folds),0.621 +/- 0.056 (in 3 folds),0.655 +/- 0.085 (in 3 folds),0.651 +/- 0.062 (in 3 folds),0.519 +/- 0.120 (in 3 folds),0.069 +/- 0.119 (in 3 folds),0.513,0.15,0.437 +/- 0.056 (in 3 folds),0.131 +/- 0.051 (in 3 folds),...,Unknown,113,19,132,0.143939,True,,,,
lasso_cv.decision_thresholds_tuned,0.633 +/- 0.068 (in 3 folds),0.621 +/- 0.056 (in 3 folds),0.655 +/- 0.085 (in 3 folds),0.651 +/- 0.062 (in 3 folds),0.598 +/- 0.097 (in 3 folds),0.433 +/- 0.112 (in 3 folds),0.602,0.4,0.518 +/- 0.132 (in 3 folds),0.357 +/- 0.139 (in 3 folds),...,Unknown,113,19,132,0.143939,False,,,,
rf_multiclass,0.628 +/- 0.041 (in 3 folds),0.622 +/- 0.029 (in 3 folds),0.636 +/- 0.023 (in 3 folds),0.618 +/- 0.014 (in 3 folds),0.579 +/- 0.026 (in 3 folds),0.295 +/- 0.101 (in 3 folds),0.581,0.318,0.543 +/- 0.061 (in 3 folds),0.257 +/- 0.071 (in 3 folds),...,Unknown,124,8,132,0.060606,True,0.634 +/- 0.000 (in 1 folds),0.634 +/- 0.000 (in 1 folds),0.619 +/- 0.000 (in 1 folds),0.605 +/- 0.000 (in 1 folds)
rf_multiclass.decision_thresholds_tuned,0.628 +/- 0.041 (in 3 folds),0.622 +/- 0.029 (in 3 folds),0.636 +/- 0.023 (in 3 folds),0.618 +/- 0.014 (in 3 folds),0.633 +/- 0.054 (in 3 folds),0.432 +/- 0.011 (in 3 folds),0.637,0.43,0.595 +/- 0.093 (in 3 folds),0.381 +/- 0.051 (in 3 folds),...,Unknown,124,8,132,0.060606,True,0.634 +/- 0.000 (in 1 folds),0.634 +/- 0.000 (in 1 folds),0.619 +/- 0.000 (in 1 folds),0.605 +/- 0.000 (in 1 folds)
ridge_cv,0.618 +/- 0.107 (in 3 folds),0.636 +/- 0.120 (in 3 folds),0.621 +/- 0.117 (in 3 folds),0.647 +/- 0.132 (in 3 folds),0.529 +/- 0.111 (in 3 folds),0.059 +/- 0.101 (in 3 folds),0.528,0.115,0.430 +/- 0.061 (in 3 folds),0.129 +/- 0.048 (in 3 folds),...,Unknown,108,24,132,0.181818,True,,,,
ridge_cv.decision_thresholds_tuned,0.618 +/- 0.107 (in 3 folds),0.636 +/- 0.120 (in 3 folds),0.621 +/- 0.117 (in 3 folds),0.647 +/- 0.132 (in 3 folds),0.353 +/- 0.251 (in 3 folds),0.157 +/- 0.273 (in 3 folds),0.361,0.105,0.295 +/- 0.217 (in 3 folds),0.094 +/- 0.252 (in 3 folds),...,Unknown,108,24,132,0.181818,True,,,,
xgboost,0.595 +/- 0.039 (in 3 folds),0.578 +/- 0.037 (in 3 folds),0.641 +/- 0.055 (in 3 folds),0.626 +/- 0.046 (in 3 folds),0.573 +/- 0.008 (in 3 folds),0.285 +/- 0.143 (in 3 folds),0.573,0.307,0.536 +/- 0.042 (in 3 folds),0.248 +/- 0.116 (in 3 folds),...,Unknown,124,8,132,0.060606,False,0.576 +/- 0.000 (in 1 folds),0.578 +/- 0.000 (in 1 folds),0.588 +/- 0.000 (in 1 folds),0.589 +/- 0.000 (in 1 folds)
xgboost.decision_thresholds_tuned,0.595 +/- 0.039 (in 3 folds),0.578 +/- 0.037 (in 3 folds),0.641 +/- 0.055 (in 3 folds),0.626 +/- 0.046 (in 3 folds),0.534 +/- 0.126 (in 3 folds),0.404 +/- 0.098 (in 3 folds),0.524,0.332,0.494 +/- 0.090 (in 3 folds),0.347 +/- 0.040 (in 3 folds),...,Unknown,124,8,132,0.060606,False,0.576 +/- 0.000 (in 1 folds),0.578 +/- 0.000 (in 1 folds),0.588 +/- 0.000 (in 1 folds),0.589 +/- 0.000 (in 1 folds)












GeneLocus.BCR TargetObsColumnEnum.age_group_healthy_only
























































































































































































































































































































































































































































































































































































































































































































































































































































































































Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,Accuracy per fold with abstention,MCC per fold with abstention,...,au-PRC (macro OvO) per fold with abstention,Accuracy global with abstention,MCC global with abstention,Unknown/abstention proportion global with abstention,Abstention label global with abstention,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
linearsvm_ovr,0.537 +/- 0.058 (in 3 folds),0.534 +/- 0.056 (in 3 folds),0.626 +/- 0.063 (in 3 folds),0.626 +/- 0.062 (in 3 folds),0.215 +/- 0.030 (in 3 folds),0.066 +/- 0.016 (in 3 folds),0.215,0.053,0.212 +/- 0.028 (in 3 folds),0.066 +/- 0.017 (in 3 folds),...,0.695 +/- 0.000 (in 1 folds),0.212,0.051,0.015,Unknown,130,2,132,0.015152,True
linearsvm_ovr.decision_thresholds_tuned,0.537 +/- 0.058 (in 3 folds),0.534 +/- 0.056 (in 3 folds),0.626 +/- 0.063 (in 3 folds),0.626 +/- 0.062 (in 3 folds),0.349 +/- 0.079 (in 3 folds),0.265 +/- 0.066 (in 3 folds),0.346,0.243,0.344 +/- 0.083 (in 3 folds),0.262 +/- 0.067 (in 3 folds),...,0.695 +/- 0.000 (in 1 folds),0.341,0.239,0.015,Unknown,130,2,132,0.015152,True
lasso_cv,0.533 +/- 0.041 (in 3 folds),0.530 +/- 0.040 (in 3 folds),0.614 +/- 0.045 (in 3 folds),0.614 +/- 0.043 (in 3 folds),0.214 +/- 0.020 (in 3 folds),0.108 +/- 0.038 (in 3 folds),0.213,0.06,0.205 +/- 0.013 (in 3 folds),0.095 +/- 0.031 (in 3 folds),...,,0.205,0.057,0.038,Unknown,127,5,132,0.037879,True
lasso_cv.decision_thresholds_tuned,0.533 +/- 0.041 (in 3 folds),0.530 +/- 0.040 (in 3 folds),0.614 +/- 0.045 (in 3 folds),0.614 +/- 0.043 (in 3 folds),0.288 +/- 0.074 (in 3 folds),0.227 +/- 0.051 (in 3 folds),0.283,0.153,0.275 +/- 0.062 (in 3 folds),0.210 +/- 0.034 (in 3 folds),...,,0.273,0.147,0.038,Unknown,127,5,132,0.037879,True
lasso_multiclass,0.529 +/- 0.030 (in 3 folds),0.523 +/- 0.036 (in 3 folds),0.628 +/- 0.036 (in 3 folds),0.624 +/- 0.041 (in 3 folds),0.241 +/- 0.053 (in 3 folds),0.110 +/- 0.051 (in 3 folds),0.227,0.088,0.188 +/- 0.039 (in 3 folds),0.084 +/- 0.016 (in 3 folds),...,0.651 +/- 0.000 (in 1 folds),0.189,0.077,0.167,Unknown,110,22,132,0.166667,False
lasso_multiclass.decision_thresholds_tuned,0.529 +/- 0.030 (in 3 folds),0.523 +/- 0.036 (in 3 folds),0.628 +/- 0.036 (in 3 folds),0.624 +/- 0.041 (in 3 folds),0.330 +/- 0.028 (in 3 folds),0.267 +/- 0.051 (in 3 folds),0.336,0.22,0.276 +/- 0.113 (in 3 folds),0.201 +/- 0.119 (in 3 folds),...,0.651 +/- 0.000 (in 1 folds),0.28,0.182,0.167,Unknown,110,22,132,0.166667,True
xgboost,0.525 +/- 0.053 (in 3 folds),0.523 +/- 0.049 (in 3 folds),0.584 +/- 0.074 (in 3 folds),0.582 +/- 0.068 (in 3 folds),0.235 +/- 0.011 (in 3 folds),0.007 +/- 0.132 (in 3 folds),0.239,0.092,0.168 +/- 0.107 (in 3 folds),0.052 +/- 0.048 (in 3 folds),...,,0.167,0.059,0.303,Unknown,92,40,132,0.30303,True
xgboost.decision_thresholds_tuned,0.525 +/- 0.053 (in 3 folds),0.523 +/- 0.049 (in 3 folds),0.584 +/- 0.074 (in 3 folds),0.582 +/- 0.068 (in 3 folds),0.256 +/- 0.132 (in 3 folds),0.174 +/- 0.116 (in 3 folds),0.304,0.173,0.215 +/- 0.170 (in 3 folds),0.131 +/- 0.131 (in 3 folds),...,,0.212,0.115,0.303,Unknown,92,40,132,0.30303,True
rf_multiclass,0.517 +/- 0.039 (in 3 folds),0.517 +/- 0.045 (in 3 folds),0.584 +/- 0.019 (in 3 folds),0.585 +/- 0.023 (in 3 folds),0.228 +/- 0.036 (in 3 folds),0.076 +/- 0.018 (in 3 folds),0.229,0.069,0.226 +/- 0.037 (in 3 folds),0.076 +/- 0.018 (in 3 folds),...,0.591 +/- 0.028 (in 2 folds),0.227,0.065,0.008,Unknown,131,1,132,0.007576,True
rf_multiclass.decision_thresholds_tuned,0.517 +/- 0.039 (in 3 folds),0.517 +/- 0.045 (in 3 folds),0.584 +/- 0.019 (in 3 folds),0.585 +/- 0.023 (in 3 folds),0.335 +/- 0.036 (in 3 folds),0.242 +/- 0.060 (in 3 folds),0.336,0.204,0.332 +/- 0.034 (in 3 folds),0.240 +/- 0.060 (in 3 folds),...,0.591 +/- 0.028 (in 2 folds),0.333,0.202,0.008,Unknown,131,1,132,0.007576,False


GeneLocus.BCR TargetObsColumnEnum.age_group_binary_healthy_only


Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,Accuracy per fold with abstention,MCC per fold with abstention,...,au-PRC (macro OvO) per fold with abstention,Accuracy global with abstention,MCC global with abstention,Unknown/abstention proportion global with abstention,Abstention label global with abstention,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
xgboost,0.667 +/- 0.110 (in 3 folds),0.667 +/- 0.110 (in 3 folds),0.778 +/- 0.105 (in 3 folds),0.778 +/- 0.105 (in 3 folds),0.679 +/- 0.057 (in 3 folds),0.314 +/- 0.119 (in 3 folds),0.673,0.264,0.513 +/- 0.150 (in 3 folds),0.205 +/- 0.036 (in 3 folds),...,0.657 +/- 0.000 (in 1 folds),0.515,0.168,0.235,Unknown,101,31,132,0.234848,False
xgboost.decision_thresholds_tuned,0.667 +/- 0.110 (in 3 folds),0.667 +/- 0.110 (in 3 folds),0.778 +/- 0.105 (in 3 folds),0.778 +/- 0.105 (in 3 folds),0.655 +/- 0.110 (in 3 folds),0.375 +/- 0.071 (in 3 folds),0.653,0.25,0.496 +/- 0.174 (in 3 folds),0.251 +/- 0.056 (in 3 folds),...,0.657 +/- 0.000 (in 1 folds),0.5,0.164,0.235,Unknown,101,31,132,0.234848,False
rf_multiclass,0.616 +/- 0.156 (in 3 folds),0.616 +/- 0.156 (in 3 folds),0.756 +/- 0.062 (in 3 folds),0.756 +/- 0.062 (in 3 folds),0.674 +/- 0.065 (in 3 folds),0.252 +/- 0.196 (in 3 folds),0.664,0.212,0.554 +/- 0.156 (in 3 folds),0.168 +/- 0.095 (in 3 folds),...,0.720 +/- 0.009 (in 2 folds),0.553,0.153,0.167,Unknown,110,22,132,0.166667,False
rf_multiclass.decision_thresholds_tuned,0.616 +/- 0.156 (in 3 folds),0.616 +/- 0.156 (in 3 folds),0.756 +/- 0.062 (in 3 folds),0.756 +/- 0.062 (in 3 folds),0.698 +/- 0.040 (in 3 folds),0.298 +/- 0.161 (in 3 folds),0.691,0.257,0.577 +/- 0.174 (in 3 folds),0.214 +/- 0.091 (in 3 folds),...,0.720 +/- 0.009 (in 2 folds),0.576,0.179,0.167,Unknown,110,22,132,0.166667,False
lasso_cv,0.608 +/- 0.106 (in 3 folds),0.608 +/- 0.106 (in 3 folds),0.736 +/- 0.129 (in 3 folds),0.736 +/- 0.129 (in 3 folds),0.538 +/- 0.116 (in 3 folds),0.115 +/- 0.099 (in 3 folds),0.565,0.11,0.367 +/- 0.190 (in 3 folds),0.080 +/- 0.043 (in 3 folds),...,,0.364,0.061,0.356,Unknown,85,47,132,0.356061,False
lasso_cv.decision_thresholds_tuned,0.608 +/- 0.106 (in 3 folds),0.608 +/- 0.106 (in 3 folds),0.736 +/- 0.129 (in 3 folds),0.736 +/- 0.129 (in 3 folds),0.614 +/- 0.098 (in 3 folds),0.259 +/- 0.226 (in 3 folds),0.624,0.227,0.403 +/- 0.180 (in 3 folds),0.166 +/- 0.174 (in 3 folds),...,,0.402,0.126,0.356,Unknown,85,47,132,0.356061,False
lasso_multiclass,0.597 +/- 0.115 (in 3 folds),0.597 +/- 0.115 (in 3 folds),0.749 +/- 0.105 (in 3 folds),0.749 +/- 0.105 (in 3 folds),0.640 +/- 0.051 (in 3 folds),0.233 +/- 0.106 (in 3 folds),0.64,0.206,0.550 +/- 0.084 (in 3 folds),0.175 +/- 0.055 (in 3 folds),...,0.637 +/- 0.000 (in 1 folds),0.553,0.154,0.136,Unknown,114,18,132,0.136364,False
lasso_multiclass.decision_thresholds_tuned,0.597 +/- 0.115 (in 3 folds),0.597 +/- 0.115 (in 3 folds),0.749 +/- 0.105 (in 3 folds),0.749 +/- 0.105 (in 3 folds),0.654 +/- 0.053 (in 3 folds),0.311 +/- 0.059 (in 3 folds),0.658,0.236,0.564 +/- 0.106 (in 3 folds),0.240 +/- 0.003 (in 3 folds),...,0.637 +/- 0.000 (in 1 folds),0.568,0.175,0.136,Unknown,114,18,132,0.136364,False
linearsvm_ovr,0.596 +/- 0.117 (in 3 folds),0.596 +/- 0.117 (in 3 folds),0.747 +/- 0.108 (in 3 folds),0.747 +/- 0.108 (in 3 folds),0.647 +/- 0.051 (in 3 folds),0.249 +/- 0.087 (in 3 folds),0.649,0.221,0.557 +/- 0.094 (in 3 folds),0.191 +/- 0.047 (in 3 folds),...,0.631 +/- 0.000 (in 1 folds),0.561,0.164,0.136,Unknown,114,18,132,0.136364,False
linearsvm_ovr.decision_thresholds_tuned,0.596 +/- 0.117 (in 3 folds),0.596 +/- 0.117 (in 3 folds),0.747 +/- 0.108 (in 3 folds),0.747 +/- 0.108 (in 3 folds),0.654 +/- 0.053 (in 3 folds),0.311 +/- 0.059 (in 3 folds),0.658,0.236,0.564 +/- 0.106 (in 3 folds),0.240 +/- 0.003 (in 3 folds),...,0.631 +/- 0.000 (in 1 folds),0.568,0.175,0.136,Unknown,114,18,132,0.136364,False


GeneLocus.BCR TargetObsColumnEnum.sex_healthy_only


Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,Accuracy per fold with abstention,MCC per fold with abstention,Unknown/abstention proportion per fold with abstention,Accuracy global with abstention,MCC global with abstention,Unknown/abstention proportion global with abstention,Abstention label global with abstention,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
rf_multiclass,0.560 +/- 0.029 (in 3 folds),0.560 +/- 0.029 (in 3 folds),0.568 +/- 0.192 (in 3 folds),0.568 +/- 0.192 (in 3 folds),0.537 +/- 0.059 (in 3 folds),0.194 +/- 0.069 (in 3 folds),0.541,0.078,0.452 +/- 0.130 (in 3 folds),0.128 +/- 0.053 (in 3 folds),0.169 +/- 0.151 (in 3 folds),0.447,0.048,0.174,Unknown,109,23,132,0.174242,False
rf_multiclass.decision_thresholds_tuned,0.560 +/- 0.029 (in 3 folds),0.560 +/- 0.029 (in 3 folds),0.568 +/- 0.192 (in 3 folds),0.568 +/- 0.192 (in 3 folds),0.592 +/- 0.106 (in 3 folds),0.219 +/- 0.068 (in 3 folds),0.587,0.203,0.489 +/- 0.109 (in 3 folds),0.128 +/- 0.088 (in 3 folds),0.169 +/- 0.151 (in 3 folds),0.485,0.105,0.174,Unknown,109,23,132,0.174242,False
elasticnet_cv,0.556 +/- 0.069 (in 3 folds),0.556 +/- 0.069 (in 3 folds),0.579 +/- 0.179 (in 3 folds),0.579 +/- 0.179 (in 3 folds),0.537 +/- 0.047 (in 3 folds),0.191 +/- 0.099 (in 3 folds),0.541,0.08,0.451 +/- 0.118 (in 3 folds),0.123 +/- 0.047 (in 3 folds),0.169 +/- 0.151 (in 3 folds),0.447,0.054,0.174,Unknown,109,23,132,0.174242,False
elasticnet_cv.decision_thresholds_tuned,0.556 +/- 0.069 (in 3 folds),0.556 +/- 0.069 (in 3 folds),0.579 +/- 0.179 (in 3 folds),0.579 +/- 0.179 (in 3 folds),0.640 +/- 0.096 (in 3 folds),0.307 +/- 0.073 (in 3 folds),0.633,0.316,0.525 +/- 0.075 (in 3 folds),0.177 +/- 0.053 (in 3 folds),0.169 +/- 0.151 (in 3 folds),0.523,0.182,0.174,Unknown,109,23,132,0.174242,False
linearsvm_ovr,0.555 +/- 0.063 (in 3 folds),0.555 +/- 0.063 (in 3 folds),0.537 +/- 0.157 (in 3 folds),0.537 +/- 0.157 (in 3 folds),0.580 +/- 0.009 (in 3 folds),0.173 +/- 0.064 (in 3 folds),0.581,0.15,0.546 +/- 0.041 (in 3 folds),0.156 +/- 0.062 (in 3 folds),0.059 +/- 0.062 (in 3 folds),0.545,0.134,0.061,Unknown,124,8,132,0.060606,False
linearsvm_ovr.decision_thresholds_tuned,0.555 +/- 0.063 (in 3 folds),0.555 +/- 0.063 (in 3 folds),0.537 +/- 0.157 (in 3 folds),0.537 +/- 0.157 (in 3 folds),0.661 +/- 0.063 (in 3 folds),0.238 +/- 0.055 (in 3 folds),0.661,0.315,0.620 +/- 0.031 (in 3 folds),0.203 +/- 0.067 (in 3 folds),0.059 +/- 0.062 (in 3 folds),0.621,0.278,0.061,Unknown,124,8,132,0.060606,False
lasso_multiclass,0.554 +/- 0.058 (in 3 folds),0.554 +/- 0.058 (in 3 folds),0.536 +/- 0.148 (in 3 folds),0.536 +/- 0.148 (in 3 folds),0.556 +/- 0.027 (in 3 folds),0.123 +/- 0.099 (in 3 folds),0.556,0.098,0.523 +/- 0.029 (in 3 folds),0.110 +/- 0.084 (in 3 folds),0.059 +/- 0.062 (in 3 folds),0.523,0.087,0.061,Unknown,124,8,132,0.060606,False
lasso_multiclass.decision_thresholds_tuned,0.554 +/- 0.058 (in 3 folds),0.554 +/- 0.058 (in 3 folds),0.536 +/- 0.148 (in 3 folds),0.536 +/- 0.148 (in 3 folds),0.662 +/- 0.055 (in 3 folds),0.257 +/- 0.030 (in 3 folds),0.661,0.327,0.621 +/- 0.010 (in 3 folds),0.221 +/- 0.063 (in 3 folds),0.059 +/- 0.062 (in 3 folds),0.621,0.284,0.061,Unknown,124,8,132,0.060606,False
lasso_cv,0.547 +/- 0.084 (in 3 folds),0.547 +/- 0.084 (in 3 folds),0.581 +/- 0.187 (in 3 folds),0.581 +/- 0.187 (in 3 folds),0.521 +/- 0.130 (in 3 folds),0.240 +/- 0.079 (in 3 folds),0.49,-0.014,0.376 +/- 0.087 (in 3 folds),0.147 +/- 0.021 (in 3 folds),0.238 +/- 0.267 (in 3 folds),0.379,0.002,0.227,Unknown,102,30,132,0.227273,False
lasso_cv.decision_thresholds_tuned,0.547 +/- 0.084 (in 3 folds),0.547 +/- 0.084 (in 3 folds),0.581 +/- 0.187 (in 3 folds),0.581 +/- 0.187 (in 3 folds),0.624 +/- 0.068 (in 3 folds),0.261 +/- 0.044 (in 3 folds),0.627,0.271,0.478 +/- 0.191 (in 3 folds),0.159 +/- 0.032 (in 3 folds),0.238 +/- 0.267 (in 3 folds),0.485,0.158,0.227,Unknown,102,30,132,0.227273,False


2022-12-31 05:38:44,764 - malid.external.scratch_cache - INFO - Reading network file from local machine cache: /users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/embedded/unirep_fine_tuned/anndatas_scaled/BCR/fold.0.test.h5ad -> /srv/scratch/maximz/cache/d23bdbcb1cb8d1c3007da595727fbbab8cc86779ab8967868314f2da.0.test.h5ad


Only considering the two last: ['.test', '.h5ad'].


Only considering the two last: ['.test', '.h5ad'].








2022-12-31 06:20:59,725 - malid.helpers - INFO - Target TargetObsColumnEnum.covid_vs_healthy: filtering to specimens from diseases ['Covid19', 'Healthy/Background'] only; removed 66 specimens




2022-12-31 06:34:04,351 - malid.helpers - INFO - Target TargetObsColumnEnum.hiv_vs_healthy: filtering to specimens from diseases ['HIV', 'Healthy/Background'] only; removed 53 specimens




2022-12-31 06:49:39,230 - malid.helpers - INFO - Target TargetObsColumnEnum.lupus_vs_healthy: filtering to specimens from diseases ['Lupus', 'Healthy/Background'] only; removed 53 specimens




2022-12-31 07:05:41,906 - malid.helpers - INFO - Target TargetObsColumnEnum.ethnicity_condensed_healthy_only: filtered to specimens with defined ethnicity_condensed column - removed 20 specimens (485965 rows)


2022-12-31 07:06:05,456 - malid.helpers - INFO - Target TargetObsColumnEnum.ethnicity_condensed_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 75 specimens




2022-12-31 07:17:04,920 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_healthy_only: filtered to specimens with defined age_group column - removed 2 specimens (35185 rows)


2022-12-31 07:17:26,474 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 84 specimens




2022-12-31 07:29:11,499 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_binary_healthy_only: filtered to specimens with defined age_group_binary column - removed 2 specimens (35185 rows)


2022-12-31 07:29:36,885 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_binary_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 84 specimens




2022-12-31 07:40:49,548 - malid.helpers - INFO - Target TargetObsColumnEnum.sex_healthy_only: filtered to specimens with defined sex column - removed 1 specimens (11616 rows)


2022-12-31 07:41:10,797 - malid.helpers - INFO - Target TargetObsColumnEnum.sex_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 85 specimens


2022-12-31 07:50:31,110 - malid.external.scratch_cache - INFO - Reading network file from local machine cache: /users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/embedded/unirep_fine_tuned/anndatas_scaled/BCR/fold.1.test.h5ad -> /srv/scratch/maximz/cache/ed1f2608e168c24c508b6bfbbe3a18ba1a4680e5c010e34cd184cae6.1.test.h5ad


Only considering the two last: ['.test', '.h5ad'].


Only considering the two last: ['.test', '.h5ad'].








2022-12-31 08:27:30,413 - malid.helpers - INFO - Target TargetObsColumnEnum.covid_vs_healthy: filtering to specimens from diseases ['Covid19', 'Healthy/Background'] only; removed 67 specimens




2022-12-31 08:37:59,713 - malid.helpers - INFO - Target TargetObsColumnEnum.hiv_vs_healthy: filtering to specimens from diseases ['HIV', 'Healthy/Background'] only; removed 56 specimens




2022-12-31 08:50:41,587 - malid.helpers - INFO - Target TargetObsColumnEnum.lupus_vs_healthy: filtering to specimens from diseases ['Lupus', 'Healthy/Background'] only; removed 55 specimens




2022-12-31 09:04:53,938 - malid.helpers - INFO - Target TargetObsColumnEnum.ethnicity_condensed_healthy_only: filtered to specimens with defined ethnicity_condensed column - removed 23 specimens (507703 rows)


2022-12-31 09:05:08,507 - malid.helpers - INFO - Target TargetObsColumnEnum.ethnicity_condensed_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 82 specimens




2022-12-31 09:15:14,795 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_healthy_only: filtered to specimens with defined age_group column - removed 3 specimens (42791 rows)


2022-12-31 09:15:35,067 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 87 specimens




2022-12-31 09:24:16,390 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_binary_healthy_only: filtered to specimens with defined age_group_binary column - removed 3 specimens (42791 rows)


2022-12-31 09:24:34,727 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_binary_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 87 specimens




2022-12-31 09:33:18,284 - malid.helpers - INFO - Target TargetObsColumnEnum.sex_healthy_only: filtered to specimens with defined sex column - removed 2 specimens (35834 rows)


2022-12-31 09:33:36,434 - malid.helpers - INFO - Target TargetObsColumnEnum.sex_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 88 specimens


2022-12-31 09:40:57,150 - malid.external.scratch_cache - INFO - Reading network file from local machine cache: /users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/embedded/unirep_fine_tuned/anndatas_scaled/BCR/fold.2.test.h5ad -> /srv/scratch/maximz/cache/83dcd409138574af7b7b712ce14967e926c14170bff7801b141edb49.2.test.h5ad


Only considering the two last: ['.test', '.h5ad'].


Only considering the two last: ['.test', '.h5ad'].








2022-12-31 10:18:26,674 - malid.helpers - INFO - Target TargetObsColumnEnum.covid_vs_healthy: filtering to specimens from diseases ['Covid19', 'Healthy/Background'] only; removed 63 specimens




2022-12-31 10:29:20,845 - malid.helpers - INFO - Target TargetObsColumnEnum.hiv_vs_healthy: filtering to specimens from diseases ['HIV', 'Healthy/Background'] only; removed 52 specimens




2022-12-31 10:43:11,936 - malid.helpers - INFO - Target TargetObsColumnEnum.lupus_vs_healthy: filtering to specimens from diseases ['Lupus', 'Healthy/Background'] only; removed 53 specimens




2022-12-31 10:56:51,820 - malid.helpers - INFO - Target TargetObsColumnEnum.ethnicity_condensed_healthy_only: filtered to specimens with defined ethnicity_condensed column - removed 14 specimens (363854 rows)


2022-12-31 10:57:13,830 - malid.helpers - INFO - Target TargetObsColumnEnum.ethnicity_condensed_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 74 specimens




2022-12-31 11:07:13,712 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_healthy_only: filtered to specimens with defined age_group column - removed 2 specimens (10728 rows)


2022-12-31 11:07:35,208 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 83 specimens




2022-12-31 11:17:42,651 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_binary_healthy_only: filtered to specimens with defined age_group_binary column - removed 2 specimens (10728 rows)


2022-12-31 11:18:03,803 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_binary_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 83 specimens




2022-12-31 11:27:46,493 - malid.helpers - INFO - Target TargetObsColumnEnum.sex_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 84 specimens


GeneLocus.BCR TargetObsColumnEnum.disease --> /users/maximz/code/boyd-immune-repertoire-classification/out/convergent_clusters/BCR/disease


Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,Global evaluation column name global,Accuracy per fold with abstention,...,Accuracy global with abstention,MCC global with abstention,Unknown/abstention proportion global with abstention,Abstention label global with abstention,Global evaluation column name global with abstention,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
linearsvm_ovr,0.929 +/- 0.007 (in 3 folds),0.936 +/- 0.007 (in 3 folds),0.931 +/- 0.008 (in 3 folds),0.939 +/- 0.008 (in 3 folds),0.766 +/- 0.010 (in 3 folds),0.655 +/- 0.012 (in 3 folds),0.765,0.654,disease.separate_past_exposures,0.754 +/- 0.015 (in 3 folds),...,0.754,0.64,0.015,Unknown,disease.separate_past_exposures,473,7,480,0.014583,False
linearsvm_ovr.decision_thresholds_tuned,0.929 +/- 0.007 (in 3 folds),0.936 +/- 0.007 (in 3 folds),0.931 +/- 0.008 (in 3 folds),0.939 +/- 0.008 (in 3 folds),0.759 +/- 0.013 (in 3 folds),0.651 +/- 0.016 (in 3 folds),0.759,0.647,disease.separate_past_exposures,0.748 +/- 0.006 (in 3 folds),...,0.748,0.634,0.015,Unknown,disease.separate_past_exposures,473,7,480,0.014583,False
lasso_multiclass,0.926 +/- 0.009 (in 3 folds),0.933 +/- 0.010 (in 3 folds),0.927 +/- 0.014 (in 3 folds),0.935 +/- 0.014 (in 3 folds),0.761 +/- 0.010 (in 3 folds),0.650 +/- 0.022 (in 3 folds),0.761,0.649,disease.separate_past_exposures,0.744 +/- 0.031 (in 3 folds),...,0.744,0.628,0.023,Unknown,disease.separate_past_exposures,469,11,480,0.022917,False
lasso_multiclass.decision_thresholds_tuned,0.926 +/- 0.009 (in 3 folds),0.933 +/- 0.010 (in 3 folds),0.927 +/- 0.014 (in 3 folds),0.935 +/- 0.014 (in 3 folds),0.756 +/- 0.045 (in 3 folds),0.646 +/- 0.060 (in 3 folds),0.757,0.642,disease.separate_past_exposures,0.740 +/- 0.065 (in 3 folds),...,0.74,0.62,0.023,Unknown,disease.separate_past_exposures,469,11,480,0.022917,False
lasso_cv,0.909 +/- 0.014 (in 3 folds),0.918 +/- 0.015 (in 3 folds),0.914 +/- 0.008 (in 3 folds),0.923 +/- 0.008 (in 3 folds),0.544 +/- 0.017 (in 3 folds),0.317 +/- 0.047 (in 3 folds),0.543,0.318,disease.separate_past_exposures,0.523 +/- 0.016 (in 3 folds),...,0.523,0.261,0.037,Unknown,disease.separate_past_exposures,462,18,480,0.0375,False
lasso_cv.decision_thresholds_tuned,0.909 +/- 0.014 (in 3 folds),0.918 +/- 0.015 (in 3 folds),0.914 +/- 0.008 (in 3 folds),0.923 +/- 0.008 (in 3 folds),0.758 +/- 0.014 (in 3 folds),0.644 +/- 0.024 (in 3 folds),0.758,0.643,disease.separate_past_exposures,0.729 +/- 0.033 (in 3 folds),...,0.729,0.605,0.037,Unknown,disease.separate_past_exposures,462,18,480,0.0375,False
elasticnet_cv,0.909 +/- 0.011 (in 3 folds),0.916 +/- 0.011 (in 3 folds),0.914 +/- 0.009 (in 3 folds),0.923 +/- 0.009 (in 3 folds),0.610 +/- 0.132 (in 3 folds),0.390 +/- 0.278 (in 3 folds),0.612,0.44,disease.separate_past_exposures,0.604 +/- 0.141 (in 3 folds),...,0.604,0.424,0.013,Unknown,disease.separate_past_exposures,474,6,480,0.0125,False
elasticnet_cv.decision_thresholds_tuned,0.909 +/- 0.011 (in 3 folds),0.916 +/- 0.011 (in 3 folds),0.914 +/- 0.009 (in 3 folds),0.923 +/- 0.009 (in 3 folds),0.734 +/- 0.048 (in 3 folds),0.625 +/- 0.051 (in 3 folds),0.734,0.615,disease.separate_past_exposures,0.724 +/- 0.047 (in 3 folds),...,0.725,0.603,0.013,Unknown,disease.separate_past_exposures,474,6,480,0.0125,False
ridge_cv,0.907 +/- 0.010 (in 3 folds),0.917 +/- 0.011 (in 3 folds),0.914 +/- 0.006 (in 3 folds),0.924 +/- 0.006 (in 3 folds),0.576 +/- 0.065 (in 3 folds),0.371 +/- 0.124 (in 3 folds),0.577,0.383,disease.separate_past_exposures,0.572 +/- 0.068 (in 3 folds),...,0.573,0.374,0.006,Unknown,disease.separate_past_exposures,477,3,480,0.00625,False
ridge_cv.decision_thresholds_tuned,0.907 +/- 0.010 (in 3 folds),0.917 +/- 0.011 (in 3 folds),0.914 +/- 0.006 (in 3 folds),0.924 +/- 0.006 (in 3 folds),0.761 +/- 0.027 (in 3 folds),0.654 +/- 0.048 (in 3 folds),0.761,0.654,disease.separate_past_exposures,0.756 +/- 0.031 (in 3 folds),...,0.756,0.647,0.006,Unknown,disease.separate_past_exposures,477,3,480,0.00625,False


/users/maximz/code/boyd-immune-repertoire-classification/out/convergent_clusters/BCR/disease/train_smaller_model.compare_model_scores.test_set_performance.tsv


GeneLocus.BCR TargetObsColumnEnum.disease_all_demographics_present --> /users/maximz/code/boyd-immune-repertoire-classification/out/convergent_clusters/BCR/disease_all_demographics_present


Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,Global evaluation column name global,Accuracy per fold with abstention,...,Global evaluation column name global with abstention,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes,ROC-AUC (weighted OvO) per fold with abstention,ROC-AUC (macro OvO) per fold with abstention,au-PRC (weighted OvO) per fold with abstention,au-PRC (macro OvO) per fold with abstention
lasso_multiclass,0.920 +/- 0.020 (in 3 folds),0.927 +/- 0.022 (in 3 folds),0.924 +/- 0.014 (in 3 folds),0.932 +/- 0.015 (in 3 folds),0.730 +/- 0.051 (in 3 folds),0.611 +/- 0.069 (in 3 folds),0.729,0.609,disease.separate_past_exposures,0.719 +/- 0.046 (in 3 folds),...,disease.separate_past_exposures,414,6,420,0.014286,False,,,,
lasso_multiclass.decision_thresholds_tuned,0.920 +/- 0.020 (in 3 folds),0.927 +/- 0.022 (in 3 folds),0.924 +/- 0.014 (in 3 folds),0.932 +/- 0.015 (in 3 folds),0.698 +/- 0.066 (in 3 folds),0.596 +/- 0.069 (in 3 folds),0.698,0.573,disease.separate_past_exposures,0.688 +/- 0.066 (in 3 folds),...,disease.separate_past_exposures,414,6,420,0.014286,False,,,,
linearsvm_ovr,0.915 +/- 0.017 (in 3 folds),0.923 +/- 0.019 (in 3 folds),0.921 +/- 0.013 (in 3 folds),0.930 +/- 0.014 (in 3 folds),0.733 +/- 0.029 (in 3 folds),0.605 +/- 0.038 (in 3 folds),0.733,0.602,disease.separate_past_exposures,0.724 +/- 0.023 (in 3 folds),...,disease.separate_past_exposures,415,5,420,0.011905,False,0.915 +/- 0.000 (in 1 folds),0.924 +/- 0.000 (in 1 folds),0.926 +/- 0.000 (in 1 folds),0.935 +/- 0.000 (in 1 folds)
linearsvm_ovr.decision_thresholds_tuned,0.915 +/- 0.017 (in 3 folds),0.923 +/- 0.019 (in 3 folds),0.921 +/- 0.013 (in 3 folds),0.930 +/- 0.014 (in 3 folds),0.670 +/- 0.053 (in 3 folds),0.559 +/- 0.057 (in 3 folds),0.67,0.527,disease.separate_past_exposures,0.662 +/- 0.052 (in 3 folds),...,disease.separate_past_exposures,415,5,420,0.011905,False,0.915 +/- 0.000 (in 1 folds),0.924 +/- 0.000 (in 1 folds),0.926 +/- 0.000 (in 1 folds),0.935 +/- 0.000 (in 1 folds)
ridge_cv,0.914 +/- 0.031 (in 3 folds),0.923 +/- 0.031 (in 3 folds),0.924 +/- 0.015 (in 3 folds),0.933 +/- 0.015 (in 3 folds),0.527 +/- 0.160 (in 3 folds),0.192 +/- 0.333 (in 3 folds),0.531,0.302,disease.separate_past_exposures,0.502 +/- 0.174 (in 3 folds),...,disease.separate_past_exposures,397,23,420,0.054762,False,,,,
ridge_cv.decision_thresholds_tuned,0.914 +/- 0.031 (in 3 folds),0.923 +/- 0.031 (in 3 folds),0.924 +/- 0.015 (in 3 folds),0.933 +/- 0.015 (in 3 folds),0.424 +/- 0.341 (in 3 folds),0.218 +/- 0.378 (in 3 folds),0.423,0.197,disease.separate_past_exposures,0.401 +/- 0.335 (in 3 folds),...,disease.separate_past_exposures,397,23,420,0.054762,False,,,,
elasticnet_cv,0.907 +/- 0.015 (in 3 folds),0.915 +/- 0.016 (in 3 folds),0.914 +/- 0.009 (in 3 folds),0.925 +/- 0.008 (in 3 folds),0.637 +/- 0.132 (in 3 folds),0.432 +/- 0.294 (in 3 folds),0.638,0.481,disease.separate_past_exposures,0.629 +/- 0.141 (in 3 folds),...,disease.separate_past_exposures,414,6,420,0.014286,False,0.921 +/- 0.000 (in 1 folds),0.930 +/- 0.000 (in 1 folds),0.919 +/- 0.000 (in 1 folds),0.930 +/- 0.000 (in 1 folds)
elasticnet_cv.decision_thresholds_tuned,0.907 +/- 0.015 (in 3 folds),0.915 +/- 0.016 (in 3 folds),0.914 +/- 0.009 (in 3 folds),0.925 +/- 0.008 (in 3 folds),0.727 +/- 0.036 (in 3 folds),0.609 +/- 0.065 (in 3 folds),0.727,0.594,disease.separate_past_exposures,0.717 +/- 0.042 (in 3 folds),...,disease.separate_past_exposures,414,6,420,0.014286,False,0.921 +/- 0.000 (in 1 folds),0.930 +/- 0.000 (in 1 folds),0.919 +/- 0.000 (in 1 folds),0.930 +/- 0.000 (in 1 folds)
xgboost,0.904 +/- 0.005 (in 3 folds),0.910 +/- 0.007 (in 3 folds),0.910 +/- 0.003 (in 3 folds),0.920 +/- 0.003 (in 3 folds),0.756 +/- 0.019 (in 3 folds),0.642 +/- 0.029 (in 3 folds),0.757,0.64,disease.separate_past_exposures,0.733 +/- 0.036 (in 3 folds),...,disease.separate_past_exposures,407,13,420,0.030952,False,0.903 +/- 0.000 (in 1 folds),0.910 +/- 0.000 (in 1 folds),0.914 +/- 0.000 (in 1 folds),0.923 +/- 0.000 (in 1 folds)
xgboost.decision_thresholds_tuned,0.904 +/- 0.005 (in 3 folds),0.910 +/- 0.007 (in 3 folds),0.910 +/- 0.003 (in 3 folds),0.920 +/- 0.003 (in 3 folds),0.737 +/- 0.024 (in 3 folds),0.613 +/- 0.029 (in 3 folds),0.737,0.613,disease.separate_past_exposures,0.714 +/- 0.031 (in 3 folds),...,disease.separate_past_exposures,407,13,420,0.030952,False,0.903 +/- 0.000 (in 1 folds),0.910 +/- 0.000 (in 1 folds),0.914 +/- 0.000 (in 1 folds),0.923 +/- 0.000 (in 1 folds)


/users/maximz/code/boyd-immune-repertoire-classification/out/convergent_clusters/BCR/disease_all_demographics_present/train_smaller_model.compare_model_scores.test_set_performance.tsv


GeneLocus.BCR TargetObsColumnEnum.covid_vs_healthy --> /users/maximz/code/boyd-immune-repertoire-classification/out/convergent_clusters/BCR/covid_vs_healthy


Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,Global evaluation column name global,Accuracy per fold with abstention,...,Accuracy global with abstention,MCC global with abstention,Unknown/abstention proportion global with abstention,Abstention label global with abstention,Global evaluation column name global with abstention,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
ridge_cv,0.991 +/- 0.007 (in 3 folds),0.991 +/- 0.007 (in 3 folds),0.997 +/- 0.002 (in 3 folds),0.997 +/- 0.002 (in 3 folds),0.776 +/- 0.010 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.776,0.0,disease.separate_past_exposures,0.757 +/- 0.010 (in 3 folds),...,0.757,-0.015,0.025,Unknown,disease.separate_past_exposures,277,7,284,0.024648,True
ridge_cv.decision_thresholds_tuned,0.991 +/- 0.007 (in 3 folds),0.991 +/- 0.007 (in 3 folds),0.997 +/- 0.002 (in 3 folds),0.997 +/- 0.002 (in 3 folds),0.776 +/- 0.010 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.776,0.0,disease.separate_past_exposures,0.757 +/- 0.010 (in 3 folds),...,0.757,-0.015,0.025,Unknown,disease.separate_past_exposures,277,7,284,0.024648,True
linearsvm_ovr,0.988 +/- 0.005 (in 3 folds),0.988 +/- 0.005 (in 3 folds),0.996 +/- 0.001 (in 3 folds),0.996 +/- 0.001 (in 3 folds),0.946 +/- 0.023 (in 3 folds),0.849 +/- 0.067 (in 3 folds),0.946,0.85,disease.separate_past_exposures,0.933 +/- 0.033 (in 3 folds),...,0.933,0.819,0.014,Unknown,disease.separate_past_exposures,280,4,284,0.014085,False
linearsvm_ovr.decision_thresholds_tuned,0.988 +/- 0.005 (in 3 folds),0.988 +/- 0.005 (in 3 folds),0.996 +/- 0.001 (in 3 folds),0.996 +/- 0.001 (in 3 folds),0.953 +/- 0.036 (in 3 folds),0.862 +/- 0.110 (in 3 folds),0.954,0.865,disease.separate_past_exposures,0.940 +/- 0.041 (in 3 folds),...,0.94,0.831,0.014,Unknown,disease.separate_past_exposures,280,4,284,0.014085,False
lasso_cv,0.988 +/- 0.003 (in 3 folds),0.988 +/- 0.003 (in 3 folds),0.996 +/- 0.001 (in 3 folds),0.996 +/- 0.001 (in 3 folds),0.868 +/- 0.025 (in 3 folds),0.580 +/- 0.109 (in 3 folds),0.868,0.587,disease.separate_past_exposures,0.856 +/- 0.032 (in 3 folds),...,0.856,0.542,0.014,Unknown,disease.separate_past_exposures,280,4,284,0.014085,False
lasso_cv.decision_thresholds_tuned,0.988 +/- 0.003 (in 3 folds),0.988 +/- 0.003 (in 3 folds),0.996 +/- 0.001 (in 3 folds),0.996 +/- 0.001 (in 3 folds),0.940 +/- 0.042 (in 3 folds),0.843 +/- 0.091 (in 3 folds),0.939,0.827,disease.separate_past_exposures,0.926 +/- 0.031 (in 3 folds),...,0.926,0.796,0.014,Unknown,disease.separate_past_exposures,280,4,284,0.014085,False
lasso_multiclass,0.986 +/- 0.010 (in 3 folds),0.986 +/- 0.010 (in 3 folds),0.996 +/- 0.002 (in 3 folds),0.996 +/- 0.002 (in 3 folds),0.949 +/- 0.042 (in 3 folds),0.852 +/- 0.126 (in 3 folds),0.95,0.855,disease.separate_past_exposures,0.936 +/- 0.047 (in 3 folds),...,0.937,0.822,0.014,Unknown,disease.separate_past_exposures,280,4,284,0.014085,False
lasso_multiclass.decision_thresholds_tuned,0.986 +/- 0.010 (in 3 folds),0.986 +/- 0.010 (in 3 folds),0.996 +/- 0.002 (in 3 folds),0.996 +/- 0.002 (in 3 folds),0.924 +/- 0.040 (in 3 folds),0.797 +/- 0.101 (in 3 folds),0.925,0.793,disease.separate_past_exposures,0.912 +/- 0.050 (in 3 folds),...,0.912,0.764,0.014,Unknown,disease.separate_past_exposures,280,4,284,0.014085,False
elasticnet_cv,0.985 +/- 0.006 (in 3 folds),0.985 +/- 0.006 (in 3 folds),0.995 +/- 0.002 (in 3 folds),0.995 +/- 0.002 (in 3 folds),0.801 +/- 0.020 (in 3 folds),0.230 +/- 0.048 (in 3 folds),0.801,0.233,disease.separate_past_exposures,0.778 +/- 0.009 (in 3 folds),...,0.778,0.177,0.028,Unknown,disease.separate_past_exposures,276,8,284,0.028169,False
elasticnet_cv.decision_thresholds_tuned,0.985 +/- 0.006 (in 3 folds),0.985 +/- 0.006 (in 3 folds),0.995 +/- 0.002 (in 3 folds),0.995 +/- 0.002 (in 3 folds),0.945 +/- 0.024 (in 3 folds),0.833 +/- 0.081 (in 3 folds),0.946,0.837,disease.separate_past_exposures,0.919 +/- 0.053 (in 3 folds),...,0.919,0.775,0.028,Unknown,disease.separate_past_exposures,276,8,284,0.028169,False


/users/maximz/code/boyd-immune-repertoire-classification/out/convergent_clusters/BCR/covid_vs_healthy/train_smaller_model.compare_model_scores.test_set_performance.tsv


GeneLocus.BCR TargetObsColumnEnum.hiv_vs_healthy --> /users/maximz/code/boyd-immune-repertoire-classification/out/convergent_clusters/BCR/hiv_vs_healthy


Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,Global evaluation column name global,Accuracy per fold with abstention,...,Global evaluation column name global with abstention,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes,ROC-AUC (weighted OvO) per fold with abstention,ROC-AUC (macro OvO) per fold with abstention,au-PRC (weighted OvO) per fold with abstention,au-PRC (macro OvO) per fold with abstention
elasticnet_cv,0.981 +/- 0.013 (in 3 folds),0.981 +/- 0.013 (in 3 folds),0.990 +/- 0.007 (in 3 folds),0.990 +/- 0.007 (in 3 folds),0.805 +/- 0.088 (in 3 folds),0.531 +/- 0.226 (in 3 folds),0.805,0.545,disease.separate_past_exposures,0.777 +/- 0.077 (in 3 folds),...,disease.separate_past_exposures,308,11,319,0.034483,False,,,,
elasticnet_cv.decision_thresholds_tuned,0.981 +/- 0.013 (in 3 folds),0.981 +/- 0.013 (in 3 folds),0.990 +/- 0.007 (in 3 folds),0.990 +/- 0.007 (in 3 folds),0.932 +/- 0.018 (in 3 folds),0.850 +/- 0.036 (in 3 folds),0.932,0.847,disease.separate_past_exposures,0.900 +/- 0.023 (in 3 folds),...,disease.separate_past_exposures,308,11,319,0.034483,False,,,,
ridge_cv,0.981 +/- 0.007 (in 3 folds),0.981 +/- 0.007 (in 3 folds),0.992 +/- 0.002 (in 3 folds),0.992 +/- 0.002 (in 3 folds),0.690 +/- 0.004 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.69,0.0,disease.separate_past_exposures,0.683 +/- 0.010 (in 3 folds),...,disease.separate_past_exposures,316,3,319,0.009404,True,0.981 +/- 0.000 (in 1 folds),0.981 +/- 0.000 (in 1 folds),0.992 +/- 0.000 (in 1 folds),0.992 +/- 0.000 (in 1 folds)
ridge_cv.decision_thresholds_tuned,0.981 +/- 0.007 (in 3 folds),0.981 +/- 0.007 (in 3 folds),0.992 +/- 0.002 (in 3 folds),0.992 +/- 0.002 (in 3 folds),0.690 +/- 0.004 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.69,0.0,disease.separate_past_exposures,0.683 +/- 0.010 (in 3 folds),...,disease.separate_past_exposures,316,3,319,0.009404,True,0.981 +/- 0.000 (in 1 folds),0.981 +/- 0.000 (in 1 folds),0.992 +/- 0.000 (in 1 folds),0.992 +/- 0.000 (in 1 folds)
lasso_cv,0.979 +/- 0.014 (in 3 folds),0.979 +/- 0.014 (in 3 folds),0.990 +/- 0.006 (in 3 folds),0.990 +/- 0.006 (in 3 folds),0.878 +/- 0.023 (in 3 folds),0.718 +/- 0.053 (in 3 folds),0.878,0.716,disease.separate_past_exposures,0.856 +/- 0.022 (in 3 folds),...,disease.separate_past_exposures,311,8,319,0.025078,False,,,,
lasso_cv.decision_thresholds_tuned,0.979 +/- 0.014 (in 3 folds),0.979 +/- 0.014 (in 3 folds),0.990 +/- 0.006 (in 3 folds),0.990 +/- 0.006 (in 3 folds),0.907 +/- 0.026 (in 3 folds),0.790 +/- 0.071 (in 3 folds),0.907,0.786,disease.separate_past_exposures,0.884 +/- 0.020 (in 3 folds),...,disease.separate_past_exposures,311,8,319,0.025078,False,,,,
linearsvm_ovr,0.978 +/- 0.010 (in 3 folds),0.978 +/- 0.010 (in 3 folds),0.990 +/- 0.004 (in 3 folds),0.990 +/- 0.004 (in 3 folds),0.911 +/- 0.029 (in 3 folds),0.789 +/- 0.070 (in 3 folds),0.911,0.789,disease.separate_past_exposures,0.900 +/- 0.028 (in 3 folds),...,disease.separate_past_exposures,315,4,319,0.012539,False,0.982 +/- 0.000 (in 1 folds),0.982 +/- 0.000 (in 1 folds),0.992 +/- 0.000 (in 1 folds),0.992 +/- 0.000 (in 1 folds)
linearsvm_ovr.decision_thresholds_tuned,0.978 +/- 0.010 (in 3 folds),0.978 +/- 0.010 (in 3 folds),0.990 +/- 0.004 (in 3 folds),0.990 +/- 0.004 (in 3 folds),0.918 +/- 0.028 (in 3 folds),0.807 +/- 0.071 (in 3 folds),0.917,0.805,disease.separate_past_exposures,0.906 +/- 0.031 (in 3 folds),...,disease.separate_past_exposures,315,4,319,0.012539,False,0.982 +/- 0.000 (in 1 folds),0.982 +/- 0.000 (in 1 folds),0.992 +/- 0.000 (in 1 folds),0.992 +/- 0.000 (in 1 folds)
lasso_multiclass,0.977 +/- 0.013 (in 3 folds),0.977 +/- 0.013 (in 3 folds),0.990 +/- 0.006 (in 3 folds),0.990 +/- 0.006 (in 3 folds),0.908 +/- 0.026 (in 3 folds),0.782 +/- 0.064 (in 3 folds),0.907,0.781,disease.separate_past_exposures,0.890 +/- 0.025 (in 3 folds),...,disease.separate_past_exposures,313,6,319,0.018809,False,,,,
lasso_multiclass.decision_thresholds_tuned,0.977 +/- 0.013 (in 3 folds),0.977 +/- 0.013 (in 3 folds),0.990 +/- 0.006 (in 3 folds),0.990 +/- 0.006 (in 3 folds),0.917 +/- 0.035 (in 3 folds),0.810 +/- 0.088 (in 3 folds),0.917,0.805,disease.separate_past_exposures,0.900 +/- 0.034 (in 3 folds),...,disease.separate_past_exposures,313,6,319,0.018809,False,,,,


/users/maximz/code/boyd-immune-repertoire-classification/out/convergent_clusters/BCR/hiv_vs_healthy/train_smaller_model.compare_model_scores.test_set_performance.tsv


GeneLocus.BCR TargetObsColumnEnum.lupus_vs_healthy --> /users/maximz/code/boyd-immune-repertoire-classification/out/convergent_clusters/BCR/lupus_vs_healthy


Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,Global evaluation column name global,Accuracy per fold with abstention,...,Accuracy global with abstention,MCC global with abstention,Unknown/abstention proportion global with abstention,Abstention label global with abstention,Global evaluation column name global with abstention,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
elasticnet_cv,0.863 +/- 0.042 (in 3 folds),0.863 +/- 0.042 (in 3 folds),0.745 +/- 0.066 (in 3 folds),0.745 +/- 0.066 (in 3 folds),0.769 +/- 0.010 (in 3 folds),0.442 +/- 0.066 (in 3 folds),0.769,0.424,disease.separate_past_exposures,0.575 +/- 0.123 (in 3 folds),...,0.574,0.232,0.254,Unknown,disease.separate_past_exposures,238,81,319,0.253918,False
elasticnet_cv.decision_thresholds_tuned,0.863 +/- 0.042 (in 3 folds),0.863 +/- 0.042 (in 3 folds),0.745 +/- 0.066 (in 3 folds),0.745 +/- 0.066 (in 3 folds),0.804 +/- 0.046 (in 3 folds),0.563 +/- 0.089 (in 3 folds),0.807,0.549,disease.separate_past_exposures,0.604 +/- 0.142 (in 3 folds),...,0.602,0.338,0.254,Unknown,disease.separate_past_exposures,238,81,319,0.253918,False
lasso_cv,0.847 +/- 0.048 (in 3 folds),0.847 +/- 0.048 (in 3 folds),0.746 +/- 0.066 (in 3 folds),0.746 +/- 0.066 (in 3 folds),0.774 +/- 0.026 (in 3 folds),0.457 +/- 0.062 (in 3 folds),0.772,0.421,disease.separate_past_exposures,0.681 +/- 0.077 (in 3 folds),...,0.68,0.292,0.119,Unknown,disease.separate_past_exposures,281,38,319,0.119122,False
lasso_cv.decision_thresholds_tuned,0.847 +/- 0.048 (in 3 folds),0.847 +/- 0.048 (in 3 folds),0.746 +/- 0.066 (in 3 folds),0.746 +/- 0.066 (in 3 folds),0.811 +/- 0.038 (in 3 folds),0.536 +/- 0.099 (in 3 folds),0.808,0.53,disease.separate_past_exposures,0.712 +/- 0.060 (in 3 folds),...,0.712,0.401,0.119,Unknown,disease.separate_past_exposures,281,38,319,0.119122,False
linearsvm_ovr,0.837 +/- 0.002 (in 3 folds),0.837 +/- 0.002 (in 3 folds),0.727 +/- 0.019 (in 3 folds),0.727 +/- 0.019 (in 3 folds),0.776 +/- 0.023 (in 3 folds),0.457 +/- 0.058 (in 3 folds),0.776,0.455,disease.separate_past_exposures,0.758 +/- 0.017 (in 3 folds),...,0.759,0.435,0.022,Unknown,disease.separate_past_exposures,312,7,319,0.021944,False
linearsvm_ovr.decision_thresholds_tuned,0.837 +/- 0.002 (in 3 folds),0.837 +/- 0.002 (in 3 folds),0.727 +/- 0.019 (in 3 folds),0.727 +/- 0.019 (in 3 folds),0.776 +/- 0.023 (in 3 folds),0.449 +/- 0.050 (in 3 folds),0.776,0.444,disease.separate_past_exposures,0.758 +/- 0.017 (in 3 folds),...,0.759,0.424,0.022,Unknown,disease.separate_past_exposures,312,7,319,0.021944,False
lasso_multiclass,0.832 +/- 0.008 (in 3 folds),0.832 +/- 0.008 (in 3 folds),0.715 +/- 0.009 (in 3 folds),0.715 +/- 0.009 (in 3 folds),0.776 +/- 0.015 (in 3 folds),0.457 +/- 0.034 (in 3 folds),0.776,0.455,disease.separate_past_exposures,0.758 +/- 0.010 (in 3 folds),...,0.759,0.435,0.022,Unknown,disease.separate_past_exposures,312,7,319,0.021944,False
lasso_multiclass.decision_thresholds_tuned,0.832 +/- 0.008 (in 3 folds),0.832 +/- 0.008 (in 3 folds),0.715 +/- 0.009 (in 3 folds),0.715 +/- 0.009 (in 3 folds),0.741 +/- 0.070 (in 3 folds),0.461 +/- 0.017 (in 3 folds),0.74,0.429,disease.separate_past_exposures,0.724 +/- 0.068 (in 3 folds),...,0.724,0.411,0.022,Unknown,disease.separate_past_exposures,312,7,319,0.021944,False
xgboost,0.825 +/- 0.057 (in 3 folds),0.825 +/- 0.057 (in 3 folds),0.721 +/- 0.078 (in 3 folds),0.721 +/- 0.078 (in 3 folds),0.764 +/- 0.018 (in 3 folds),0.437 +/- 0.059 (in 3 folds),0.762,0.435,disease.separate_past_exposures,0.684 +/- 0.079 (in 3 folds),...,0.683,0.348,0.103,Unknown,disease.separate_past_exposures,286,33,319,0.103448,False
xgboost.decision_thresholds_tuned,0.825 +/- 0.057 (in 3 folds),0.825 +/- 0.057 (in 3 folds),0.721 +/- 0.078 (in 3 folds),0.721 +/- 0.078 (in 3 folds),0.788 +/- 0.058 (in 3 folds),0.486 +/- 0.143 (in 3 folds),0.783,0.474,disease.separate_past_exposures,0.703 +/- 0.047 (in 3 folds),...,0.702,0.375,0.103,Unknown,disease.separate_past_exposures,286,33,319,0.103448,False


/users/maximz/code/boyd-immune-repertoire-classification/out/convergent_clusters/BCR/lupus_vs_healthy/train_smaller_model.compare_model_scores.test_set_performance.tsv


GeneLocus.BCR TargetObsColumnEnum.ethnicity_condensed_healthy_only --> /users/maximz/code/boyd-immune-repertoire-classification/out/convergent_clusters/BCR/ethnicity_condensed_healthy_only


Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,Accuracy per fold with abstention,MCC per fold with abstention,...,Abstention label global with abstention,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes,ROC-AUC (weighted OvO) per fold with abstention,ROC-AUC (macro OvO) per fold with abstention,au-PRC (weighted OvO) per fold with abstention,au-PRC (macro OvO) per fold with abstention
elasticnet_cv,0.639 +/- 0.040 (in 3 folds),0.664 +/- 0.060 (in 3 folds),0.660 +/- 0.035 (in 3 folds),0.682 +/- 0.056 (in 3 folds),0.597 +/- 0.074 (in 3 folds),0.132 +/- 0.122 (in 3 folds),0.601,0.174,0.540 +/- 0.080 (in 3 folds),0.099 +/- 0.103 (in 3 folds),...,Unknown,173,18,191,0.094241,True,,,,
elasticnet_cv.decision_thresholds_tuned,0.639 +/- 0.040 (in 3 folds),0.664 +/- 0.060 (in 3 folds),0.660 +/- 0.035 (in 3 folds),0.682 +/- 0.056 (in 3 folds),0.519 +/- 0.101 (in 3 folds),0.261 +/- 0.044 (in 3 folds),0.52,0.216,0.471 +/- 0.111 (in 3 folds),0.220 +/- 0.047 (in 3 folds),...,Unknown,173,18,191,0.094241,False,,,,
lasso_cv,0.618 +/- 0.052 (in 3 folds),0.636 +/- 0.091 (in 3 folds),0.635 +/- 0.038 (in 3 folds),0.649 +/- 0.073 (in 3 folds),0.597 +/- 0.103 (in 3 folds),0.163 +/- 0.166 (in 3 folds),0.602,0.191,0.550 +/- 0.113 (in 3 folds),0.111 +/- 0.113 (in 3 folds),...,Unknown,176,15,191,0.078534,True,,,,
lasso_cv.decision_thresholds_tuned,0.618 +/- 0.052 (in 3 folds),0.636 +/- 0.091 (in 3 folds),0.635 +/- 0.038 (in 3 folds),0.649 +/- 0.073 (in 3 folds),0.499 +/- 0.145 (in 3 folds),0.219 +/- 0.115 (in 3 folds),0.494,0.204,0.456 +/- 0.127 (in 3 folds),0.181 +/- 0.082 (in 3 folds),...,Unknown,176,15,191,0.078534,False,,,,
rf_multiclass,0.612 +/- 0.066 (in 3 folds),0.620 +/- 0.073 (in 3 folds),0.634 +/- 0.077 (in 3 folds),0.641 +/- 0.108 (in 3 folds),0.568 +/- 0.078 (in 3 folds),0.165 +/- 0.172 (in 3 folds),0.571,0.143,0.547 +/- 0.062 (in 3 folds),0.153 +/- 0.158 (in 3 folds),...,Unknown,184,7,191,0.036649,True,0.688 +/- 0.000 (in 1 folds),0.702 +/- 0.000 (in 1 folds),0.722 +/- 0.000 (in 1 folds),0.764 +/- 0.000 (in 1 folds)
rf_multiclass.decision_thresholds_tuned,0.612 +/- 0.066 (in 3 folds),0.620 +/- 0.073 (in 3 folds),0.634 +/- 0.077 (in 3 folds),0.641 +/- 0.108 (in 3 folds),0.619 +/- 0.027 (in 3 folds),0.282 +/- 0.043 (in 3 folds),0.62,0.253,0.597 +/- 0.019 (in 3 folds),0.265 +/- 0.059 (in 3 folds),...,Unknown,184,7,191,0.036649,True,0.688 +/- 0.000 (in 1 folds),0.702 +/- 0.000 (in 1 folds),0.722 +/- 0.000 (in 1 folds),0.764 +/- 0.000 (in 1 folds)
ridge_cv,0.586 +/- 0.076 (in 3 folds),0.603 +/- 0.092 (in 3 folds),0.605 +/- 0.094 (in 3 folds),0.621 +/- 0.105 (in 3 folds),0.569 +/- 0.076 (in 3 folds),-0.022 +/- 0.037 (in 3 folds),0.572,-0.045,0.514 +/- 0.077 (in 3 folds),0.015 +/- 0.023 (in 3 folds),...,Unknown,173,18,191,0.094241,True,,,,
ridge_cv.decision_thresholds_tuned,0.586 +/- 0.076 (in 3 folds),0.603 +/- 0.092 (in 3 folds),0.605 +/- 0.094 (in 3 folds),0.621 +/- 0.105 (in 3 folds),0.356 +/- 0.244 (in 3 folds),0.044 +/- 0.077 (in 3 folds),0.358,0.084,0.319 +/- 0.217 (in 3 folds),0.004 +/- 0.098 (in 3 folds),...,Unknown,173,18,191,0.094241,True,,,,
xgboost,0.571 +/- 0.025 (in 3 folds),0.556 +/- 0.031 (in 3 folds),0.623 +/- 0.023 (in 3 folds),0.624 +/- 0.046 (in 3 folds),0.563 +/- 0.084 (in 3 folds),0.182 +/- 0.139 (in 3 folds),0.565,0.169,0.541 +/- 0.066 (in 3 folds),0.172 +/- 0.130 (in 3 folds),...,Unknown,184,7,191,0.036649,False,0.596 +/- 0.000 (in 1 folds),0.592 +/- 0.000 (in 1 folds),0.649 +/- 0.000 (in 1 folds),0.677 +/- 0.000 (in 1 folds)
xgboost.decision_thresholds_tuned,0.571 +/- 0.025 (in 3 folds),0.556 +/- 0.031 (in 3 folds),0.623 +/- 0.023 (in 3 folds),0.624 +/- 0.046 (in 3 folds),0.481 +/- 0.124 (in 3 folds),0.279 +/- 0.033 (in 3 folds),0.484,0.231,0.463 +/- 0.113 (in 3 folds),0.266 +/- 0.038 (in 3 folds),...,Unknown,184,7,191,0.036649,False,0.596 +/- 0.000 (in 1 folds),0.592 +/- 0.000 (in 1 folds),0.649 +/- 0.000 (in 1 folds),0.677 +/- 0.000 (in 1 folds)


/users/maximz/code/boyd-immune-repertoire-classification/out/convergent_clusters/BCR/ethnicity_condensed_healthy_only/train_smaller_model.compare_model_scores.test_set_performance.tsv














GeneLocus.BCR TargetObsColumnEnum.age_group_healthy_only --> /users/maximz/code/boyd-immune-repertoire-classification/out/convergent_clusters/BCR/age_group_healthy_only






















































































































































































































































































































































































































































































































































































































































































































































Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,Accuracy per fold with abstention,MCC per fold with abstention,...,au-PRC (macro OvO) per fold with abstention,Accuracy global with abstention,MCC global with abstention,Unknown/abstention proportion global with abstention,Abstention label global with abstention,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
lasso_cv,0.558 +/- 0.074 (in 3 folds),0.552 +/- 0.078 (in 3 folds),0.601 +/- 0.066 (in 3 folds),0.595 +/- 0.063 (in 3 folds),0.180 +/- 0.032 (in 3 folds),0.069 +/- 0.050 (in 3 folds),0.18,0.007,0.173 +/- 0.036 (in 3 folds),0.062 +/- 0.054 (in 3 folds),...,0.666 +/- 0.000 (in 1 folds),0.173,0.005,0.042,Unknown,183,8,191,0.041885,True
lasso_cv.decision_thresholds_tuned,0.558 +/- 0.074 (in 3 folds),0.552 +/- 0.078 (in 3 folds),0.601 +/- 0.066 (in 3 folds),0.595 +/- 0.063 (in 3 folds),0.199 +/- 0.060 (in 3 folds),0.092 +/- 0.084 (in 3 folds),0.202,0.042,0.192 +/- 0.067 (in 3 folds),0.091 +/- 0.085 (in 3 folds),...,0.666 +/- 0.000 (in 1 folds),0.194,0.039,0.042,Unknown,183,8,191,0.041885,True
linearsvm_ovr,0.555 +/- 0.073 (in 3 folds),0.552 +/- 0.077 (in 3 folds),0.613 +/- 0.060 (in 3 folds),0.607 +/- 0.060 (in 3 folds),0.213 +/- 0.096 (in 3 folds),0.074 +/- 0.105 (in 3 folds),0.214,0.046,0.208 +/- 0.097 (in 3 folds),0.072 +/- 0.106 (in 3 folds),...,0.638 +/- 0.038 (in 2 folds),0.209,0.043,0.021,Unknown,187,4,191,0.020942,True
linearsvm_ovr.decision_thresholds_tuned,0.555 +/- 0.073 (in 3 folds),0.552 +/- 0.077 (in 3 folds),0.613 +/- 0.060 (in 3 folds),0.607 +/- 0.060 (in 3 folds),0.218 +/- 0.021 (in 3 folds),0.124 +/- 0.023 (in 3 folds),0.219,0.074,0.214 +/- 0.027 (in 3 folds),0.125 +/- 0.022 (in 3 folds),...,0.638 +/- 0.038 (in 2 folds),0.215,0.072,0.021,Unknown,187,4,191,0.020942,True
elasticnet_cv,0.544 +/- 0.092 (in 3 folds),0.539 +/- 0.095 (in 3 folds),0.607 +/- 0.062 (in 3 folds),0.604 +/- 0.056 (in 3 folds),0.108 +/- 0.099 (in 3 folds),0.056 +/- 0.051 (in 3 folds),0.157,-0.008,0.105 +/- 0.098 (in 3 folds),0.036 +/- 0.064 (in 3 folds),...,0.668 +/- 0.000 (in 1 folds),0.11,-0.021,0.298,Unknown,134,57,191,0.298429,True
elasticnet_cv.decision_thresholds_tuned,0.544 +/- 0.092 (in 3 folds),0.539 +/- 0.095 (in 3 folds),0.607 +/- 0.062 (in 3 folds),0.604 +/- 0.056 (in 3 folds),0.210 +/- 0.054 (in 3 folds),0.081 +/- 0.100 (in 3 folds),0.216,0.065,0.146 +/- 0.126 (in 3 folds),0.068 +/- 0.112 (in 3 folds),...,0.668 +/- 0.000 (in 1 folds),0.152,0.035,0.298,Unknown,134,57,191,0.298429,True
lasso_multiclass,0.544 +/- 0.066 (in 3 folds),0.541 +/- 0.070 (in 3 folds),0.600 +/- 0.053 (in 3 folds),0.601 +/- 0.056 (in 3 folds),0.201 +/- 0.010 (in 3 folds),0.065 +/- 0.032 (in 3 folds),0.203,0.052,0.168 +/- 0.055 (in 3 folds),0.056 +/- 0.036 (in 3 folds),...,0.649 +/- 0.000 (in 1 folds),0.168,0.042,0.173,Unknown,158,33,191,0.172775,False
lasso_multiclass.decision_thresholds_tuned,0.544 +/- 0.066 (in 3 folds),0.541 +/- 0.070 (in 3 folds),0.600 +/- 0.053 (in 3 folds),0.601 +/- 0.056 (in 3 folds),0.200 +/- 0.048 (in 3 folds),0.081 +/- 0.065 (in 3 folds),0.209,0.05,0.172 +/- 0.081 (in 3 folds),0.073 +/- 0.073 (in 3 folds),...,0.649 +/- 0.000 (in 1 folds),0.173,0.038,0.173,Unknown,158,33,191,0.172775,True
ridge_cv,0.537 +/- 0.015 (in 3 folds),0.536 +/- 0.018 (in 3 folds),0.608 +/- 0.021 (in 3 folds),0.614 +/- 0.025 (in 3 folds),0.091 +/- 0.084 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.108,-0.051,0.045 +/- 0.055 (in 3 folds),-0.015 +/- 0.015 (in 3 folds),...,0.585 +/- 0.000 (in 1 folds),0.047,-0.061,0.565,Unknown,83,108,191,0.565445,True
ridge_cv.decision_thresholds_tuned,0.537 +/- 0.015 (in 3 folds),0.536 +/- 0.018 (in 3 folds),0.608 +/- 0.021 (in 3 folds),0.614 +/- 0.025 (in 3 folds),0.131 +/- 0.118 (in 3 folds),0.039 +/- 0.068 (in 3 folds),0.205,0.081,0.086 +/- 0.124 (in 3 folds),0.025 +/- 0.081 (in 3 folds),...,0.585 +/- 0.000 (in 1 folds),0.089,0.008,0.565,Unknown,83,108,191,0.565445,True


/users/maximz/code/boyd-immune-repertoire-classification/out/convergent_clusters/BCR/age_group_healthy_only/train_smaller_model.compare_model_scores.test_set_performance.tsv


GeneLocus.BCR TargetObsColumnEnum.age_group_binary_healthy_only --> /users/maximz/code/boyd-immune-repertoire-classification/out/convergent_clusters/BCR/age_group_binary_healthy_only


Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,Accuracy per fold with abstention,MCC per fold with abstention,Unknown/abstention proportion per fold with abstention,Accuracy global with abstention,MCC global with abstention,Unknown/abstention proportion global with abstention,Abstention label global with abstention,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
rf_multiclass,0.608 +/- 0.048 (in 3 folds),0.608 +/- 0.048 (in 3 folds),0.701 +/- 0.111 (in 3 folds),0.701 +/- 0.111 (in 3 folds),0.602 +/- 0.027 (in 3 folds),0.159 +/- 0.028 (in 3 folds),0.605,0.142,0.532 +/- 0.126 (in 3 folds),0.133 +/- 0.052 (in 3 folds),0.120 +/- 0.180 (in 3 folds),0.529,0.109,0.126,Unknown,167,24,191,0.125654,False
rf_multiclass.decision_thresholds_tuned,0.608 +/- 0.048 (in 3 folds),0.608 +/- 0.048 (in 3 folds),0.701 +/- 0.111 (in 3 folds),0.701 +/- 0.111 (in 3 folds),0.608 +/- 0.027 (in 3 folds),0.167 +/- 0.047 (in 3 folds),0.611,0.142,0.538 +/- 0.130 (in 3 folds),0.140 +/- 0.062 (in 3 folds),0.120 +/- 0.180 (in 3 folds),0.534,0.107,0.126,Unknown,167,24,191,0.125654,False
xgboost,0.607 +/- 0.069 (in 3 folds),0.607 +/- 0.069 (in 3 folds),0.698 +/- 0.112 (in 3 folds),0.698 +/- 0.112 (in 3 folds),0.581 +/- 0.004 (in 3 folds),0.172 +/- 0.072 (in 3 folds),0.581,0.137,0.476 +/- 0.091 (in 3 folds),0.128 +/- 0.058 (in 3 folds),0.181 +/- 0.156 (in 3 folds),0.471,0.096,0.188,Unknown,155,36,191,0.188482,False
xgboost.decision_thresholds_tuned,0.607 +/- 0.069 (in 3 folds),0.607 +/- 0.069 (in 3 folds),0.698 +/- 0.112 (in 3 folds),0.698 +/- 0.112 (in 3 folds),0.549 +/- 0.067 (in 3 folds),0.173 +/- 0.046 (in 3 folds),0.548,0.098,0.451 +/- 0.117 (in 3 folds),0.130 +/- 0.048 (in 3 folds),0.181 +/- 0.156 (in 3 folds),0.445,0.071,0.188,Unknown,155,36,191,0.188482,False
lasso_cv,0.598 +/- 0.100 (in 3 folds),0.598 +/- 0.100 (in 3 folds),0.704 +/- 0.124 (in 3 folds),0.704 +/- 0.124 (in 3 folds),0.531 +/- 0.082 (in 3 folds),0.048 +/- 0.135 (in 3 folds),0.56,0.086,0.356 +/- 0.205 (in 3 folds),0.029 +/- 0.106 (in 3 folds),0.362 +/- 0.314 (in 3 folds),0.366,0.049,0.346,Unknown,125,66,191,0.34555,False
lasso_cv.decision_thresholds_tuned,0.598 +/- 0.100 (in 3 folds),0.598 +/- 0.100 (in 3 folds),0.704 +/- 0.124 (in 3 folds),0.704 +/- 0.124 (in 3 folds),0.541 +/- 0.062 (in 3 folds),0.118 +/- 0.110 (in 3 folds),0.536,0.096,0.342 +/- 0.172 (in 3 folds),0.088 +/- 0.076 (in 3 folds),0.362 +/- 0.314 (in 3 folds),0.351,0.054,0.346,Unknown,125,66,191,0.34555,False
elasticnet_cv,0.576 +/- 0.083 (in 3 folds),0.576 +/- 0.083 (in 3 folds),0.653 +/- 0.082 (in 3 folds),0.653 +/- 0.082 (in 3 folds),0.400 +/- 0.040 (in 3 folds),0.009 +/- 0.015 (in 3 folds),0.396,0.019,0.186 +/- 0.089 (in 3 folds),0.035 +/- 0.056 (in 3 folds),0.531 +/- 0.223 (in 3 folds),0.188,0.02,0.524,Unknown,91,100,191,0.52356,False
elasticnet_cv.decision_thresholds_tuned,0.576 +/- 0.083 (in 3 folds),0.576 +/- 0.083 (in 3 folds),0.653 +/- 0.082 (in 3 folds),0.653 +/- 0.082 (in 3 folds),0.537 +/- 0.121 (in 3 folds),0.036 +/- 0.042 (in 3 folds),0.505,0.014,0.237 +/- 0.072 (in 3 folds),0.038 +/- 0.053 (in 3 folds),0.531 +/- 0.223 (in 3 folds),0.241,0.006,0.524,Unknown,91,100,191,0.52356,False
linearsvm_ovr,0.573 +/- 0.073 (in 3 folds),0.573 +/- 0.073 (in 3 folds),0.680 +/- 0.116 (in 3 folds),0.680 +/- 0.116 (in 3 folds),0.583 +/- 0.043 (in 3 folds),0.152 +/- 0.086 (in 3 folds),0.584,0.13,0.513 +/- 0.096 (in 3 folds),0.127 +/- 0.093 (in 3 folds),0.126 +/- 0.096 (in 3 folds),0.508,0.097,0.131,Unknown,166,25,191,0.13089,False
linearsvm_ovr.decision_thresholds_tuned,0.573 +/- 0.073 (in 3 folds),0.573 +/- 0.073 (in 3 folds),0.680 +/- 0.116 (in 3 folds),0.680 +/- 0.116 (in 3 folds),0.535 +/- 0.055 (in 3 folds),0.091 +/- 0.005 (in 3 folds),0.536,0.024,0.469 +/- 0.087 (in 3 folds),0.067 +/- 0.012 (in 3 folds),0.126 +/- 0.096 (in 3 folds),0.466,0.012,0.131,Unknown,166,25,191,0.13089,False


/users/maximz/code/boyd-immune-repertoire-classification/out/convergent_clusters/BCR/age_group_binary_healthy_only/train_smaller_model.compare_model_scores.test_set_performance.tsv


GeneLocus.BCR TargetObsColumnEnum.sex_healthy_only --> /users/maximz/code/boyd-immune-repertoire-classification/out/convergent_clusters/BCR/sex_healthy_only


Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,Accuracy per fold with abstention,MCC per fold with abstention,...,au-PRC (macro OvO) per fold with abstention,Accuracy global with abstention,MCC global with abstention,Unknown/abstention proportion global with abstention,Abstention label global with abstention,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
elasticnet_cv,0.549 +/- 0.090 (in 3 folds),0.549 +/- 0.090 (in 3 folds),0.551 +/- 0.093 (in 3 folds),0.551 +/- 0.093 (in 3 folds),0.553 +/- 0.073 (in 3 folds),0.082 +/- 0.156 (in 3 folds),0.542,0.075,0.470 +/- 0.019 (in 3 folds),0.048 +/- 0.097 (in 3 folds),...,,0.471,0.062,0.131,Unknown,166,25,191,0.13089,False
elasticnet_cv.decision_thresholds_tuned,0.549 +/- 0.090 (in 3 folds),0.549 +/- 0.090 (in 3 folds),0.551 +/- 0.093 (in 3 folds),0.551 +/- 0.093 (in 3 folds),0.496 +/- 0.035 (in 3 folds),-0.021 +/- 0.049 (in 3 folds),0.5,-0.04,0.430 +/- 0.089 (in 3 folds),-0.010 +/- 0.057 (in 3 folds),...,,0.435,-0.018,0.131,Unknown,166,25,191,0.13089,False
lasso_multiclass,0.545 +/- 0.054 (in 3 folds),0.545 +/- 0.054 (in 3 folds),0.561 +/- 0.054 (in 3 folds),0.561 +/- 0.054 (in 3 folds),0.546 +/- 0.040 (in 3 folds),0.086 +/- 0.109 (in 3 folds),0.543,0.081,0.530 +/- 0.019 (in 3 folds),0.075 +/- 0.094 (in 3 folds),...,0.536 +/- 0.000 (in 1 folds),0.529,0.076,0.026,Unknown,186,5,191,0.026178,False
lasso_multiclass.decision_thresholds_tuned,0.545 +/- 0.054 (in 3 folds),0.545 +/- 0.054 (in 3 folds),0.561 +/- 0.054 (in 3 folds),0.561 +/- 0.054 (in 3 folds),0.490 +/- 0.063 (in 3 folds),-0.039 +/- 0.134 (in 3 folds),0.495,-0.027,0.478 +/- 0.078 (in 3 folds),-0.016 +/- 0.107 (in 3 folds),...,0.536 +/- 0.000 (in 1 folds),0.482,-0.027,0.026,Unknown,186,5,191,0.026178,False
rf_multiclass,0.542 +/- 0.082 (in 3 folds),0.542 +/- 0.082 (in 3 folds),0.522 +/- 0.099 (in 3 folds),0.522 +/- 0.099 (in 3 folds),0.559 +/- 0.071 (in 3 folds),0.096 +/- 0.157 (in 3 folds),0.548,0.089,0.475 +/- 0.024 (in 3 folds),0.056 +/- 0.105 (in 3 folds),...,,0.476,0.072,0.131,Unknown,166,25,191,0.13089,False
rf_multiclass.decision_thresholds_tuned,0.542 +/- 0.082 (in 3 folds),0.542 +/- 0.082 (in 3 folds),0.522 +/- 0.099 (in 3 folds),0.522 +/- 0.099 (in 3 folds),0.534 +/- 0.042 (in 3 folds),0.090 +/- 0.086 (in 3 folds),0.536,0.047,0.461 +/- 0.087 (in 3 folds),0.060 +/- 0.066 (in 3 folds),...,,0.466,0.046,0.131,Unknown,166,25,191,0.13089,False
linearsvm_ovr,0.532 +/- 0.072 (in 3 folds),0.532 +/- 0.072 (in 3 folds),0.554 +/- 0.062 (in 3 folds),0.554 +/- 0.062 (in 3 folds),0.541 +/- 0.050 (in 3 folds),0.081 +/- 0.125 (in 3 folds),0.538,0.071,0.525 +/- 0.035 (in 3 folds),0.072 +/- 0.111 (in 3 folds),...,0.537 +/- 0.000 (in 1 folds),0.524,0.067,0.026,Unknown,186,5,191,0.026178,False
linearsvm_ovr.decision_thresholds_tuned,0.532 +/- 0.072 (in 3 folds),0.532 +/- 0.072 (in 3 folds),0.554 +/- 0.062 (in 3 folds),0.554 +/- 0.062 (in 3 folds),0.485 +/- 0.056 (in 3 folds),-0.031 +/- 0.125 (in 3 folds),0.489,-0.031,0.473 +/- 0.071 (in 3 folds),-0.008 +/- 0.093 (in 3 folds),...,0.537 +/- 0.000 (in 1 folds),0.476,-0.03,0.026,Unknown,186,5,191,0.026178,False
ridge_cv,0.488 +/- 0.030 (in 3 folds),0.488 +/- 0.030 (in 3 folds),0.544 +/- 0.069 (in 3 folds),0.544 +/- 0.069 (in 3 folds),0.548 +/- 0.014 (in 3 folds),0.009 +/- 0.015 (in 3 folds),0.547,0.092,0.429 +/- 0.153 (in 3 folds),0.069 +/- 0.037 (in 3 folds),...,,0.424,0.078,0.225,Unknown,148,43,191,0.225131,False
ridge_cv.decision_thresholds_tuned,0.488 +/- 0.030 (in 3 folds),0.488 +/- 0.030 (in 3 folds),0.544 +/- 0.069 (in 3 folds),0.544 +/- 0.069 (in 3 folds),0.479 +/- 0.060 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.466,-0.076,0.364 +/- 0.093 (in 3 folds),-0.002 +/- 0.093 (in 3 folds),...,,0.361,-0.041,0.225,Unknown,148,43,191,0.225131,False


/users/maximz/code/boyd-immune-repertoire-classification/out/convergent_clusters/BCR/sex_healthy_only/train_smaller_model.compare_model_scores.test_set_performance.tsv


2022-12-31 11:36:57,370 - malid.external.scratch_cache - INFO - Reading network file from local machine cache: /users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/embedded/unirep_fine_tuned/anndatas_scaled/TCR/fold.0.validation.h5ad -> /srv/scratch/maximz/cache/45c3001c6b505500991147d20f972274565d8728487b87ce1a92bfe9.0.validation.h5ad


GeneLocus.TCR
Only considering the two last: ['.validation', '.h5ad'].


Only considering the two last: ['.validation', '.h5ad'].








2022-12-31 12:20:45,188 - malid.helpers - INFO - Target TargetObsColumnEnum.covid_vs_healthy: filtering to specimens from diseases ['Covid19', 'Healthy/Background'] only; removed 35 specimens




2022-12-31 12:35:50,532 - malid.helpers - INFO - Target TargetObsColumnEnum.hiv_vs_healthy: filtering to specimens from diseases ['HIV', 'Healthy/Background'] only; removed 27 specimens




2022-12-31 12:53:28,796 - malid.helpers - INFO - Target TargetObsColumnEnum.lupus_vs_healthy: filtering to specimens from diseases ['Lupus', 'Healthy/Background'] only; removed 34 specimens




2022-12-31 13:11:04,501 - malid.helpers - INFO - Target TargetObsColumnEnum.ethnicity_condensed_healthy_only: filtered to specimens with defined ethnicity_condensed column - removed 10 specimens (413445 rows)


2022-12-31 13:11:21,588 - malid.helpers - INFO - Target TargetObsColumnEnum.ethnicity_condensed_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 44 specimens




2022-12-31 13:24:09,874 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_healthy_only: filtered to specimens with defined age_group column - removed 1 specimens (11386 rows)


2022-12-31 13:24:28,693 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 47 specimens




2022-12-31 13:38:31,714 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_binary_healthy_only: filtered to specimens with defined age_group_binary column - removed 1 specimens (11386 rows)


2022-12-31 13:38:48,716 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_binary_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 47 specimens




2022-12-31 13:50:56,985 - malid.helpers - INFO - Target TargetObsColumnEnum.sex_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 48 specimens


2022-12-31 14:02:17,172 - malid.external.scratch_cache - INFO - Reading network file from local machine cache: /users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/embedded/unirep_fine_tuned/anndatas_scaled/TCR/fold.1.validation.h5ad -> /srv/scratch/maximz/cache/282f72b2420811c056ecfc2ef1dcbf10523046eb9569d7ff2d7c8263.1.validation.h5ad


Only considering the two last: ['.validation', '.h5ad'].


Only considering the two last: ['.validation', '.h5ad'].








2022-12-31 14:50:53,748 - malid.helpers - INFO - Target TargetObsColumnEnum.covid_vs_healthy: filtering to specimens from diseases ['Covid19', 'Healthy/Background'] only; removed 36 specimens




2022-12-31 15:06:54,349 - malid.helpers - INFO - Target TargetObsColumnEnum.hiv_vs_healthy: filtering to specimens from diseases ['HIV', 'Healthy/Background'] only; removed 26 specimens




2022-12-31 15:25:37,021 - malid.helpers - INFO - Target TargetObsColumnEnum.lupus_vs_healthy: filtering to specimens from diseases ['Lupus', 'Healthy/Background'] only; removed 34 specimens




2022-12-31 15:44:25,725 - malid.helpers - INFO - Target TargetObsColumnEnum.ethnicity_condensed_healthy_only: filtered to specimens with defined ethnicity_condensed column - removed 11 specimens (475392 rows)


2022-12-31 15:44:46,155 - malid.helpers - INFO - Target TargetObsColumnEnum.ethnicity_condensed_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 41 specimens




2022-12-31 15:59:18,964 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_healthy_only: filtered to specimens with defined age_group column - removed 1 specimens (18790 rows)


2022-12-31 15:59:41,270 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 47 specimens




2022-12-31 16:14:24,317 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_binary_healthy_only: filtered to specimens with defined age_group_binary column - removed 1 specimens (18790 rows)


2022-12-31 16:14:47,123 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_binary_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 47 specimens




2022-12-31 16:28:41,695 - malid.helpers - INFO - Target TargetObsColumnEnum.sex_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 48 specimens


2022-12-31 16:41:30,600 - malid.external.scratch_cache - INFO - Reading network file from local machine cache: /users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/embedded/unirep_fine_tuned/anndatas_scaled/TCR/fold.2.validation.h5ad -> /srv/scratch/maximz/cache/1ca7b8d5a7e7747e7f0bda4a4f3cb1e09d543670afe9d48fe77350c1.2.validation.h5ad


Only considering the two last: ['.validation', '.h5ad'].


Only considering the two last: ['.validation', '.h5ad'].








2022-12-31 17:27:29,974 - malid.helpers - INFO - Target TargetObsColumnEnum.covid_vs_healthy: filtering to specimens from diseases ['Covid19', 'Healthy/Background'] only; removed 35 specimens




2022-12-31 17:43:04,141 - malid.helpers - INFO - Target TargetObsColumnEnum.hiv_vs_healthy: filtering to specimens from diseases ['HIV', 'Healthy/Background'] only; removed 27 specimens




2022-12-31 18:00:52,097 - malid.helpers - INFO - Target TargetObsColumnEnum.lupus_vs_healthy: filtering to specimens from diseases ['Lupus', 'Healthy/Background'] only; removed 34 specimens




2022-12-31 18:19:15,541 - malid.helpers - INFO - Target TargetObsColumnEnum.ethnicity_condensed_healthy_only: filtered to specimens with defined ethnicity_condensed column - removed 11 specimens (476014 rows)


2022-12-31 18:19:36,280 - malid.helpers - INFO - Target TargetObsColumnEnum.ethnicity_condensed_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 42 specimens




2022-12-31 18:38:20,126 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_healthy_only: filtered to specimens with defined age_group column - removed 1 specimens (6847 rows)


2022-12-31 18:38:42,863 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 47 specimens




2022-12-31 18:52:39,141 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_binary_healthy_only: filtered to specimens with defined age_group_binary column - removed 1 specimens (6847 rows)


2022-12-31 18:53:02,531 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_binary_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 47 specimens




2022-12-31 19:06:07,469 - malid.helpers - INFO - Target TargetObsColumnEnum.sex_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 48 specimens


2022-12-31 19:18:10,260 - malid.external.scratch_cache - INFO - Reading network file from local machine cache: /users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/embedded/unirep_fine_tuned/anndatas_scaled/TCR/fold.-1.validation.h5ad -> /srv/scratch/maximz/cache/1985239f55fdf391d2f6c78098bab25182948ad31b330c01c26cb651.-1.validation.h5ad


Only considering the two last: ['.validation', '.h5ad'].


Only considering the two last: ['.validation', '.h5ad'].




2022-12-31 19:22:07,545 - malid.train.training_utils - INFO - Skipping lasso_multiclass from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/TCR/disease/train_smaller_model.lasso_multiclass.-1.joblib'


2022-12-31 19:22:07,549 - malid.train.training_utils - INFO - Skipping lasso_cv from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/TCR/disease/train_smaller_model.lasso_cv.-1.joblib'


2022-12-31 19:22:07,552 - malid.train.training_utils - INFO - Skipping ridge_cv from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/TCR/disease/train_smaller_model.ridge_cv.-1.joblib'


2022-12-31 19:22:07,555 - malid.train.training_utils - INFO - Skipping elasticnet_cv from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/TCR/disease/train_smaller_model.elasticnet_cv.-1.joblib'


2022-12-31 19:22:07,557 - malid.train.training_utils - INFO - Skipping rf_multiclass from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/TCR/disease/train_smaller_model.rf_multiclass.-1.joblib'


2022-12-31 19:22:07,559 - malid.train.training_utils - INFO - Skipping xgboost from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/TCR/disease/train_smaller_model.xgboost.-1.joblib'


2022-12-31 19:22:07,560 - malid.train.training_utils - INFO - Skipping linearsvm_ovr from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/TCR/disease/train_smaller_model.linearsvm_ovr.-1.joblib'




2022-12-31 19:38:02,407 - malid.train.training_utils - INFO - Skipping lasso_multiclass from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/TCR/disease_all_demographics_present/train_smaller_model.lasso_multiclass.-1.joblib'


2022-12-31 19:38:02,418 - malid.train.training_utils - INFO - Skipping lasso_cv from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/TCR/disease_all_demographics_present/train_smaller_model.lasso_cv.-1.joblib'


2022-12-31 19:38:02,424 - malid.train.training_utils - INFO - Skipping ridge_cv from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/TCR/disease_all_demographics_present/train_smaller_model.ridge_cv.-1.joblib'


2022-12-31 19:38:02,429 - malid.train.training_utils - INFO - Skipping elasticnet_cv from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/TCR/disease_all_demographics_present/train_smaller_model.elasticnet_cv.-1.joblib'


2022-12-31 19:38:02,434 - malid.train.training_utils - INFO - Skipping rf_multiclass from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/TCR/disease_all_demographics_present/train_smaller_model.rf_multiclass.-1.joblib'


2022-12-31 19:38:02,439 - malid.train.training_utils - INFO - Skipping xgboost from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/TCR/disease_all_demographics_present/train_smaller_model.xgboost.-1.joblib'


2022-12-31 19:38:02,445 - malid.train.training_utils - INFO - Skipping linearsvm_ovr from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/TCR/disease_all_demographics_present/train_smaller_model.linearsvm_ovr.-1.joblib'




2022-12-31 19:41:38,909 - malid.helpers - INFO - Target TargetObsColumnEnum.covid_vs_healthy: filtering to specimens from diseases ['Covid19', 'Healthy/Background'] only; removed 55 specimens


2022-12-31 19:41:42,253 - malid.train.training_utils - INFO - Skipping lasso_multiclass from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/TCR/covid_vs_healthy/train_smaller_model.lasso_multiclass.-1.joblib'


2022-12-31 19:41:42,256 - malid.train.training_utils - INFO - Skipping lasso_cv from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/TCR/covid_vs_healthy/train_smaller_model.lasso_cv.-1.joblib'


2022-12-31 19:41:42,261 - malid.train.training_utils - INFO - Skipping ridge_cv from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/TCR/covid_vs_healthy/train_smaller_model.ridge_cv.-1.joblib'


2022-12-31 19:41:42,264 - malid.train.training_utils - INFO - Skipping elasticnet_cv from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/TCR/covid_vs_healthy/train_smaller_model.elasticnet_cv.-1.joblib'


2022-12-31 19:41:42,267 - malid.train.training_utils - INFO - Skipping rf_multiclass from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/TCR/covid_vs_healthy/train_smaller_model.rf_multiclass.-1.joblib'


2022-12-31 19:41:42,270 - malid.train.training_utils - INFO - Skipping xgboost from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/TCR/covid_vs_healthy/train_smaller_model.xgboost.-1.joblib'


2022-12-31 19:41:42,273 - malid.train.training_utils - INFO - Skipping linearsvm_ovr from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/TCR/covid_vs_healthy/train_smaller_model.linearsvm_ovr.-1.joblib'




2022-12-31 19:43:49,071 - malid.helpers - INFO - Target TargetObsColumnEnum.hiv_vs_healthy: filtering to specimens from diseases ['HIV', 'Healthy/Background'] only; removed 41 specimens


2022-12-31 19:43:51,989 - malid.train.training_utils - INFO - Skipping lasso_multiclass from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/TCR/hiv_vs_healthy/train_smaller_model.lasso_multiclass.-1.joblib'


2022-12-31 19:43:51,991 - malid.train.training_utils - INFO - Skipping lasso_cv from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/TCR/hiv_vs_healthy/train_smaller_model.lasso_cv.-1.joblib'


2022-12-31 19:43:51,992 - malid.train.training_utils - INFO - Skipping ridge_cv from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/TCR/hiv_vs_healthy/train_smaller_model.ridge_cv.-1.joblib'


2022-12-31 19:43:51,993 - malid.train.training_utils - INFO - Skipping elasticnet_cv from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/TCR/hiv_vs_healthy/train_smaller_model.elasticnet_cv.-1.joblib'


2022-12-31 19:43:51,994 - malid.train.training_utils - INFO - Skipping rf_multiclass from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/TCR/hiv_vs_healthy/train_smaller_model.rf_multiclass.-1.joblib'


2022-12-31 19:43:51,995 - malid.train.training_utils - INFO - Skipping xgboost from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/TCR/hiv_vs_healthy/train_smaller_model.xgboost.-1.joblib'


2022-12-31 19:43:51,996 - malid.train.training_utils - INFO - Skipping linearsvm_ovr from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/TCR/hiv_vs_healthy/train_smaller_model.linearsvm_ovr.-1.joblib'




2022-12-31 19:45:41,101 - malid.helpers - INFO - Target TargetObsColumnEnum.lupus_vs_healthy: filtering to specimens from diseases ['Lupus', 'Healthy/Background'] only; removed 52 specimens


2022-12-31 19:45:43,431 - malid.train.training_utils - INFO - Skipping lasso_multiclass from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/TCR/lupus_vs_healthy/train_smaller_model.lasso_multiclass.-1.joblib'


2022-12-31 19:45:43,433 - malid.train.training_utils - INFO - Skipping lasso_cv from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/TCR/lupus_vs_healthy/train_smaller_model.lasso_cv.-1.joblib'


2022-12-31 19:45:43,434 - malid.train.training_utils - INFO - Skipping ridge_cv from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/TCR/lupus_vs_healthy/train_smaller_model.ridge_cv.-1.joblib'


2022-12-31 19:45:43,435 - malid.train.training_utils - INFO - Skipping elasticnet_cv from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/TCR/lupus_vs_healthy/train_smaller_model.elasticnet_cv.-1.joblib'


2022-12-31 19:45:43,436 - malid.train.training_utils - INFO - Skipping rf_multiclass from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/TCR/lupus_vs_healthy/train_smaller_model.rf_multiclass.-1.joblib'


2022-12-31 19:45:43,437 - malid.train.training_utils - INFO - Skipping xgboost from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/TCR/lupus_vs_healthy/train_smaller_model.xgboost.-1.joblib'


2022-12-31 19:45:43,438 - malid.train.training_utils - INFO - Skipping linearsvm_ovr from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/TCR/lupus_vs_healthy/train_smaller_model.linearsvm_ovr.-1.joblib'




2022-12-31 19:47:55,157 - malid.helpers - INFO - Target TargetObsColumnEnum.ethnicity_condensed_healthy_only: filtered to specimens with defined ethnicity_condensed column - removed 19 specimens (862171 rows)


2022-12-31 19:56:13,252 - malid.helpers - INFO - Target TargetObsColumnEnum.ethnicity_condensed_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 64 specimens


2022-12-31 20:02:50,770 - malid.train.training_utils - INFO - Skipping lasso_multiclass from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/TCR/ethnicity_condensed_healthy_only/train_smaller_model.lasso_multiclass.-1.joblib'


2022-12-31 20:02:50,772 - malid.train.training_utils - INFO - Skipping lasso_cv from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/TCR/ethnicity_condensed_healthy_only/train_smaller_model.lasso_cv.-1.joblib'


2022-12-31 20:02:50,773 - malid.train.training_utils - INFO - Skipping ridge_cv from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/TCR/ethnicity_condensed_healthy_only/train_smaller_model.ridge_cv.-1.joblib'


2022-12-31 20:02:50,775 - malid.train.training_utils - INFO - Skipping elasticnet_cv from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/TCR/ethnicity_condensed_healthy_only/train_smaller_model.elasticnet_cv.-1.joblib'


2022-12-31 20:02:50,776 - malid.train.training_utils - INFO - Skipping rf_multiclass from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/TCR/ethnicity_condensed_healthy_only/train_smaller_model.rf_multiclass.-1.joblib'


2022-12-31 20:02:50,778 - malid.train.training_utils - INFO - Skipping xgboost from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/TCR/ethnicity_condensed_healthy_only/train_smaller_model.xgboost.-1.joblib'


2022-12-31 20:02:50,779 - malid.train.training_utils - INFO - Skipping linearsvm_ovr from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/TCR/ethnicity_condensed_healthy_only/train_smaller_model.linearsvm_ovr.-1.joblib'




2022-12-31 20:04:50,487 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_healthy_only: filtered to specimens with defined age_group column - removed 1 specimens (6847 rows)


2022-12-31 20:05:26,259 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 73 specimens


2022-12-31 20:09:22,819 - malid.train.training_utils - INFO - Skipping lasso_multiclass from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/TCR/age_group_healthy_only/train_smaller_model.lasso_multiclass.-1.joblib'


2022-12-31 20:09:22,821 - malid.train.training_utils - INFO - Skipping lasso_cv from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/TCR/age_group_healthy_only/train_smaller_model.lasso_cv.-1.joblib'


2022-12-31 20:09:22,823 - malid.train.training_utils - INFO - Skipping ridge_cv from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/TCR/age_group_healthy_only/train_smaller_model.ridge_cv.-1.joblib'


2022-12-31 20:09:22,824 - malid.train.training_utils - INFO - Skipping elasticnet_cv from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/TCR/age_group_healthy_only/train_smaller_model.elasticnet_cv.-1.joblib'


2022-12-31 20:09:22,825 - malid.train.training_utils - INFO - Skipping rf_multiclass from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/TCR/age_group_healthy_only/train_smaller_model.rf_multiclass.-1.joblib'


2022-12-31 20:09:22,825 - malid.train.training_utils - INFO - Skipping xgboost from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/TCR/age_group_healthy_only/train_smaller_model.xgboost.-1.joblib'


2022-12-31 20:09:22,827 - malid.train.training_utils - INFO - Skipping linearsvm_ovr from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/TCR/age_group_healthy_only/train_smaller_model.linearsvm_ovr.-1.joblib'




2022-12-31 20:11:22,729 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_binary_healthy_only: filtered to specimens with defined age_group_binary column - removed 1 specimens (6847 rows)


2022-12-31 20:11:50,952 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_binary_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 73 specimens


2022-12-31 20:12:26,405 - malid.train.training_utils - INFO - Skipping lasso_multiclass from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/TCR/age_group_binary_healthy_only/train_smaller_model.lasso_multiclass.-1.joblib'


2022-12-31 20:12:26,406 - malid.train.training_utils - INFO - Skipping lasso_cv from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/TCR/age_group_binary_healthy_only/train_smaller_model.lasso_cv.-1.joblib'


2022-12-31 20:12:26,408 - malid.train.training_utils - INFO - Skipping ridge_cv from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/TCR/age_group_binary_healthy_only/train_smaller_model.ridge_cv.-1.joblib'


2022-12-31 20:12:26,408 - malid.train.training_utils - INFO - Skipping elasticnet_cv from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/TCR/age_group_binary_healthy_only/train_smaller_model.elasticnet_cv.-1.joblib'


2022-12-31 20:12:26,409 - malid.train.training_utils - INFO - Skipping rf_multiclass from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/TCR/age_group_binary_healthy_only/train_smaller_model.rf_multiclass.-1.joblib'


2022-12-31 20:12:26,410 - malid.train.training_utils - INFO - Skipping xgboost from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/TCR/age_group_binary_healthy_only/train_smaller_model.xgboost.-1.joblib'


2022-12-31 20:12:26,411 - malid.train.training_utils - INFO - Skipping linearsvm_ovr from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/TCR/age_group_binary_healthy_only/train_smaller_model.linearsvm_ovr.-1.joblib'




2022-12-31 20:14:02,971 - malid.helpers - INFO - Target TargetObsColumnEnum.sex_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 74 specimens


2022-12-31 20:14:30,700 - malid.train.training_utils - INFO - Skipping lasso_multiclass from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/TCR/sex_healthy_only/train_smaller_model.lasso_multiclass.-1.joblib'


2022-12-31 20:14:30,702 - malid.train.training_utils - INFO - Skipping lasso_cv from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/TCR/sex_healthy_only/train_smaller_model.lasso_cv.-1.joblib'


2022-12-31 20:14:30,703 - malid.train.training_utils - INFO - Skipping ridge_cv from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/TCR/sex_healthy_only/train_smaller_model.ridge_cv.-1.joblib'


2022-12-31 20:14:30,704 - malid.train.training_utils - INFO - Skipping elasticnet_cv from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/TCR/sex_healthy_only/train_smaller_model.elasticnet_cv.-1.joblib'


2022-12-31 20:14:30,705 - malid.train.training_utils - INFO - Skipping rf_multiclass from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/TCR/sex_healthy_only/train_smaller_model.rf_multiclass.-1.joblib'


2022-12-31 20:14:30,706 - malid.train.training_utils - INFO - Skipping xgboost from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/TCR/sex_healthy_only/train_smaller_model.xgboost.-1.joblib'


2022-12-31 20:14:30,707 - malid.train.training_utils - INFO - Skipping linearsvm_ovr from -1 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/convergent_clusters/TCR/sex_healthy_only/train_smaller_model.linearsvm_ovr.-1.joblib'


GeneLocus.TCR TargetObsColumnEnum.disease


Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
linearsvm_ovr,0.923 +/- 0.009 (in 3 folds),0.926 +/- 0.007 (in 3 folds),0.920 +/- 0.013 (in 3 folds),0.927 +/- 0.010 (in 3 folds),0.755 +/- 0.028 (in 3 folds),0.637 +/- 0.048 (in 3 folds),0.755,0.635,274,0,274,0.0,False
linearsvm_ovr.decision_thresholds_tuned,0.923 +/- 0.009 (in 3 folds),0.926 +/- 0.007 (in 3 folds),0.920 +/- 0.013 (in 3 folds),0.927 +/- 0.010 (in 3 folds),0.814 +/- 0.018 (in 3 folds),0.745 +/- 0.023 (in 3 folds),0.814,0.741,274,0,274,0.0,False
lasso_multiclass,0.903 +/- 0.017 (in 3 folds),0.903 +/- 0.024 (in 3 folds),0.901 +/- 0.016 (in 3 folds),0.905 +/- 0.022 (in 3 folds),0.766 +/- 0.031 (in 3 folds),0.665 +/- 0.040 (in 3 folds),0.766,0.662,274,0,274,0.0,False
lasso_multiclass.decision_thresholds_tuned,0.903 +/- 0.017 (in 3 folds),0.903 +/- 0.024 (in 3 folds),0.901 +/- 0.016 (in 3 folds),0.905 +/- 0.022 (in 3 folds),0.796 +/- 0.032 (in 3 folds),0.713 +/- 0.045 (in 3 folds),0.796,0.71,274,0,274,0.0,False
ridge_cv,0.894 +/- 0.018 (in 3 folds),0.902 +/- 0.018 (in 3 folds),0.879 +/- 0.017 (in 3 folds),0.891 +/- 0.017 (in 3 folds),0.536 +/- 0.069 (in 3 folds),0.209 +/- 0.195 (in 3 folds),0.536,0.253,274,0,274,0.0,False
ridge_cv.decision_thresholds_tuned,0.894 +/- 0.018 (in 3 folds),0.902 +/- 0.018 (in 3 folds),0.879 +/- 0.017 (in 3 folds),0.891 +/- 0.017 (in 3 folds),0.726 +/- 0.039 (in 3 folds),0.642 +/- 0.049 (in 3 folds),0.726,0.635,274,0,274,0.0,False
xgboost,0.891 +/- 0.011 (in 3 folds),0.886 +/- 0.013 (in 3 folds),0.889 +/- 0.011 (in 3 folds),0.890 +/- 0.012 (in 3 folds),0.730 +/- 0.034 (in 3 folds),0.607 +/- 0.050 (in 3 folds),0.73,0.597,274,0,274,0.0,False
xgboost.decision_thresholds_tuned,0.891 +/- 0.011 (in 3 folds),0.886 +/- 0.013 (in 3 folds),0.889 +/- 0.011 (in 3 folds),0.890 +/- 0.012 (in 3 folds),0.774 +/- 0.025 (in 3 folds),0.672 +/- 0.036 (in 3 folds),0.774,0.665,274,0,274,0.0,False
lasso_cv,0.881 +/- 0.019 (in 3 folds),0.887 +/- 0.012 (in 3 folds),0.874 +/- 0.017 (in 3 folds),0.884 +/- 0.015 (in 3 folds),0.632 +/- 0.063 (in 3 folds),0.432 +/- 0.105 (in 3 folds),0.631,0.433,274,0,274,0.0,False
lasso_cv.decision_thresholds_tuned,0.881 +/- 0.019 (in 3 folds),0.887 +/- 0.012 (in 3 folds),0.874 +/- 0.017 (in 3 folds),0.884 +/- 0.015 (in 3 folds),0.741 +/- 0.014 (in 3 folds),0.656 +/- 0.019 (in 3 folds),0.741,0.643,274,0,274,0.0,False


GeneLocus.TCR TargetObsColumnEnum.disease_all_demographics_present


Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,Accuracy per fold with abstention,MCC per fold with abstention,...,au-PRC (macro OvO) per fold with abstention,Accuracy global with abstention,MCC global with abstention,Unknown/abstention proportion global with abstention,Abstention label global with abstention,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
linearsvm_ovr,0.907 +/- 0.009 (in 3 folds),0.906 +/- 0.016 (in 3 folds),0.889 +/- 0.006 (in 3 folds),0.892 +/- 0.002 (in 3 folds),0.749 +/- 0.028 (in 3 folds),0.639 +/- 0.055 (in 3 folds),0.749,0.636,0.746 +/- 0.029 (in 3 folds),0.636 +/- 0.056 (in 3 folds),...,0.893 +/- 0.001 (in 2 folds),0.746,0.633,0.004,Unknown,239,1,240,0.004167,False
linearsvm_ovr.decision_thresholds_tuned,0.907 +/- 0.009 (in 3 folds),0.906 +/- 0.016 (in 3 folds),0.889 +/- 0.006 (in 3 folds),0.892 +/- 0.002 (in 3 folds),0.791 +/- 0.010 (in 3 folds),0.707 +/- 0.023 (in 3 folds),0.791,0.706,0.787 +/- 0.014 (in 3 folds),0.704 +/- 0.027 (in 3 folds),...,0.893 +/- 0.001 (in 2 folds),0.787,0.702,0.004,Unknown,239,1,240,0.004167,False
lasso_multiclass,0.906 +/- 0.012 (in 3 folds),0.905 +/- 0.017 (in 3 folds),0.897 +/- 0.011 (in 3 folds),0.899 +/- 0.010 (in 3 folds),0.761 +/- 0.016 (in 3 folds),0.671 +/- 0.033 (in 3 folds),0.762,0.668,0.758 +/- 0.017 (in 3 folds),0.668 +/- 0.036 (in 3 folds),...,0.903 +/- 0.011 (in 2 folds),0.758,0.664,0.004,Unknown,239,1,240,0.004167,False
lasso_multiclass.decision_thresholds_tuned,0.906 +/- 0.012 (in 3 folds),0.905 +/- 0.017 (in 3 folds),0.897 +/- 0.011 (in 3 folds),0.899 +/- 0.010 (in 3 folds),0.795 +/- 0.017 (in 3 folds),0.715 +/- 0.033 (in 3 folds),0.795,0.712,0.792 +/- 0.021 (in 3 folds),0.712 +/- 0.038 (in 3 folds),...,0.903 +/- 0.011 (in 2 folds),0.792,0.708,0.004,Unknown,239,1,240,0.004167,False
ridge_cv,0.889 +/- 0.008 (in 3 folds),0.892 +/- 0.013 (in 3 folds),0.874 +/- 0.010 (in 3 folds),0.881 +/- 0.016 (in 3 folds),0.547 +/- 0.115 (in 3 folds),0.174 +/- 0.301 (in 3 folds),0.548,0.286,0.545 +/- 0.117 (in 3 folds),0.189 +/- 0.289 (in 3 folds),...,0.889 +/- 0.006 (in 2 folds),0.546,0.284,0.004,Unknown,239,1,240,0.004167,False
ridge_cv.decision_thresholds_tuned,0.889 +/- 0.008 (in 3 folds),0.892 +/- 0.013 (in 3 folds),0.874 +/- 0.010 (in 3 folds),0.881 +/- 0.016 (in 3 folds),0.534 +/- 0.280 (in 3 folds),0.379 +/- 0.357 (in 3 folds),0.536,0.392,0.531 +/- 0.279 (in 3 folds),0.377 +/- 0.357 (in 3 folds),...,0.889 +/- 0.006 (in 2 folds),0.533,0.391,0.004,Unknown,239,1,240,0.004167,False
xgboost,0.885 +/- 0.024 (in 3 folds),0.884 +/- 0.024 (in 3 folds),0.878 +/- 0.033 (in 3 folds),0.882 +/- 0.032 (in 3 folds),0.758 +/- 0.031 (in 3 folds),0.643 +/- 0.046 (in 3 folds),0.758,0.638,,,...,,,,,,240,0,240,0.0,False
xgboost.decision_thresholds_tuned,0.885 +/- 0.024 (in 3 folds),0.884 +/- 0.024 (in 3 folds),0.878 +/- 0.033 (in 3 folds),0.882 +/- 0.032 (in 3 folds),0.796 +/- 0.012 (in 3 folds),0.709 +/- 0.002 (in 3 folds),0.796,0.704,,,...,,,,,,240,0,240,0.0,False
rf_multiclass,0.885 +/- 0.014 (in 3 folds),0.882 +/- 0.008 (in 3 folds),0.881 +/- 0.016 (in 3 folds),0.879 +/- 0.009 (in 3 folds),0.716 +/- 0.022 (in 3 folds),0.573 +/- 0.032 (in 3 folds),0.715,0.571,0.713 +/- 0.019 (in 3 folds),0.569 +/- 0.027 (in 3 folds),...,0.879 +/- 0.013 (in 2 folds),0.713,0.568,0.004,Unknown,239,1,240,0.004167,False
rf_multiclass.decision_thresholds_tuned,0.885 +/- 0.014 (in 3 folds),0.882 +/- 0.008 (in 3 folds),0.881 +/- 0.016 (in 3 folds),0.879 +/- 0.009 (in 3 folds),0.787 +/- 0.020 (in 3 folds),0.702 +/- 0.041 (in 3 folds),0.787,0.697,0.783 +/- 0.015 (in 3 folds),0.698 +/- 0.037 (in 3 folds),...,0.879 +/- 0.013 (in 2 folds),0.783,0.693,0.004,Unknown,239,1,240,0.004167,False


GeneLocus.TCR TargetObsColumnEnum.covid_vs_healthy


Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
lasso_multiclass,0.964 +/- 0.039 (in 3 folds),0.964 +/- 0.039 (in 3 folds),0.990 +/- 0.010 (in 3 folds),0.990 +/- 0.010 (in 3 folds),0.923 +/- 0.044 (in 3 folds),0.799 +/- 0.095 (in 3 folds),0.923,0.791,168,0,168,0.0,False
lasso_multiclass.decision_thresholds_tuned,0.964 +/- 0.039 (in 3 folds),0.964 +/- 0.039 (in 3 folds),0.990 +/- 0.010 (in 3 folds),0.990 +/- 0.010 (in 3 folds),0.935 +/- 0.053 (in 3 folds),0.836 +/- 0.121 (in 3 folds),0.935,0.83,168,0,168,0.0,False
linearsvm_ovr,0.964 +/- 0.039 (in 3 folds),0.964 +/- 0.039 (in 3 folds),0.991 +/- 0.010 (in 3 folds),0.991 +/- 0.010 (in 3 folds),0.911 +/- 0.063 (in 3 folds),0.791 +/- 0.107 (in 3 folds),0.911,0.772,168,0,168,0.0,False
linearsvm_ovr.decision_thresholds_tuned,0.964 +/- 0.039 (in 3 folds),0.964 +/- 0.039 (in 3 folds),0.991 +/- 0.010 (in 3 folds),0.991 +/- 0.010 (in 3 folds),0.947 +/- 0.035 (in 3 folds),0.858 +/- 0.088 (in 3 folds),0.946,0.857,168,0,168,0.0,False
lasso_cv,0.962 +/- 0.040 (in 3 folds),0.962 +/- 0.040 (in 3 folds),0.990 +/- 0.010 (in 3 folds),0.990 +/- 0.010 (in 3 folds),0.815 +/- 0.028 (in 3 folds),0.382 +/- 0.148 (in 3 folds),0.815,0.385,168,0,168,0.0,False
lasso_cv.decision_thresholds_tuned,0.962 +/- 0.040 (in 3 folds),0.962 +/- 0.040 (in 3 folds),0.990 +/- 0.010 (in 3 folds),0.990 +/- 0.010 (in 3 folds),0.929 +/- 0.052 (in 3 folds),0.832 +/- 0.109 (in 3 folds),0.929,0.823,168,0,168,0.0,False
xgboost,0.962 +/- 0.029 (in 3 folds),0.962 +/- 0.029 (in 3 folds),0.987 +/- 0.008 (in 3 folds),0.987 +/- 0.008 (in 3 folds),0.905 +/- 0.019 (in 3 folds),0.736 +/- 0.046 (in 3 folds),0.905,0.719,168,0,168,0.0,False
xgboost.decision_thresholds_tuned,0.962 +/- 0.029 (in 3 folds),0.962 +/- 0.029 (in 3 folds),0.987 +/- 0.008 (in 3 folds),0.987 +/- 0.008 (in 3 folds),0.935 +/- 0.036 (in 3 folds),0.826 +/- 0.079 (in 3 folds),0.935,0.819,168,0,168,0.0,False
elasticnet_cv,0.960 +/- 0.040 (in 3 folds),0.960 +/- 0.040 (in 3 folds),0.990 +/- 0.010 (in 3 folds),0.990 +/- 0.010 (in 3 folds),0.815 +/- 0.041 (in 3 folds),0.328 +/- 0.288 (in 3 folds),0.815,0.385,168,0,168,0.0,False
elasticnet_cv.decision_thresholds_tuned,0.960 +/- 0.040 (in 3 folds),0.960 +/- 0.040 (in 3 folds),0.990 +/- 0.010 (in 3 folds),0.990 +/- 0.010 (in 3 folds),0.923 +/- 0.054 (in 3 folds),0.827 +/- 0.111 (in 3 folds),0.923,0.819,168,0,168,0.0,False


GeneLocus.TCR TargetObsColumnEnum.hiv_vs_healthy


Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
linearsvm_ovr,0.881 +/- 0.023 (in 3 folds),0.881 +/- 0.023 (in 3 folds),0.942 +/- 0.009 (in 3 folds),0.942 +/- 0.009 (in 3 folds),0.783 +/- 0.017 (in 3 folds),0.529 +/- 0.028 (in 3 folds),0.784,0.5,194,0,194,0.0,False
linearsvm_ovr.decision_thresholds_tuned,0.881 +/- 0.023 (in 3 folds),0.881 +/- 0.023 (in 3 folds),0.942 +/- 0.009 (in 3 folds),0.942 +/- 0.009 (in 3 folds),0.814 +/- 0.054 (in 3 folds),0.644 +/- 0.073 (in 3 folds),0.814,0.638,194,0,194,0.0,False
lasso_multiclass,0.873 +/- 0.023 (in 3 folds),0.873 +/- 0.023 (in 3 folds),0.939 +/- 0.007 (in 3 folds),0.939 +/- 0.007 (in 3 folds),0.768 +/- 0.017 (in 3 folds),0.511 +/- 0.015 (in 3 folds),0.768,0.506,194,0,194,0.0,False
lasso_multiclass.decision_thresholds_tuned,0.873 +/- 0.023 (in 3 folds),0.873 +/- 0.023 (in 3 folds),0.939 +/- 0.007 (in 3 folds),0.939 +/- 0.007 (in 3 folds),0.809 +/- 0.016 (in 3 folds),0.598 +/- 0.003 (in 3 folds),0.809,0.591,194,0,194,0.0,False
lasso_cv,0.857 +/- 0.011 (in 3 folds),0.857 +/- 0.011 (in 3 folds),0.934 +/- 0.004 (in 3 folds),0.934 +/- 0.004 (in 3 folds),0.773 +/- 0.017 (in 3 folds),0.465 +/- 0.061 (in 3 folds),0.773,0.462,194,0,194,0.0,False
lasso_cv.decision_thresholds_tuned,0.857 +/- 0.011 (in 3 folds),0.857 +/- 0.011 (in 3 folds),0.934 +/- 0.004 (in 3 folds),0.934 +/- 0.004 (in 3 folds),0.789 +/- 0.017 (in 3 folds),0.579 +/- 0.029 (in 3 folds),0.789,0.574,194,0,194,0.0,False
elasticnet_cv,0.854 +/- 0.012 (in 3 folds),0.854 +/- 0.012 (in 3 folds),0.933 +/- 0.005 (in 3 folds),0.933 +/- 0.005 (in 3 folds),0.768 +/- 0.016 (in 3 folds),0.451 +/- 0.051 (in 3 folds),0.768,0.448,194,0,194,0.0,False
elasticnet_cv.decision_thresholds_tuned,0.854 +/- 0.012 (in 3 folds),0.854 +/- 0.012 (in 3 folds),0.933 +/- 0.005 (in 3 folds),0.933 +/- 0.005 (in 3 folds),0.789 +/- 0.017 (in 3 folds),0.579 +/- 0.029 (in 3 folds),0.789,0.574,194,0,194,0.0,False
ridge_cv,0.853 +/- 0.045 (in 3 folds),0.853 +/- 0.045 (in 3 folds),0.930 +/- 0.016 (in 3 folds),0.930 +/- 0.016 (in 3 folds),0.696 +/- 0.047 (in 3 folds),0.132 +/- 0.228 (in 3 folds),0.696,0.217,194,0,194,0.0,False
ridge_cv.decision_thresholds_tuned,0.853 +/- 0.045 (in 3 folds),0.853 +/- 0.045 (in 3 folds),0.930 +/- 0.016 (in 3 folds),0.930 +/- 0.016 (in 3 folds),0.727 +/- 0.101 (in 3 folds),0.213 +/- 0.369 (in 3 folds),0.727,0.322,194,0,194,0.0,False


GeneLocus.TCR TargetObsColumnEnum.lupus_vs_healthy


Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,Accuracy per fold with abstention,MCC per fold with abstention,...,Abstention label global with abstention,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes,ROC-AUC (weighted OvO) per fold with abstention,ROC-AUC (macro OvO) per fold with abstention,au-PRC (weighted OvO) per fold with abstention,au-PRC (macro OvO) per fold with abstention
elasticnet_cv,0.951 +/- 0.033 (in 3 folds),0.951 +/- 0.033 (in 3 folds),0.892 +/- 0.058 (in 3 folds),0.892 +/- 0.058 (in 3 folds),0.788 +/- 0.020 (in 3 folds),0.249 +/- 0.219 (in 3 folds),0.788,0.309,0.779 +/- 0.021 (in 3 folds),0.264 +/- 0.127 (in 3 folds),...,Unknown,170,2,172,0.011628,False,0.913 +/- 0.000 (in 1 folds),0.913 +/- 0.000 (in 1 folds),0.825 +/- 0.000 (in 1 folds),0.825 +/- 0.000 (in 1 folds)
elasticnet_cv.decision_thresholds_tuned,0.951 +/- 0.033 (in 3 folds),0.951 +/- 0.033 (in 3 folds),0.892 +/- 0.058 (in 3 folds),0.892 +/- 0.058 (in 3 folds),0.918 +/- 0.036 (in 3 folds),0.776 +/- 0.091 (in 3 folds),0.918,0.769,0.907 +/- 0.027 (in 3 folds),0.751 +/- 0.069 (in 3 folds),...,Unknown,170,2,172,0.011628,False,0.913 +/- 0.000 (in 1 folds),0.913 +/- 0.000 (in 1 folds),0.825 +/- 0.000 (in 1 folds),0.825 +/- 0.000 (in 1 folds)
ridge_cv,0.945 +/- 0.029 (in 3 folds),0.945 +/- 0.029 (in 3 folds),0.875 +/- 0.054 (in 3 folds),0.875 +/- 0.054 (in 3 folds),0.759 +/- 0.008 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.759,0.0,0.750 +/- 0.008 (in 3 folds),0.027 +/- 0.081 (in 3 folds),...,Unknown,170,2,172,0.011628,True,0.913 +/- 0.000 (in 1 folds),0.913 +/- 0.000 (in 1 folds),0.824 +/- 0.000 (in 1 folds),0.824 +/- 0.000 (in 1 folds)
ridge_cv.decision_thresholds_tuned,0.945 +/- 0.029 (in 3 folds),0.945 +/- 0.029 (in 3 folds),0.875 +/- 0.054 (in 3 folds),0.875 +/- 0.054 (in 3 folds),0.759 +/- 0.008 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.759,0.0,0.750 +/- 0.008 (in 3 folds),0.027 +/- 0.081 (in 3 folds),...,Unknown,170,2,172,0.011628,True,0.913 +/- 0.000 (in 1 folds),0.913 +/- 0.000 (in 1 folds),0.824 +/- 0.000 (in 1 folds),0.824 +/- 0.000 (in 1 folds)
lasso_multiclass,0.925 +/- 0.080 (in 3 folds),0.925 +/- 0.080 (in 3 folds),0.862 +/- 0.117 (in 3 folds),0.862 +/- 0.117 (in 3 folds),0.892 +/- 0.038 (in 3 folds),0.708 +/- 0.096 (in 3 folds),0.893,0.701,0.872 +/- 0.045 (in 3 folds),0.665 +/- 0.100 (in 3 folds),...,Unknown,168,4,172,0.023256,False,,,,
lasso_multiclass.decision_thresholds_tuned,0.925 +/- 0.080 (in 3 folds),0.925 +/- 0.080 (in 3 folds),0.862 +/- 0.117 (in 3 folds),0.862 +/- 0.117 (in 3 folds),0.916 +/- 0.039 (in 3 folds),0.767 +/- 0.108 (in 3 folds),0.917,0.766,0.895 +/- 0.047 (in 3 folds),0.716 +/- 0.123 (in 3 folds),...,Unknown,168,4,172,0.023256,False,,,,
linearsvm_ovr,0.925 +/- 0.080 (in 3 folds),0.925 +/- 0.080 (in 3 folds),0.862 +/- 0.117 (in 3 folds),0.862 +/- 0.117 (in 3 folds),0.898 +/- 0.047 (in 3 folds),0.724 +/- 0.122 (in 3 folds),0.899,0.72,0.878 +/- 0.053 (in 3 folds),0.681 +/- 0.125 (in 3 folds),...,Unknown,168,4,172,0.023256,False,,,,
linearsvm_ovr.decision_thresholds_tuned,0.925 +/- 0.080 (in 3 folds),0.925 +/- 0.080 (in 3 folds),0.862 +/- 0.117 (in 3 folds),0.862 +/- 0.117 (in 3 folds),0.916 +/- 0.039 (in 3 folds),0.767 +/- 0.108 (in 3 folds),0.917,0.766,0.895 +/- 0.047 (in 3 folds),0.716 +/- 0.123 (in 3 folds),...,Unknown,168,4,172,0.023256,False,,,,
lasso_cv,0.919 +/- 0.021 (in 3 folds),0.919 +/- 0.021 (in 3 folds),0.825 +/- 0.047 (in 3 folds),0.825 +/- 0.047 (in 3 folds),0.840 +/- 0.061 (in 3 folds),0.507 +/- 0.220 (in 3 folds),0.84,0.531,0.825 +/- 0.048 (in 3 folds),0.474 +/- 0.170 (in 3 folds),...,Unknown,169,3,172,0.017442,False,0.908 +/- 0.000 (in 1 folds),0.908 +/- 0.000 (in 1 folds),0.803 +/- 0.000 (in 1 folds),0.803 +/- 0.000 (in 1 folds)
lasso_cv.decision_thresholds_tuned,0.919 +/- 0.021 (in 3 folds),0.919 +/- 0.021 (in 3 folds),0.825 +/- 0.047 (in 3 folds),0.825 +/- 0.047 (in 3 folds),0.882 +/- 0.026 (in 3 folds),0.675 +/- 0.072 (in 3 folds),0.882,0.665,0.866 +/- 0.011 (in 3 folds),0.637 +/- 0.030 (in 3 folds),...,Unknown,169,3,172,0.017442,False,0.908 +/- 0.000 (in 1 folds),0.908 +/- 0.000 (in 1 folds),0.803 +/- 0.000 (in 1 folds),0.803 +/- 0.000 (in 1 folds)


GeneLocus.TCR TargetObsColumnEnum.ethnicity_condensed_healthy_only


Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,ROC-AUC (weighted OvO) per fold with abstention,ROC-AUC (macro OvO) per fold with abstention,...,Unknown/abstention proportion per fold with abstention,Accuracy global with abstention,MCC global with abstention,Unknown/abstention proportion global with abstention,Abstention label global with abstention,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
xgboost,0.702 +/- 0.041 (in 3 folds),0.690 +/- 0.038 (in 3 folds),0.709 +/- 0.024 (in 3 folds),0.707 +/- 0.009 (in 3 folds),0.601 +/- 0.097 (in 3 folds),0.357 +/- 0.084 (in 3 folds),0.598,0.345,0.657 +/- 0.000 (in 1 folds),0.651 +/- 0.000 (in 1 folds),...,0.103 +/- 0.036 (in 2 folds),0.557,0.273,0.07,Unknown,107,8,115,0.069565,False
xgboost.decision_thresholds_tuned,0.702 +/- 0.041 (in 3 folds),0.690 +/- 0.038 (in 3 folds),0.709 +/- 0.024 (in 3 folds),0.707 +/- 0.009 (in 3 folds),0.639 +/- 0.126 (in 3 folds),0.444 +/- 0.163 (in 3 folds),0.636,0.44,0.657 +/- 0.000 (in 1 folds),0.651 +/- 0.000 (in 1 folds),...,0.103 +/- 0.036 (in 2 folds),0.591,0.342,0.07,Unknown,107,8,115,0.069565,False
linearsvm_ovr,0.692 +/- 0.052 (in 3 folds),0.697 +/- 0.058 (in 3 folds),0.716 +/- 0.018 (in 3 folds),0.725 +/- 0.040 (in 3 folds),0.583 +/- 0.078 (in 3 folds),0.331 +/- 0.086 (in 3 folds),0.584,0.338,0.718 +/- 0.038 (in 2 folds),0.723 +/- 0.050 (in 2 folds),...,0.051 +/- 0.000 (in 1 folds),0.574,0.292,0.017,Unknown,113,2,115,0.017391,True
linearsvm_ovr.decision_thresholds_tuned,0.692 +/- 0.052 (in 3 folds),0.697 +/- 0.058 (in 3 folds),0.716 +/- 0.018 (in 3 folds),0.725 +/- 0.040 (in 3 folds),0.663 +/- 0.025 (in 3 folds),0.461 +/- 0.064 (in 3 folds),0.664,0.474,0.718 +/- 0.038 (in 2 folds),0.723 +/- 0.050 (in 2 folds),...,0.051 +/- 0.000 (in 1 folds),0.652,0.443,0.017,Unknown,113,2,115,0.017391,True
lasso_multiclass,0.673 +/- 0.018 (in 3 folds),0.662 +/- 0.012 (in 3 folds),0.684 +/- 0.015 (in 3 folds),0.673 +/- 0.010 (in 3 folds),0.600 +/- 0.090 (in 3 folds),0.371 +/- 0.103 (in 3 folds),0.602,0.382,0.683 +/- 0.005 (in 2 folds),0.668 +/- 0.005 (in 2 folds),...,0.051 +/- 0.000 (in 1 folds),0.591,0.336,0.017,Unknown,113,2,115,0.017391,True
lasso_multiclass.decision_thresholds_tuned,0.673 +/- 0.018 (in 3 folds),0.662 +/- 0.012 (in 3 folds),0.684 +/- 0.015 (in 3 folds),0.673 +/- 0.010 (in 3 folds),0.690 +/- 0.036 (in 3 folds),0.516 +/- 0.031 (in 3 folds),0.69,0.512,0.683 +/- 0.005 (in 2 folds),0.668 +/- 0.005 (in 2 folds),...,0.051 +/- 0.000 (in 1 folds),0.678,0.487,0.017,Unknown,113,2,115,0.017391,True
lasso_cv,0.622 +/- 0.073 (in 3 folds),0.612 +/- 0.068 (in 3 folds),0.669 +/- 0.052 (in 3 folds),0.663 +/- 0.048 (in 3 folds),0.541 +/- 0.133 (in 3 folds),0.273 +/- 0.104 (in 3 folds),0.546,0.263,0.645 +/- 0.000 (in 1 folds),0.639 +/- 0.000 (in 1 folds),...,0.093 +/- 0.022 (in 2 folds),0.513,0.154,0.061,Unknown,108,7,115,0.06087,True
lasso_cv.decision_thresholds_tuned,0.622 +/- 0.073 (in 3 folds),0.612 +/- 0.068 (in 3 folds),0.669 +/- 0.052 (in 3 folds),0.663 +/- 0.048 (in 3 folds),0.624 +/- 0.102 (in 3 folds),0.436 +/- 0.095 (in 3 folds),0.63,0.44,0.645 +/- 0.000 (in 1 folds),0.639 +/- 0.000 (in 1 folds),...,0.093 +/- 0.022 (in 2 folds),0.591,0.345,0.061,Unknown,108,7,115,0.06087,True
rf_multiclass,0.612 +/- 0.089 (in 3 folds),0.609 +/- 0.066 (in 3 folds),0.640 +/- 0.048 (in 3 folds),0.629 +/- 0.038 (in 3 folds),0.597 +/- 0.145 (in 3 folds),0.381 +/- 0.173 (in 3 folds),0.591,0.365,0.562 +/- 0.025 (in 2 folds),0.572 +/- 0.024 (in 2 folds),...,0.128 +/- 0.000 (in 1 folds),0.565,0.284,0.043,Unknown,110,5,115,0.043478,True
rf_multiclass.decision_thresholds_tuned,0.612 +/- 0.089 (in 3 folds),0.609 +/- 0.066 (in 3 folds),0.640 +/- 0.048 (in 3 folds),0.629 +/- 0.038 (in 3 folds),0.571 +/- 0.172 (in 3 folds),0.384 +/- 0.171 (in 3 folds),0.564,0.295,0.562 +/- 0.025 (in 2 folds),0.572 +/- 0.024 (in 2 folds),...,0.128 +/- 0.000 (in 1 folds),0.539,0.272,0.043,Unknown,110,5,115,0.043478,False














GeneLocus.TCR TargetObsColumnEnum.age_group_healthy_only






















































































































































































































































































































































































































































Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,ROC-AUC (weighted OvO) per fold with abstention,ROC-AUC (macro OvO) per fold with abstention,...,Unknown/abstention proportion per fold with abstention,Accuracy global with abstention,MCC global with abstention,Unknown/abstention proportion global with abstention,Abstention label global with abstention,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
lasso_multiclass,0.624 +/- 0.021 (in 3 folds),0.604 +/- 0.014 (in 3 folds),0.691 +/- 0.012 (in 3 folds),0.675 +/- 0.013 (in 3 folds),0.324 +/- 0.035 (in 3 folds),0.250 +/- 0.044 (in 3 folds),0.325,0.194,0.632 +/- 0.021 (in 2 folds),0.612 +/- 0.000 (in 2 folds),...,0.026 +/- 0.000 (in 1 folds),0.322,0.193,0.009,Unknown,114,1,115,0.008696,True
lasso_multiclass.decision_thresholds_tuned,0.624 +/- 0.021 (in 3 folds),0.604 +/- 0.014 (in 3 folds),0.691 +/- 0.012 (in 3 folds),0.675 +/- 0.013 (in 3 folds),0.456 +/- 0.021 (in 3 folds),0.395 +/- 0.050 (in 3 folds),0.456,0.355,0.632 +/- 0.021 (in 2 folds),0.612 +/- 0.000 (in 2 folds),...,0.026 +/- 0.000 (in 1 folds),0.452,0.353,0.009,Unknown,114,1,115,0.008696,True
lasso_cv,0.619 +/- 0.035 (in 3 folds),0.604 +/- 0.031 (in 3 folds),0.692 +/- 0.014 (in 3 folds),0.681 +/- 0.011 (in 3 folds),0.298 +/- 0.053 (in 3 folds),0.253 +/- 0.029 (in 3 folds),0.298,0.184,0.624 +/- 0.048 (in 2 folds),0.610 +/- 0.041 (in 2 folds),...,0.026 +/- 0.000 (in 1 folds),0.296,0.183,0.009,Unknown,114,1,115,0.008696,True
lasso_cv.decision_thresholds_tuned,0.619 +/- 0.035 (in 3 folds),0.604 +/- 0.031 (in 3 folds),0.692 +/- 0.014 (in 3 folds),0.681 +/- 0.011 (in 3 folds),0.430 +/- 0.038 (in 3 folds),0.374 +/- 0.037 (in 3 folds),0.43,0.331,0.624 +/- 0.048 (in 2 folds),0.610 +/- 0.041 (in 2 folds),...,0.026 +/- 0.000 (in 1 folds),0.426,0.328,0.009,Unknown,114,1,115,0.008696,True
rf_multiclass,0.615 +/- 0.026 (in 3 folds),0.598 +/- 0.030 (in 3 folds),0.657 +/- 0.011 (in 3 folds),0.644 +/- 0.015 (in 3 folds),0.324 +/- 0.009 (in 3 folds),0.230 +/- 0.005 (in 3 folds),0.325,0.18,0.629 +/- 0.012 (in 2 folds),0.611 +/- 0.027 (in 2 folds),...,0.026 +/- 0.000 (in 1 folds),0.322,0.179,0.009,Unknown,114,1,115,0.008696,True
rf_multiclass.decision_thresholds_tuned,0.615 +/- 0.026 (in 3 folds),0.598 +/- 0.030 (in 3 folds),0.657 +/- 0.011 (in 3 folds),0.644 +/- 0.015 (in 3 folds),0.394 +/- 0.087 (in 3 folds),0.372 +/- 0.048 (in 3 folds),0.395,0.303,0.629 +/- 0.012 (in 2 folds),0.611 +/- 0.027 (in 2 folds),...,0.026 +/- 0.000 (in 1 folds),0.391,0.301,0.009,Unknown,114,1,115,0.008696,True
xgboost,0.606 +/- 0.062 (in 3 folds),0.581 +/- 0.065 (in 3 folds),0.660 +/- 0.051 (in 3 folds),0.646 +/- 0.060 (in 3 folds),0.357 +/- 0.035 (in 3 folds),0.228 +/- 0.062 (in 3 folds),0.355,0.217,0.655 +/- 0.000 (in 1 folds),0.647 +/- 0.000 (in 1 folds),...,0.103 +/- 0.073 (in 2 folds),0.33,0.2,0.07,Unknown,107,8,115,0.069565,True
xgboost.decision_thresholds_tuned,0.606 +/- 0.062 (in 3 folds),0.581 +/- 0.065 (in 3 folds),0.660 +/- 0.051 (in 3 folds),0.646 +/- 0.060 (in 3 folds),0.484 +/- 0.058 (in 3 folds),0.406 +/- 0.044 (in 3 folds),0.486,0.384,0.655 +/- 0.000 (in 1 folds),0.647 +/- 0.000 (in 1 folds),...,0.103 +/- 0.073 (in 2 folds),0.452,0.35,0.07,Unknown,107,8,115,0.069565,True
linearsvm_ovr,0.604 +/- 0.010 (in 3 folds),0.580 +/- 0.022 (in 3 folds),0.664 +/- 0.031 (in 3 folds),0.646 +/- 0.040 (in 3 folds),0.355 +/- 0.040 (in 3 folds),0.240 +/- 0.050 (in 3 folds),0.355,0.213,0.602 +/- 0.000 (in 1 folds),0.587 +/- 0.000 (in 1 folds),...,0.064 +/- 0.054 (in 2 folds),0.339,0.204,0.043,Unknown,110,5,115,0.043478,True
linearsvm_ovr.decision_thresholds_tuned,0.604 +/- 0.010 (in 3 folds),0.580 +/- 0.022 (in 3 folds),0.664 +/- 0.031 (in 3 folds),0.646 +/- 0.040 (in 3 folds),0.500 +/- 0.014 (in 3 folds),0.420 +/- 0.032 (in 3 folds),0.5,0.41,0.602 +/- 0.000 (in 1 folds),0.587 +/- 0.000 (in 1 folds),...,0.064 +/- 0.054 (in 2 folds),0.478,0.386,0.043,Unknown,110,5,115,0.043478,True




2022-12-31 20:14:50,151 - malid.external.model_evaluation - ERROR - Error in evaluating predict-proba-based metric rocauc: Only one class present in y_true. Probability-based score is not defined in that case.




2022-12-31 20:14:50,163 - malid.external.model_evaluation - ERROR - Error in evaluating predict-proba-based metric auprc: Only one class present in y_true. Probability-based score is not defined in that case.


GeneLocus.TCR TargetObsColumnEnum.age_group_binary_healthy_only




2022-12-31 20:14:50,199 - malid.external.model_evaluation - ERROR - Error in evaluating predict-proba-based metric rocauc: Only one class present in y_true. Probability-based score is not defined in that case.




2022-12-31 20:14:50,206 - malid.external.model_evaluation - ERROR - Error in evaluating predict-proba-based metric auprc: Only one class present in y_true. Probability-based score is not defined in that case.




2022-12-31 20:14:50,233 - malid.external.model_evaluation - ERROR - Error in evaluating predict-proba-based metric rocauc: Only one class present in y_true. Probability-based score is not defined in that case.




2022-12-31 20:14:50,240 - malid.external.model_evaluation - ERROR - Error in evaluating predict-proba-based metric auprc: Only one class present in y_true. Probability-based score is not defined in that case.




2022-12-31 20:14:50,272 - malid.external.model_evaluation - ERROR - Error in evaluating predict-proba-based metric rocauc: Only one class present in y_true. Probability-based score is not defined in that case.




2022-12-31 20:14:50,280 - malid.external.model_evaluation - ERROR - Error in evaluating predict-proba-based metric auprc: Only one class present in y_true. Probability-based score is not defined in that case.




2022-12-31 20:14:50,314 - malid.external.model_evaluation - ERROR - Error in evaluating predict-proba-based metric rocauc: Only one class present in y_true. Probability-based score is not defined in that case.




2022-12-31 20:14:50,322 - malid.external.model_evaluation - ERROR - Error in evaluating predict-proba-based metric auprc: Only one class present in y_true. Probability-based score is not defined in that case.




2022-12-31 20:14:50,356 - malid.external.model_evaluation - ERROR - Error in evaluating predict-proba-based metric rocauc: Only one class present in y_true. Probability-based score is not defined in that case.




2022-12-31 20:14:50,367 - malid.external.model_evaluation - ERROR - Error in evaluating predict-proba-based metric auprc: Only one class present in y_true. Probability-based score is not defined in that case.




2022-12-31 20:14:50,397 - malid.external.model_evaluation - ERROR - Error in evaluating predict-proba-based metric rocauc: Only one class present in y_true. Probability-based score is not defined in that case.




2022-12-31 20:14:50,404 - malid.external.model_evaluation - ERROR - Error in evaluating predict-proba-based metric auprc: Only one class present in y_true. Probability-based score is not defined in that case.




2022-12-31 20:14:50,441 - malid.external.model_evaluation - ERROR - Error in evaluating predict-proba-based metric rocauc: Only one class present in y_true. Probability-based score is not defined in that case.




2022-12-31 20:14:50,449 - malid.external.model_evaluation - ERROR - Error in evaluating predict-proba-based metric auprc: Only one class present in y_true. Probability-based score is not defined in that case.




2022-12-31 20:14:50,479 - malid.external.model_evaluation - ERROR - Error in evaluating predict-proba-based metric rocauc: Only one class present in y_true. Probability-based score is not defined in that case.




2022-12-31 20:14:50,494 - malid.external.model_evaluation - ERROR - Error in evaluating predict-proba-based metric auprc: Only one class present in y_true. Probability-based score is not defined in that case.




2022-12-31 20:14:50,534 - malid.external.model_evaluation - ERROR - Error in evaluating predict-proba-based metric rocauc: Only one class present in y_true. Probability-based score is not defined in that case.




2022-12-31 20:14:50,546 - malid.external.model_evaluation - ERROR - Error in evaluating predict-proba-based metric auprc: Only one class present in y_true. Probability-based score is not defined in that case.




2022-12-31 20:14:50,581 - malid.external.model_evaluation - ERROR - Error in evaluating predict-proba-based metric rocauc: Only one class present in y_true. Probability-based score is not defined in that case.




2022-12-31 20:14:50,591 - malid.external.model_evaluation - ERROR - Error in evaluating predict-proba-based metric auprc: Only one class present in y_true. Probability-based score is not defined in that case.




2022-12-31 20:14:50,636 - malid.external.model_evaluation - ERROR - Error in evaluating predict-proba-based metric rocauc: Only one class present in y_true. Probability-based score is not defined in that case.




2022-12-31 20:14:50,645 - malid.external.model_evaluation - ERROR - Error in evaluating predict-proba-based metric auprc: Only one class present in y_true. Probability-based score is not defined in that case.


Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,ROC-AUC (weighted OvO) per fold with abstention,ROC-AUC (macro OvO) per fold with abstention,...,Unknown/abstention proportion per fold with abstention,Accuracy global with abstention,MCC global with abstention,Unknown/abstention proportion global with abstention,Abstention label global with abstention,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
lasso_multiclass,0.755 +/- 0.061 (in 3 folds),0.755 +/- 0.061 (in 3 folds),0.871 +/- 0.049 (in 3 folds),0.871 +/- 0.049 (in 3 folds),0.697 +/- 0.036 (in 3 folds),0.339 +/- 0.076 (in 3 folds),0.696,0.331,0.801 +/- 0.000 (in 1 folds),0.801 +/- 0.000 (in 1 folds),...,0.038 +/- 0.018 (in 2 folds),0.678,0.313,0.026,Unknown,112,3,115,0.026087,False
lasso_multiclass.decision_thresholds_tuned,0.755 +/- 0.061 (in 3 folds),0.755 +/- 0.061 (in 3 folds),0.871 +/- 0.049 (in 3 folds),0.871 +/- 0.049 (in 3 folds),0.724 +/- 0.081 (in 3 folds),0.500 +/- 0.128 (in 3 folds),0.723,0.469,0.801 +/- 0.000 (in 1 folds),0.801 +/- 0.000 (in 1 folds),...,0.038 +/- 0.018 (in 2 folds),0.704,0.445,0.026,Unknown,112,3,115,0.026087,False
linearsvm_ovr,0.743 +/- 0.055 (in 3 folds),0.743 +/- 0.055 (in 3 folds),0.864 +/- 0.029 (in 3 folds),0.864 +/- 0.029 (in 3 folds),0.706 +/- 0.050 (in 3 folds),0.334 +/- 0.134 (in 3 folds),0.705,0.34,0.745 +/- 0.000 (in 1 folds),0.745 +/- 0.000 (in 1 folds),...,0.038 +/- 0.018 (in 2 folds),0.687,0.32,0.026,Unknown,112,3,115,0.026087,False
linearsvm_ovr.decision_thresholds_tuned,0.743 +/- 0.055 (in 3 folds),0.743 +/- 0.055 (in 3 folds),0.864 +/- 0.029 (in 3 folds),0.864 +/- 0.029 (in 3 folds),0.715 +/- 0.077 (in 3 folds),0.442 +/- 0.096 (in 3 folds),0.714,0.423,0.745 +/- 0.000 (in 1 folds),0.745 +/- 0.000 (in 1 folds),...,0.038 +/- 0.018 (in 2 folds),0.696,0.402,0.026,Unknown,112,3,115,0.026087,False
elasticnet_cv,0.701 +/- 0.136 (in 2 folds),0.701 +/- 0.136 (in 2 folds),0.820 +/- 0.076 (in 2 folds),0.820 +/- 0.076 (in 2 folds),0.781 +/- 0.190 (in 3 folds),0.101 +/- 0.174 (in 3 folds),0.714,0.256,,,...,0.277 +/- 0.369 (in 3 folds),0.522,0.146,0.27,Unknown,84,31,115,0.269565,False
elasticnet_cv.decision_thresholds_tuned,0.701 +/- 0.136 (in 2 folds),0.701 +/- 0.136 (in 2 folds),0.820 +/- 0.076 (in 2 folds),0.820 +/- 0.076 (in 2 folds),0.734 +/- 0.278 (in 3 folds),0.245 +/- 0.243 (in 3 folds),0.655,0.35,,,...,0.277 +/- 0.369 (in 3 folds),0.478,0.216,0.27,Unknown,84,31,115,0.269565,False
ridge_cv,0.690 +/- 0.117 (in 2 folds),0.690 +/- 0.117 (in 2 folds),0.811 +/- 0.054 (in 2 folds),0.811 +/- 0.054 (in 2 folds),0.754 +/- 0.216 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.679,0.0,,,...,0.277 +/- 0.369 (in 3 folds),0.496,0.046,0.27,Unknown,84,31,115,0.269565,True
ridge_cv.decision_thresholds_tuned,0.690 +/- 0.117 (in 2 folds),0.690 +/- 0.117 (in 2 folds),0.811 +/- 0.054 (in 2 folds),0.811 +/- 0.054 (in 2 folds),0.808 +/- 0.172 (in 3 folds),0.162 +/- 0.281 (in 3 folds),0.75,0.375,,,...,0.277 +/- 0.369 (in 3 folds),0.548,0.212,0.27,Unknown,84,31,115,0.269565,False
lasso_cv,0.688 +/- 0.119 (in 2 folds),0.688 +/- 0.119 (in 2 folds),0.807 +/- 0.058 (in 2 folds),0.807 +/- 0.058 (in 2 folds),0.808 +/- 0.172 (in 3 folds),0.204 +/- 0.253 (in 3 folds),0.75,0.38,,,...,0.277 +/- 0.369 (in 3 folds),0.548,0.226,0.27,Unknown,84,31,115,0.269565,False
lasso_cv.decision_thresholds_tuned,0.688 +/- 0.119 (in 2 folds),0.688 +/- 0.119 (in 2 folds),0.807 +/- 0.058 (in 2 folds),0.807 +/- 0.058 (in 2 folds),0.734 +/- 0.278 (in 3 folds),0.245 +/- 0.243 (in 3 folds),0.655,0.35,,,...,0.277 +/- 0.369 (in 3 folds),0.478,0.216,0.27,Unknown,84,31,115,0.269565,False


GeneLocus.TCR TargetObsColumnEnum.sex_healthy_only


Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,Accuracy per fold with abstention,MCC per fold with abstention,...,Abstention label global with abstention,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes,ROC-AUC (weighted OvO) per fold with abstention,ROC-AUC (macro OvO) per fold with abstention,au-PRC (weighted OvO) per fold with abstention,au-PRC (macro OvO) per fold with abstention
linearsvm_ovr,0.598 +/- 0.035 (in 3 folds),0.598 +/- 0.035 (in 3 folds),0.591 +/- 0.133 (in 3 folds),0.591 +/- 0.133 (in 3 folds),0.576 +/- 0.132 (in 3 folds),0.192 +/- 0.117 (in 3 folds),0.577,0.162,0.556 +/- 0.129 (in 3 folds),0.179 +/- 0.102 (in 3 folds),...,Unknown,111,4,115,0.034783,False,,,,
linearsvm_ovr.decision_thresholds_tuned,0.598 +/- 0.035 (in 3 folds),0.598 +/- 0.035 (in 3 folds),0.591 +/- 0.133 (in 3 folds),0.591 +/- 0.133 (in 3 folds),0.664 +/- 0.096 (in 3 folds),0.344 +/- 0.057 (in 3 folds),0.667,0.365,0.642 +/- 0.102 (in 3 folds),0.301 +/- 0.071 (in 3 folds),...,Unknown,111,4,115,0.034783,False,,,,
lasso_multiclass,0.594 +/- 0.052 (in 3 folds),0.594 +/- 0.052 (in 3 folds),0.602 +/- 0.132 (in 3 folds),0.602 +/- 0.132 (in 3 folds),0.543 +/- 0.085 (in 3 folds),0.160 +/- 0.070 (in 3 folds),0.541,0.078,0.514 +/- 0.068 (in 3 folds),0.145 +/- 0.050 (in 3 folds),...,Unknown,109,6,115,0.052174,False,,,,
lasso_multiclass.decision_thresholds_tuned,0.594 +/- 0.052 (in 3 folds),0.594 +/- 0.052 (in 3 folds),0.602 +/- 0.132 (in 3 folds),0.602 +/- 0.132 (in 3 folds),0.659 +/- 0.078 (in 3 folds),0.298 +/- 0.044 (in 3 folds),0.661,0.36,0.625 +/- 0.073 (in 3 folds),0.227 +/- 0.096 (in 3 folds),...,Unknown,109,6,115,0.052174,False,,,,
ridge_cv,0.587 +/- 0.064 (in 3 folds),0.587 +/- 0.064 (in 3 folds),0.638 +/- 0.099 (in 3 folds),0.638 +/- 0.099 (in 3 folds),0.393 +/- 0.084 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.393,-0.234,0.384 +/- 0.092 (in 3 folds),0.046 +/- 0.041 (in 3 folds),...,Unknown,112,3,115,0.026087,False,0.567 +/- 0.000 (in 1 folds),0.567 +/- 0.000 (in 1 folds),0.630 +/- 0.000 (in 1 folds),0.630 +/- 0.000 (in 1 folds)
ridge_cv.decision_thresholds_tuned,0.587 +/- 0.064 (in 3 folds),0.587 +/- 0.064 (in 3 folds),0.638 +/- 0.099 (in 3 folds),0.638 +/- 0.099 (in 3 folds),0.519 +/- 0.154 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.518,0.032,0.505 +/- 0.141 (in 3 folds),-0.006 +/- 0.069 (in 3 folds),...,Unknown,112,3,115,0.026087,False,0.567 +/- 0.000 (in 1 folds),0.567 +/- 0.000 (in 1 folds),0.630 +/- 0.000 (in 1 folds),0.630 +/- 0.000 (in 1 folds)
lasso_cv,0.533 +/- 0.044 (in 3 folds),0.533 +/- 0.044 (in 3 folds),0.551 +/- 0.186 (in 3 folds),0.551 +/- 0.186 (in 3 folds),0.523 +/- 0.015 (in 3 folds),0.176 +/- 0.111 (in 3 folds),0.523,0.045,0.495 +/- 0.015 (in 3 folds),0.144 +/- 0.117 (in 3 folds),...,Unknown,109,6,115,0.052174,False,,,,
lasso_cv.decision_thresholds_tuned,0.533 +/- 0.044 (in 3 folds),0.533 +/- 0.044 (in 3 folds),0.551 +/- 0.186 (in 3 folds),0.551 +/- 0.186 (in 3 folds),0.551 +/- 0.018 (in 3 folds),0.245 +/- 0.086 (in 3 folds),0.55,0.101,0.522 +/- 0.016 (in 3 folds),0.211 +/- 0.076 (in 3 folds),...,Unknown,109,6,115,0.052174,False,,,,
rf_multiclass,0.524 +/- 0.035 (in 3 folds),0.524 +/- 0.035 (in 3 folds),0.540 +/- 0.143 (in 3 folds),0.540 +/- 0.143 (in 3 folds),0.528 +/- 0.078 (in 3 folds),0.148 +/- 0.066 (in 3 folds),0.548,0.101,0.401 +/- 0.199 (in 3 folds),0.112 +/- 0.088 (in 3 folds),...,Unknown,84,31,115,0.269565,False,,,,
rf_multiclass.decision_thresholds_tuned,0.524 +/- 0.035 (in 3 folds),0.524 +/- 0.035 (in 3 folds),0.540 +/- 0.143 (in 3 folds),0.540 +/- 0.143 (in 3 folds),0.528 +/- 0.078 (in 3 folds),0.148 +/- 0.066 (in 3 folds),0.548,0.101,0.401 +/- 0.199 (in 3 folds),0.112 +/- 0.088 (in 3 folds),...,Unknown,84,31,115,0.269565,False,,,,


2022-12-31 20:14:52,329 - malid.external.scratch_cache - INFO - Reading network file from local machine cache: /users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/embedded/unirep_fine_tuned/anndatas_scaled/TCR/fold.0.test.h5ad -> /srv/scratch/maximz/cache/a6c3ab8bb9960154ff8dbb5d04eaf7a1c395f034f82f9649aefc9d35.0.test.h5ad


Only considering the two last: ['.test', '.h5ad'].


Only considering the two last: ['.test', '.h5ad'].








2022-12-31 21:08:05,818 - malid.helpers - INFO - Target TargetObsColumnEnum.covid_vs_healthy: filtering to specimens from diseases ['Covid19', 'Healthy/Background'] only; removed 55 specimens




2022-12-31 21:25:44,602 - malid.helpers - INFO - Target TargetObsColumnEnum.hiv_vs_healthy: filtering to specimens from diseases ['HIV', 'Healthy/Background'] only; removed 41 specimens




2022-12-31 21:46:08,163 - malid.helpers - INFO - Target TargetObsColumnEnum.lupus_vs_healthy: filtering to specimens from diseases ['Lupus', 'Healthy/Background'] only; removed 52 specimens




2022-12-31 22:07:46,645 - malid.helpers - INFO - Target TargetObsColumnEnum.ethnicity_condensed_healthy_only: filtered to specimens with defined ethnicity_condensed column - removed 19 specimens (862171 rows)


2022-12-31 22:08:14,302 - malid.helpers - INFO - Target TargetObsColumnEnum.ethnicity_condensed_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 64 specimens




2022-12-31 22:23:16,861 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_healthy_only: filtered to specimens with defined age_group column - removed 1 specimens (6847 rows)


2022-12-31 22:23:47,089 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 73 specimens




2022-12-31 22:39:24,527 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_binary_healthy_only: filtered to specimens with defined age_group_binary column - removed 1 specimens (6847 rows)


2022-12-31 22:39:54,627 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_binary_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 73 specimens




2022-12-31 22:54:40,550 - malid.helpers - INFO - Target TargetObsColumnEnum.sex_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 74 specimens


2022-12-31 23:07:44,192 - malid.external.scratch_cache - INFO - Reading network file from local machine cache: /users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/embedded/unirep_fine_tuned/anndatas_scaled/TCR/fold.1.test.h5ad -> /srv/scratch/maximz/cache/d3eb18b805f6482478ad1ee75a5249a449864d796469d3e144db1326.1.test.h5ad


Only considering the two last: ['.test', '.h5ad'].


Only considering the two last: ['.test', '.h5ad'].








2022-12-31 23:57:41,171 - malid.helpers - INFO - Target TargetObsColumnEnum.covid_vs_healthy: filtering to specimens from diseases ['Covid19', 'Healthy/Background'] only; removed 54 specimens




2023-01-01 00:15:14,902 - malid.helpers - INFO - Target TargetObsColumnEnum.hiv_vs_healthy: filtering to specimens from diseases ['HIV', 'Healthy/Background'] only; removed 41 specimens




2023-01-01 00:35:12,634 - malid.helpers - INFO - Target TargetObsColumnEnum.lupus_vs_healthy: filtering to specimens from diseases ['Lupus', 'Healthy/Background'] only; removed 53 specimens




2023-01-01 00:55:47,116 - malid.helpers - INFO - Target TargetObsColumnEnum.ethnicity_condensed_healthy_only: filtered to specimens with defined ethnicity_condensed column - removed 20 specimens (891618 rows)


2023-01-01 00:56:13,207 - malid.helpers - INFO - Target TargetObsColumnEnum.ethnicity_condensed_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 69 specimens




2023-01-01 01:10:50,757 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_healthy_only: filtered to specimens with defined age_group column - removed 1 specimens (11386 rows)


2023-01-01 01:11:23,861 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 73 specimens




2023-01-01 01:25:33,601 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_binary_healthy_only: filtered to specimens with defined age_group_binary column - removed 1 specimens (11386 rows)


2023-01-01 01:26:06,272 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_binary_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 73 specimens




2023-01-01 01:39:51,380 - malid.helpers - INFO - Target TargetObsColumnEnum.sex_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 74 specimens


2023-01-01 01:51:56,165 - malid.external.scratch_cache - INFO - Reading network file from local machine cache: /users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/embedded/unirep_fine_tuned/anndatas_scaled/TCR/fold.2.test.h5ad -> /srv/scratch/maximz/cache/d74a0f1a51ad1e35ec4654f627621ecdc4abf48e3481e399db8af384.2.test.h5ad


Only considering the two last: ['.test', '.h5ad'].


Only considering the two last: ['.test', '.h5ad'].








2023-01-01 02:56:24,458 - malid.helpers - INFO - Target TargetObsColumnEnum.covid_vs_healthy: filtering to specimens from diseases ['Covid19', 'Healthy/Background'] only; removed 53 specimens




2023-01-01 03:13:39,643 - malid.helpers - INFO - Target TargetObsColumnEnum.hiv_vs_healthy: filtering to specimens from diseases ['HIV', 'Healthy/Background'] only; removed 40 specimens




2023-01-01 03:33:35,924 - malid.helpers - INFO - Target TargetObsColumnEnum.lupus_vs_healthy: filtering to specimens from diseases ['Lupus', 'Healthy/Background'] only; removed 51 specimens




2023-01-01 03:54:02,569 - malid.helpers - INFO - Target TargetObsColumnEnum.ethnicity_condensed_healthy_only: filtered to specimens with defined ethnicity_condensed column - removed 14 specimens (388281 rows)


2023-01-01 03:54:44,231 - malid.helpers - INFO - Target TargetObsColumnEnum.ethnicity_condensed_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 62 specimens




2023-01-01 04:13:23,142 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_healthy_only: filtered to specimens with defined age_group column - removed 2 specimens (96214 rows)


2023-01-01 04:13:54,268 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 71 specimens




2023-01-01 04:29:59,322 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_binary_healthy_only: filtered to specimens with defined age_group_binary column - removed 2 specimens (96214 rows)


2023-01-01 04:30:28,081 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_binary_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 71 specimens




2023-01-01 04:46:19,300 - malid.helpers - INFO - Target TargetObsColumnEnum.sex_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 72 specimens


GeneLocus.TCR TargetObsColumnEnum.disease --> /users/maximz/code/boyd-immune-repertoire-classification/out/convergent_clusters/TCR/disease


Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,Global evaluation column name global,Accuracy per fold with abstention,...,Accuracy global with abstention,MCC global with abstention,Unknown/abstention proportion global with abstention,Abstention label global with abstention,Global evaluation column name global with abstention,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
ridge_cv,0.894 +/- 0.019 (in 3 folds),0.905 +/- 0.018 (in 3 folds),0.871 +/- 0.026 (in 3 folds),0.889 +/- 0.024 (in 3 folds),0.534 +/- 0.081 (in 3 folds),0.214 +/- 0.215 (in 3 folds),0.534,0.264,disease.separate_past_exposures,,...,,,,,,414,0,414,0.0,False
ridge_cv.decision_thresholds_tuned,0.894 +/- 0.019 (in 3 folds),0.905 +/- 0.018 (in 3 folds),0.871 +/- 0.026 (in 3 folds),0.889 +/- 0.024 (in 3 folds),0.674 +/- 0.060 (in 3 folds),0.555 +/- 0.088 (in 3 folds),0.674,0.549,disease.separate_past_exposures,,...,,,,,,414,0,414,0.0,False
linearsvm_ovr,0.893 +/- 0.012 (in 3 folds),0.896 +/- 0.014 (in 3 folds),0.894 +/- 0.015 (in 3 folds),0.902 +/- 0.015 (in 3 folds),0.713 +/- 0.022 (in 3 folds),0.577 +/- 0.028 (in 3 folds),0.713,0.574,disease.separate_past_exposures,,...,,,,,,414,0,414,0.0,False
linearsvm_ovr.decision_thresholds_tuned,0.893 +/- 0.012 (in 3 folds),0.896 +/- 0.014 (in 3 folds),0.894 +/- 0.015 (in 3 folds),0.902 +/- 0.015 (in 3 folds),0.722 +/- 0.025 (in 3 folds),0.613 +/- 0.038 (in 3 folds),0.722,0.607,disease.separate_past_exposures,,...,,,,,,414,0,414,0.0,False
lasso_multiclass,0.885 +/- 0.005 (in 3 folds),0.886 +/- 0.004 (in 3 folds),0.879 +/- 0.011 (in 3 folds),0.884 +/- 0.011 (in 3 folds),0.702 +/- 0.016 (in 3 folds),0.575 +/- 0.023 (in 3 folds),0.702,0.569,disease.separate_past_exposures,0.701 +/- 0.017 (in 3 folds),...,0.7,0.567,0.002,Unknown,disease.separate_past_exposures,413,1,414,0.002415,False
lasso_multiclass.decision_thresholds_tuned,0.885 +/- 0.005 (in 3 folds),0.886 +/- 0.004 (in 3 folds),0.879 +/- 0.011 (in 3 folds),0.884 +/- 0.011 (in 3 folds),0.724 +/- 0.036 (in 3 folds),0.612 +/- 0.045 (in 3 folds),0.724,0.61,disease.separate_past_exposures,0.723 +/- 0.038 (in 3 folds),...,0.722,0.607,0.002,Unknown,disease.separate_past_exposures,413,1,414,0.002415,False
xgboost,0.883 +/- 0.003 (in 3 folds),0.882 +/- 0.005 (in 3 folds),0.876 +/- 0.008 (in 3 folds),0.880 +/- 0.006 (in 3 folds),0.714 +/- 0.011 (in 3 folds),0.572 +/- 0.015 (in 3 folds),0.714,0.571,disease.separate_past_exposures,0.713 +/- 0.012 (in 3 folds),...,0.713,0.569,0.002,Unknown,disease.separate_past_exposures,413,1,414,0.002415,False
xgboost.decision_thresholds_tuned,0.883 +/- 0.003 (in 3 folds),0.882 +/- 0.005 (in 3 folds),0.876 +/- 0.008 (in 3 folds),0.880 +/- 0.006 (in 3 folds),0.705 +/- 0.030 (in 3 folds),0.568 +/- 0.041 (in 3 folds),0.705,0.566,disease.separate_past_exposures,0.703 +/- 0.030 (in 3 folds),...,0.703,0.564,0.002,Unknown,disease.separate_past_exposures,413,1,414,0.002415,False
rf_multiclass,0.881 +/- 0.011 (in 3 folds),0.882 +/- 0.010 (in 3 folds),0.873 +/- 0.012 (in 3 folds),0.877 +/- 0.010 (in 3 folds),0.705 +/- 0.048 (in 3 folds),0.558 +/- 0.077 (in 3 folds),0.705,0.554,disease.separate_past_exposures,0.703 +/- 0.048 (in 3 folds),...,0.703,0.552,0.002,Unknown,disease.separate_past_exposures,413,1,414,0.002415,False
rf_multiclass.decision_thresholds_tuned,0.881 +/- 0.011 (in 3 folds),0.882 +/- 0.010 (in 3 folds),0.873 +/- 0.012 (in 3 folds),0.877 +/- 0.010 (in 3 folds),0.717 +/- 0.048 (in 3 folds),0.585 +/- 0.074 (in 3 folds),0.717,0.583,disease.separate_past_exposures,0.715 +/- 0.049 (in 3 folds),...,0.715,0.581,0.002,Unknown,disease.separate_past_exposures,413,1,414,0.002415,False


/users/maximz/code/boyd-immune-repertoire-classification/out/convergent_clusters/TCR/disease/train_smaller_model.compare_model_scores.test_set_performance.tsv


GeneLocus.TCR TargetObsColumnEnum.disease_all_demographics_present --> /users/maximz/code/boyd-immune-repertoire-classification/out/convergent_clusters/TCR/disease_all_demographics_present


Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,Global evaluation column name global,Accuracy per fold with abstention,...,Accuracy global with abstention,MCC global with abstention,Unknown/abstention proportion global with abstention,Abstention label global with abstention,Global evaluation column name global with abstention,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
lasso_cv,0.879 +/- 0.020 (in 3 folds),0.882 +/- 0.025 (in 3 folds),0.850 +/- 0.023 (in 3 folds),0.858 +/- 0.030 (in 3 folds),0.615 +/- 0.079 (in 3 folds),0.411 +/- 0.098 (in 3 folds),0.615,0.407,disease.separate_past_exposures,0.611 +/- 0.077 (in 3 folds),...,0.612,0.404,0.006,Unknown,disease.separate_past_exposures,356,2,358,0.005587,False
lasso_cv.decision_thresholds_tuned,0.879 +/- 0.020 (in 3 folds),0.882 +/- 0.025 (in 3 folds),0.850 +/- 0.023 (in 3 folds),0.858 +/- 0.030 (in 3 folds),0.635 +/- 0.091 (in 3 folds),0.474 +/- 0.156 (in 3 folds),0.635,0.461,disease.separate_past_exposures,0.631 +/- 0.086 (in 3 folds),...,0.631,0.458,0.006,Unknown,disease.separate_past_exposures,356,2,358,0.005587,False
lasso_multiclass,0.876 +/- 0.016 (in 3 folds),0.877 +/- 0.017 (in 3 folds),0.859 +/- 0.025 (in 3 folds),0.865 +/- 0.030 (in 3 folds),0.682 +/- 0.044 (in 3 folds),0.550 +/- 0.050 (in 3 folds),0.683,0.548,disease.separate_past_exposures,0.679 +/- 0.047 (in 3 folds),...,0.679,0.544,0.006,Unknown,disease.separate_past_exposures,356,2,358,0.005587,False
lasso_multiclass.decision_thresholds_tuned,0.876 +/- 0.016 (in 3 folds),0.877 +/- 0.017 (in 3 folds),0.859 +/- 0.025 (in 3 folds),0.865 +/- 0.030 (in 3 folds),0.691 +/- 0.046 (in 3 folds),0.560 +/- 0.052 (in 3 folds),0.691,0.558,disease.separate_past_exposures,0.687 +/- 0.048 (in 3 folds),...,0.687,0.553,0.006,Unknown,disease.separate_past_exposures,356,2,358,0.005587,False
linearsvm_ovr,0.875 +/- 0.018 (in 3 folds),0.873 +/- 0.018 (in 3 folds),0.857 +/- 0.024 (in 3 folds),0.861 +/- 0.029 (in 3 folds),0.682 +/- 0.053 (in 3 folds),0.542 +/- 0.064 (in 3 folds),0.683,0.538,disease.separate_past_exposures,0.678 +/- 0.053 (in 3 folds),...,0.679,0.534,0.006,Unknown,disease.separate_past_exposures,356,2,358,0.005587,False
linearsvm_ovr.decision_thresholds_tuned,0.875 +/- 0.018 (in 3 folds),0.873 +/- 0.018 (in 3 folds),0.857 +/- 0.024 (in 3 folds),0.861 +/- 0.029 (in 3 folds),0.688 +/- 0.050 (in 3 folds),0.556 +/- 0.057 (in 3 folds),0.688,0.554,disease.separate_past_exposures,0.684 +/- 0.051 (in 3 folds),...,0.684,0.55,0.006,Unknown,disease.separate_past_exposures,356,2,358,0.005587,False
ridge_cv,0.874 +/- 0.028 (in 3 folds),0.879 +/- 0.032 (in 3 folds),0.836 +/- 0.031 (in 3 folds),0.847 +/- 0.038 (in 3 folds),0.519 +/- 0.123 (in 3 folds),0.155 +/- 0.269 (in 3 folds),0.52,0.24,disease.separate_past_exposures,0.516 +/- 0.125 (in 3 folds),...,0.517,0.238,0.006,Unknown,disease.separate_past_exposures,356,2,358,0.005587,False
ridge_cv.decision_thresholds_tuned,0.874 +/- 0.028 (in 3 folds),0.879 +/- 0.032 (in 3 folds),0.836 +/- 0.031 (in 3 folds),0.847 +/- 0.038 (in 3 folds),0.502 +/- 0.233 (in 3 folds),0.312 +/- 0.287 (in 3 folds),0.503,0.334,disease.separate_past_exposures,0.499 +/- 0.231 (in 3 folds),...,0.5,0.33,0.006,Unknown,disease.separate_past_exposures,356,2,358,0.005587,False
rf_multiclass,0.874 +/- 0.009 (in 3 folds),0.874 +/- 0.011 (in 3 folds),0.853 +/- 0.017 (in 3 folds),0.858 +/- 0.022 (in 3 folds),0.680 +/- 0.039 (in 3 folds),0.530 +/- 0.046 (in 3 folds),0.68,0.527,disease.separate_past_exposures,0.676 +/- 0.037 (in 3 folds),...,0.676,0.524,0.006,Unknown,disease.separate_past_exposures,356,2,358,0.005587,False
rf_multiclass.decision_thresholds_tuned,0.874 +/- 0.009 (in 3 folds),0.874 +/- 0.011 (in 3 folds),0.853 +/- 0.017 (in 3 folds),0.858 +/- 0.022 (in 3 folds),0.691 +/- 0.030 (in 3 folds),0.564 +/- 0.032 (in 3 folds),0.691,0.561,disease.separate_past_exposures,0.687 +/- 0.034 (in 3 folds),...,0.687,0.557,0.006,Unknown,disease.separate_past_exposures,356,2,358,0.005587,False


/users/maximz/code/boyd-immune-repertoire-classification/out/convergent_clusters/TCR/disease_all_demographics_present/train_smaller_model.compare_model_scores.test_set_performance.tsv


GeneLocus.TCR TargetObsColumnEnum.covid_vs_healthy --> /users/maximz/code/boyd-immune-repertoire-classification/out/convergent_clusters/TCR/covid_vs_healthy


Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,Global evaluation column name global,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
lasso_multiclass,0.955 +/- 0.002 (in 3 folds),0.955 +/- 0.002 (in 3 folds),0.987 +/- 0.001 (in 3 folds),0.987 +/- 0.001 (in 3 folds),0.893 +/- 0.013 (in 3 folds),0.729 +/- 0.048 (in 3 folds),0.893,0.726,disease.separate_past_exposures,252,0,252,0.0,False
lasso_multiclass.decision_thresholds_tuned,0.955 +/- 0.002 (in 3 folds),0.955 +/- 0.002 (in 3 folds),0.987 +/- 0.001 (in 3 folds),0.987 +/- 0.001 (in 3 folds),0.897 +/- 0.008 (in 3 folds),0.759 +/- 0.009 (in 3 folds),0.897,0.755,disease.separate_past_exposures,252,0,252,0.0,False
linearsvm_ovr,0.955 +/- 0.001 (in 3 folds),0.955 +/- 0.001 (in 3 folds),0.988 +/- 0.001 (in 3 folds),0.988 +/- 0.001 (in 3 folds),0.881 +/- 0.025 (in 3 folds),0.720 +/- 0.025 (in 3 folds),0.881,0.715,disease.separate_past_exposures,252,0,252,0.0,False
linearsvm_ovr.decision_thresholds_tuned,0.955 +/- 0.001 (in 3 folds),0.955 +/- 0.001 (in 3 folds),0.988 +/- 0.001 (in 3 folds),0.988 +/- 0.001 (in 3 folds),0.889 +/- 0.015 (in 3 folds),0.720 +/- 0.031 (in 3 folds),0.889,0.718,disease.separate_past_exposures,252,0,252,0.0,False
xgboost,0.953 +/- 0.009 (in 3 folds),0.953 +/- 0.009 (in 3 folds),0.985 +/- 0.003 (in 3 folds),0.985 +/- 0.003 (in 3 folds),0.889 +/- 0.029 (in 3 folds),0.675 +/- 0.085 (in 3 folds),0.889,0.674,disease.separate_past_exposures,252,0,252,0.0,False
xgboost.decision_thresholds_tuned,0.953 +/- 0.009 (in 3 folds),0.953 +/- 0.009 (in 3 folds),0.985 +/- 0.003 (in 3 folds),0.985 +/- 0.003 (in 3 folds),0.877 +/- 0.017 (in 3 folds),0.671 +/- 0.075 (in 3 folds),0.877,0.669,disease.separate_past_exposures,252,0,252,0.0,False
ridge_cv,0.952 +/- 0.012 (in 3 folds),0.952 +/- 0.012 (in 3 folds),0.987 +/- 0.003 (in 3 folds),0.987 +/- 0.003 (in 3 folds),0.770 +/- 0.005 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.77,0.0,disease.separate_past_exposures,252,0,252,0.0,True
ridge_cv.decision_thresholds_tuned,0.952 +/- 0.012 (in 3 folds),0.952 +/- 0.012 (in 3 folds),0.987 +/- 0.003 (in 3 folds),0.987 +/- 0.003 (in 3 folds),0.825 +/- 0.091 (in 3 folds),0.274 +/- 0.475 (in 3 folds),0.825,0.433,disease.separate_past_exposures,252,0,252,0.0,False
lasso_cv,0.951 +/- 0.013 (in 3 folds),0.951 +/- 0.013 (in 3 folds),0.987 +/- 0.003 (in 3 folds),0.987 +/- 0.003 (in 3 folds),0.826 +/- 0.057 (in 3 folds),0.411 +/- 0.244 (in 3 folds),0.825,0.434,disease.separate_past_exposures,252,0,252,0.0,False
lasso_cv.decision_thresholds_tuned,0.951 +/- 0.013 (in 3 folds),0.951 +/- 0.013 (in 3 folds),0.987 +/- 0.003 (in 3 folds),0.987 +/- 0.003 (in 3 folds),0.909 +/- 0.019 (in 3 folds),0.791 +/- 0.030 (in 3 folds),0.909,0.789,disease.separate_past_exposures,252,0,252,0.0,False


/users/maximz/code/boyd-immune-repertoire-classification/out/convergent_clusters/TCR/covid_vs_healthy/train_smaller_model.compare_model_scores.test_set_performance.tsv


GeneLocus.TCR TargetObsColumnEnum.hiv_vs_healthy --> /users/maximz/code/boyd-immune-repertoire-classification/out/convergent_clusters/TCR/hiv_vs_healthy


Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,Global evaluation column name global,Accuracy per fold with abstention,...,Accuracy global with abstention,MCC global with abstention,Unknown/abstention proportion global with abstention,Abstention label global with abstention,Global evaluation column name global with abstention,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
linearsvm_ovr,0.894 +/- 0.048 (in 3 folds),0.894 +/- 0.048 (in 3 folds),0.953 +/- 0.021 (in 3 folds),0.953 +/- 0.021 (in 3 folds),0.780 +/- 0.017 (in 3 folds),0.518 +/- 0.070 (in 3 folds),0.78,0.488,disease.separate_past_exposures,0.777 +/- 0.015 (in 3 folds),...,0.777,0.485,0.003,Unknown,disease.separate_past_exposures,291,1,292,0.003425,False
linearsvm_ovr.decision_thresholds_tuned,0.894 +/- 0.048 (in 3 folds),0.894 +/- 0.048 (in 3 folds),0.953 +/- 0.021 (in 3 folds),0.953 +/- 0.021 (in 3 folds),0.787 +/- 0.071 (in 3 folds),0.611 +/- 0.067 (in 3 folds),0.787,0.585,disease.separate_past_exposures,0.785 +/- 0.072 (in 3 folds),...,0.784,0.58,0.003,Unknown,disease.separate_past_exposures,291,1,292,0.003425,False
lasso_cv,0.890 +/- 0.031 (in 3 folds),0.890 +/- 0.031 (in 3 folds),0.950 +/- 0.014 (in 3 folds),0.950 +/- 0.014 (in 3 folds),0.774 +/- 0.039 (in 3 folds),0.468 +/- 0.102 (in 3 folds),0.774,0.466,disease.separate_past_exposures,,...,,,,,,292,0,292,0.0,False
lasso_cv.decision_thresholds_tuned,0.890 +/- 0.031 (in 3 folds),0.890 +/- 0.031 (in 3 folds),0.950 +/- 0.014 (in 3 folds),0.950 +/- 0.014 (in 3 folds),0.785 +/- 0.091 (in 3 folds),0.591 +/- 0.121 (in 3 folds),0.784,0.565,disease.separate_past_exposures,,...,,,,,,292,0,292,0.0,False
elasticnet_cv,0.887 +/- 0.035 (in 3 folds),0.887 +/- 0.035 (in 3 folds),0.949 +/- 0.016 (in 3 folds),0.949 +/- 0.016 (in 3 folds),0.781 +/- 0.041 (in 3 folds),0.482 +/- 0.109 (in 3 folds),0.781,0.483,disease.separate_past_exposures,,...,,,,,,292,0,292,0.0,False
elasticnet_cv.decision_thresholds_tuned,0.887 +/- 0.035 (in 3 folds),0.887 +/- 0.035 (in 3 folds),0.949 +/- 0.016 (in 3 folds),0.949 +/- 0.016 (in 3 folds),0.785 +/- 0.086 (in 3 folds),0.586 +/- 0.129 (in 3 folds),0.784,0.561,disease.separate_past_exposures,,...,,,,,,292,0,292,0.0,False
lasso_multiclass,0.883 +/- 0.026 (in 3 folds),0.883 +/- 0.026 (in 3 folds),0.949 +/- 0.015 (in 3 folds),0.949 +/- 0.015 (in 3 folds),0.790 +/- 0.042 (in 3 folds),0.541 +/- 0.051 (in 3 folds),0.791,0.528,disease.separate_past_exposures,0.778 +/- 0.064 (in 3 folds),...,0.777,0.51,0.017,Unknown,disease.separate_past_exposures,287,5,292,0.017123,False
lasso_multiclass.decision_thresholds_tuned,0.883 +/- 0.026 (in 3 folds),0.883 +/- 0.026 (in 3 folds),0.949 +/- 0.015 (in 3 folds),0.949 +/- 0.015 (in 3 folds),0.784 +/- 0.046 (in 3 folds),0.548 +/- 0.111 (in 3 folds),0.784,0.543,disease.separate_past_exposures,0.771 +/- 0.065 (in 3 folds),...,0.771,0.524,0.017,Unknown,disease.separate_past_exposures,287,5,292,0.017123,False
ridge_cv,0.848 +/- 0.065 (in 3 folds),0.848 +/- 0.065 (in 3 folds),0.930 +/- 0.030 (in 3 folds),0.930 +/- 0.030 (in 3 folds),0.677 +/- 0.019 (in 3 folds),0.075 +/- 0.129 (in 3 folds),0.677,0.117,disease.separate_past_exposures,0.661 +/- 0.007 (in 3 folds),...,0.661,0.115,0.024,Unknown,disease.separate_past_exposures,285,7,292,0.023973,False
ridge_cv.decision_thresholds_tuned,0.848 +/- 0.065 (in 3 folds),0.848 +/- 0.065 (in 3 folds),0.930 +/- 0.030 (in 3 folds),0.930 +/- 0.030 (in 3 folds),0.685 +/- 0.031 (in 3 folds),0.132 +/- 0.229 (in 3 folds),0.684,0.183,disease.separate_past_exposures,0.668 +/- 0.015 (in 3 folds),...,0.668,0.177,0.024,Unknown,disease.separate_past_exposures,285,7,292,0.023973,False


/users/maximz/code/boyd-immune-repertoire-classification/out/convergent_clusters/TCR/hiv_vs_healthy/train_smaller_model.compare_model_scores.test_set_performance.tsv


GeneLocus.TCR TargetObsColumnEnum.lupus_vs_healthy --> /users/maximz/code/boyd-immune-repertoire-classification/out/convergent_clusters/TCR/lupus_vs_healthy


Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,Global evaluation column name global,Accuracy per fold with abstention,...,Global evaluation column name global with abstention,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes,ROC-AUC (weighted OvO) per fold with abstention,ROC-AUC (macro OvO) per fold with abstention,au-PRC (weighted OvO) per fold with abstention,au-PRC (macro OvO) per fold with abstention
rf_multiclass,0.871 +/- 0.044 (in 3 folds),0.871 +/- 0.044 (in 3 folds),0.754 +/- 0.084 (in 3 folds),0.754 +/- 0.084 (in 3 folds),0.850 +/- 0.010 (in 3 folds),0.592 +/- 0.047 (in 3 folds),0.85,0.587,disease.separate_past_exposures,0.837 +/- 0.022 (in 3 folds),...,disease.separate_past_exposures,254,4,258,0.015504,False,0.889 +/- 0.000 (in 1 folds),0.889 +/- 0.000 (in 1 folds),0.778 +/- 0.000 (in 1 folds),0.778 +/- 0.000 (in 1 folds)
rf_multiclass.decision_thresholds_tuned,0.871 +/- 0.044 (in 3 folds),0.871 +/- 0.044 (in 3 folds),0.754 +/- 0.084 (in 3 folds),0.754 +/- 0.084 (in 3 folds),0.838 +/- 0.029 (in 3 folds),0.550 +/- 0.135 (in 3 folds),0.839,0.548,disease.separate_past_exposures,0.825 +/- 0.042 (in 3 folds),...,disease.separate_past_exposures,254,4,258,0.015504,False,0.889 +/- 0.000 (in 1 folds),0.889 +/- 0.000 (in 1 folds),0.778 +/- 0.000 (in 1 folds),0.778 +/- 0.000 (in 1 folds)
xgboost,0.868 +/- 0.039 (in 3 folds),0.868 +/- 0.039 (in 3 folds),0.746 +/- 0.070 (in 3 folds),0.746 +/- 0.070 (in 3 folds),0.824 +/- 0.019 (in 3 folds),0.501 +/- 0.031 (in 3 folds),0.824,0.492,disease.separate_past_exposures,0.814 +/- 0.022 (in 3 folds),...,disease.separate_past_exposures,255,3,258,0.011628,False,0.889 +/- 0.023 (in 2 folds),0.889 +/- 0.023 (in 2 folds),0.786 +/- 0.013 (in 2 folds),0.786 +/- 0.013 (in 2 folds)
xgboost.decision_thresholds_tuned,0.868 +/- 0.039 (in 3 folds),0.868 +/- 0.039 (in 3 folds),0.746 +/- 0.070 (in 3 folds),0.746 +/- 0.070 (in 3 folds),0.842 +/- 0.035 (in 3 folds),0.539 +/- 0.121 (in 3 folds),0.843,0.546,disease.separate_past_exposures,0.833 +/- 0.050 (in 3 folds),...,disease.separate_past_exposures,255,3,258,0.011628,False,0.889 +/- 0.023 (in 2 folds),0.889 +/- 0.023 (in 2 folds),0.786 +/- 0.013 (in 2 folds),0.786 +/- 0.013 (in 2 folds)
elasticnet_cv,0.838 +/- 0.023 (in 3 folds),0.838 +/- 0.023 (in 3 folds),0.726 +/- 0.079 (in 3 folds),0.726 +/- 0.079 (in 3 folds),0.766 +/- 0.019 (in 3 folds),0.181 +/- 0.156 (in 3 folds),0.766,0.218,disease.separate_past_exposures,0.760 +/- 0.022 (in 3 folds),...,disease.separate_past_exposures,256,2,258,0.007752,False,0.827 +/- 0.000 (in 1 folds),0.827 +/- 0.000 (in 1 folds),0.652 +/- 0.000 (in 1 folds),0.652 +/- 0.000 (in 1 folds)
elasticnet_cv.decision_thresholds_tuned,0.838 +/- 0.023 (in 3 folds),0.838 +/- 0.023 (in 3 folds),0.726 +/- 0.079 (in 3 folds),0.726 +/- 0.079 (in 3 folds),0.805 +/- 0.070 (in 3 folds),0.497 +/- 0.144 (in 3 folds),0.805,0.479,disease.separate_past_exposures,0.798 +/- 0.065 (in 3 folds),...,disease.separate_past_exposures,256,2,258,0.007752,False,0.827 +/- 0.000 (in 1 folds),0.827 +/- 0.000 (in 1 folds),0.652 +/- 0.000 (in 1 folds),0.652 +/- 0.000 (in 1 folds)
lasso_cv,0.837 +/- 0.032 (in 3 folds),0.837 +/- 0.032 (in 3 folds),0.736 +/- 0.078 (in 3 folds),0.736 +/- 0.078 (in 3 folds),0.820 +/- 0.042 (in 3 folds),0.457 +/- 0.143 (in 3 folds),0.82,0.461,disease.separate_past_exposures,0.810 +/- 0.027 (in 3 folds),...,disease.separate_past_exposures,255,3,258,0.011628,False,0.848 +/- 0.038 (in 2 folds),0.848 +/- 0.038 (in 2 folds),0.733 +/- 0.111 (in 2 folds),0.733 +/- 0.111 (in 2 folds)
lasso_cv.decision_thresholds_tuned,0.837 +/- 0.032 (in 3 folds),0.837 +/- 0.032 (in 3 folds),0.736 +/- 0.078 (in 3 folds),0.736 +/- 0.078 (in 3 folds),0.824 +/- 0.079 (in 3 folds),0.538 +/- 0.158 (in 3 folds),0.824,0.509,disease.separate_past_exposures,0.814 +/- 0.073 (in 3 folds),...,disease.separate_past_exposures,255,3,258,0.011628,False,0.848 +/- 0.038 (in 2 folds),0.848 +/- 0.038 (in 2 folds),0.733 +/- 0.111 (in 2 folds),0.733 +/- 0.111 (in 2 folds)
lasso_multiclass,0.835 +/- 0.027 (in 3 folds),0.835 +/- 0.027 (in 3 folds),0.709 +/- 0.105 (in 3 folds),0.709 +/- 0.105 (in 3 folds),0.830 +/- 0.041 (in 3 folds),0.552 +/- 0.085 (in 3 folds),0.83,0.548,disease.separate_past_exposures,0.814 +/- 0.051 (in 3 folds),...,disease.separate_past_exposures,253,5,258,0.01938,False,,,,
lasso_multiclass.decision_thresholds_tuned,0.835 +/- 0.027 (in 3 folds),0.835 +/- 0.027 (in 3 folds),0.709 +/- 0.105 (in 3 folds),0.709 +/- 0.105 (in 3 folds),0.830 +/- 0.030 (in 3 folds),0.524 +/- 0.079 (in 3 folds),0.83,0.524,disease.separate_past_exposures,0.814 +/- 0.040 (in 3 folds),...,disease.separate_past_exposures,253,5,258,0.01938,False,,,,


/users/maximz/code/boyd-immune-repertoire-classification/out/convergent_clusters/TCR/lupus_vs_healthy/train_smaller_model.compare_model_scores.test_set_performance.tsv


GeneLocus.TCR TargetObsColumnEnum.ethnicity_condensed_healthy_only --> /users/maximz/code/boyd-immune-repertoire-classification/out/convergent_clusters/TCR/ethnicity_condensed_healthy_only


Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,Accuracy per fold with abstention,MCC per fold with abstention,...,au-PRC (macro OvO) per fold with abstention,Accuracy global with abstention,MCC global with abstention,Unknown/abstention proportion global with abstention,Abstention label global with abstention,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
lasso_multiclass,0.671 +/- 0.043 (in 3 folds),0.676 +/- 0.028 (in 3 folds),0.706 +/- 0.049 (in 3 folds),0.703 +/- 0.055 (in 3 folds),0.674 +/- 0.078 (in 3 folds),0.395 +/- 0.083 (in 3 folds),0.677,0.394,0.670 +/- 0.082 (in 3 folds),0.391 +/- 0.091 (in 3 folds),...,0.724 +/- 0.059 (in 2 folds),0.673,0.389,0.006,Unknown,164,1,165,0.006061,True
lasso_multiclass.decision_thresholds_tuned,0.671 +/- 0.043 (in 3 folds),0.676 +/- 0.028 (in 3 folds),0.706 +/- 0.049 (in 3 folds),0.703 +/- 0.055 (in 3 folds),0.632 +/- 0.101 (in 3 folds),0.331 +/- 0.119 (in 3 folds),0.634,0.321,0.629 +/- 0.106 (in 3 folds),0.332 +/- 0.117 (in 3 folds),...,0.724 +/- 0.059 (in 2 folds),0.63,0.32,0.006,Unknown,164,1,165,0.006061,True
lasso_cv,0.635 +/- 0.047 (in 3 folds),0.673 +/- 0.041 (in 3 folds),0.676 +/- 0.041 (in 3 folds),0.693 +/- 0.040 (in 3 folds),0.666 +/- 0.018 (in 3 folds),0.292 +/- 0.257 (in 3 folds),0.667,0.375,0.632 +/- 0.068 (in 3 folds),0.222 +/- 0.263 (in 3 folds),...,0.688 +/- 0.000 (in 1 folds),0.63,0.284,0.055,Unknown,156,9,165,0.054545,True
lasso_cv.decision_thresholds_tuned,0.635 +/- 0.047 (in 3 folds),0.673 +/- 0.041 (in 3 folds),0.676 +/- 0.041 (in 3 folds),0.693 +/- 0.040 (in 3 folds),0.644 +/- 0.051 (in 3 folds),0.375 +/- 0.147 (in 3 folds),0.641,0.323,0.609 +/- 0.061 (in 3 folds),0.313 +/- 0.146 (in 3 folds),...,0.688 +/- 0.000 (in 1 folds),0.606,0.278,0.055,Unknown,156,9,165,0.054545,True
elasticnet_cv,0.629 +/- 0.034 (in 3 folds),0.636 +/- 0.034 (in 3 folds),0.675 +/- 0.019 (in 3 folds),0.671 +/- 0.009 (in 3 folds),0.635 +/- 0.050 (in 3 folds),0.227 +/- 0.203 (in 3 folds),0.637,0.285,0.604 +/- 0.066 (in 3 folds),0.171 +/- 0.152 (in 3 folds),...,0.672 +/- 0.013 (in 2 folds),0.606,0.203,0.048,Unknown,157,8,165,0.048485,True
elasticnet_cv.decision_thresholds_tuned,0.629 +/- 0.034 (in 3 folds),0.636 +/- 0.034 (in 3 folds),0.675 +/- 0.019 (in 3 folds),0.671 +/- 0.009 (in 3 folds),0.666 +/- 0.040 (in 3 folds),0.367 +/- 0.058 (in 3 folds),0.669,0.37,0.635 +/- 0.079 (in 3 folds),0.312 +/- 0.093 (in 3 folds),...,0.672 +/- 0.013 (in 2 folds),0.636,0.32,0.048,Unknown,157,8,165,0.048485,True
linearsvm_ovr,0.622 +/- 0.028 (in 3 folds),0.623 +/- 0.036 (in 3 folds),0.669 +/- 0.009 (in 3 folds),0.660 +/- 0.018 (in 3 folds),0.669 +/- 0.098 (in 3 folds),0.389 +/- 0.112 (in 3 folds),0.675,0.381,0.662 +/- 0.105 (in 3 folds),0.372 +/- 0.129 (in 3 folds),...,0.671 +/- 0.000 (in 1 folds),0.667,0.362,0.012,Unknown,163,2,165,0.012121,True
linearsvm_ovr.decision_thresholds_tuned,0.622 +/- 0.028 (in 3 folds),0.623 +/- 0.036 (in 3 folds),0.669 +/- 0.009 (in 3 folds),0.660 +/- 0.018 (in 3 folds),0.635 +/- 0.068 (in 3 folds),0.334 +/- 0.067 (in 3 folds),0.638,0.304,0.628 +/- 0.074 (in 3 folds),0.318 +/- 0.062 (in 3 folds),...,0.671 +/- 0.000 (in 1 folds),0.63,0.296,0.012,Unknown,163,2,165,0.012121,True
rf_multiclass,0.606 +/- 0.054 (in 3 folds),0.612 +/- 0.042 (in 3 folds),0.630 +/- 0.020 (in 3 folds),0.620 +/- 0.006 (in 3 folds),0.674 +/- 0.038 (in 3 folds),0.374 +/- 0.085 (in 3 folds),0.675,0.382,0.652 +/- 0.052 (in 3 folds),0.341 +/- 0.042 (in 3 folds),...,0.622 +/- 0.000 (in 1 folds),0.655,0.342,0.03,Unknown,160,5,165,0.030303,True
rf_multiclass.decision_thresholds_tuned,0.606 +/- 0.054 (in 3 folds),0.612 +/- 0.042 (in 3 folds),0.630 +/- 0.020 (in 3 folds),0.620 +/- 0.006 (in 3 folds),0.499 +/- 0.271 (in 3 folds),0.306 +/- 0.189 (in 3 folds),0.481,0.152,0.477 +/- 0.252 (in 3 folds),0.274 +/- 0.153 (in 3 folds),...,0.622 +/- 0.000 (in 1 folds),0.467,0.146,0.03,Unknown,160,5,165,0.030303,False


/users/maximz/code/boyd-immune-repertoire-classification/out/convergent_clusters/TCR/ethnicity_condensed_healthy_only/train_smaller_model.compare_model_scores.test_set_performance.tsv












GeneLocus.TCR TargetObsColumnEnum.age_group_healthy_only --> /users/maximz/code/boyd-immune-repertoire-classification/out/convergent_clusters/TCR/age_group_healthy_only
























































































































































































































































































































Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,sample_size,n_abstentions,...,ROC-AUC (macro OvO) per fold with abstention,au-PRC (weighted OvO) per fold with abstention,au-PRC (macro OvO) per fold with abstention,Accuracy per fold with abstention,MCC per fold with abstention,Unknown/abstention proportion per fold with abstention,Accuracy global with abstention,MCC global with abstention,Unknown/abstention proportion global with abstention,Abstention label global with abstention
rf_multiclass,0.664 +/- 0.011 (in 3 folds),0.658 +/- 0.004 (in 3 folds),0.682 +/- 0.014 (in 3 folds),0.674 +/- 0.022 (in 3 folds),0.353 +/- 0.041 (in 3 folds),0.278 +/- 0.012 (in 3 folds),0.352,0.216,165,0,...,,,,,,,,,,
rf_multiclass.decision_thresholds_tuned,0.664 +/- 0.011 (in 3 folds),0.658 +/- 0.004 (in 3 folds),0.682 +/- 0.014 (in 3 folds),0.674 +/- 0.022 (in 3 folds),0.284 +/- 0.019 (in 3 folds),0.235 +/- 0.058 (in 3 folds),0.285,0.147,165,0,...,,,,,,,,,,
elasticnet_cv,0.642 +/- 0.015 (in 3 folds),0.624 +/- 0.027 (in 3 folds),0.666 +/- 0.031 (in 3 folds),0.652 +/- 0.041 (in 3 folds),0.216 +/- 0.074 (in 3 folds),0.189 +/- 0.093 (in 3 folds),0.212,0.053,165,0,...,,,,,,,,,,
elasticnet_cv.decision_thresholds_tuned,0.642 +/- 0.015 (in 3 folds),0.624 +/- 0.027 (in 3 folds),0.666 +/- 0.031 (in 3 folds),0.652 +/- 0.041 (in 3 folds),0.367 +/- 0.064 (in 3 folds),0.254 +/- 0.090 (in 3 folds),0.364,0.223,165,0,...,,,,,,,,,,
ridge_cv,0.640 +/- 0.042 (in 3 folds),0.623 +/- 0.027 (in 3 folds),0.664 +/- 0.007 (in 3 folds),0.650 +/- 0.014 (in 3 folds),0.186 +/- 0.038 (in 3 folds),0.105 +/- 0.112 (in 3 folds),0.182,-0.004,159,6,...,0.615 +/- 0.033 (in 2 folds),0.660 +/- 0.003 (in 2 folds),0.647 +/- 0.019 (in 2 folds),0.177 +/- 0.024 (in 3 folds),0.124 +/- 0.087 (in 3 folds),0.120 +/- 0.000 (in 1 folds),0.176,-0.004,0.036,Unknown
ridge_cv.decision_thresholds_tuned,0.640 +/- 0.042 (in 3 folds),0.623 +/- 0.027 (in 3 folds),0.664 +/- 0.007 (in 3 folds),0.650 +/- 0.014 (in 3 folds),0.296 +/- 0.060 (in 3 folds),0.137 +/- 0.119 (in 3 folds),0.302,0.148,159,6,...,0.615 +/- 0.033 (in 2 folds),0.660 +/- 0.003 (in 2 folds),0.647 +/- 0.019 (in 2 folds),0.287 +/- 0.076 (in 3 folds),0.157 +/- 0.085 (in 3 folds),0.120 +/- 0.000 (in 1 folds),0.291,0.145,0.036,Unknown
lasso_cv,0.637 +/- 0.024 (in 3 folds),0.619 +/- 0.010 (in 3 folds),0.670 +/- 0.018 (in 3 folds),0.657 +/- 0.027 (in 3 folds),0.227 +/- 0.046 (in 3 folds),0.210 +/- 0.030 (in 3 folds),0.224,0.073,165,0,...,,,,,,,,,,
lasso_cv.decision_thresholds_tuned,0.637 +/- 0.024 (in 3 folds),0.619 +/- 0.010 (in 3 folds),0.670 +/- 0.018 (in 3 folds),0.657 +/- 0.027 (in 3 folds),0.344 +/- 0.102 (in 3 folds),0.271 +/- 0.092 (in 3 folds),0.339,0.213,165,0,...,,,,,,,,,,
linearsvm_ovr,0.623 +/- 0.054 (in 3 folds),0.605 +/- 0.057 (in 3 folds),0.661 +/- 0.052 (in 3 folds),0.648 +/- 0.056 (in 3 folds),0.344 +/- 0.053 (in 3 folds),0.252 +/- 0.030 (in 3 folds),0.34,0.195,162,3,...,0.583 +/- 0.059 (in 2 folds),0.638 +/- 0.047 (in 2 folds),0.626 +/- 0.058 (in 2 folds),0.336 +/- 0.039 (in 3 folds),0.246 +/- 0.026 (in 3 folds),0.060 +/- 0.000 (in 1 folds),0.333,0.192,0.018,Unknown
linearsvm_ovr.decision_thresholds_tuned,0.623 +/- 0.054 (in 3 folds),0.605 +/- 0.057 (in 3 folds),0.661 +/- 0.052 (in 3 folds),0.648 +/- 0.056 (in 3 folds),0.368 +/- 0.081 (in 3 folds),0.261 +/- 0.056 (in 3 folds),0.364,0.237,162,3,...,0.583 +/- 0.059 (in 2 folds),0.638 +/- 0.047 (in 2 folds),0.626 +/- 0.058 (in 2 folds),0.360 +/- 0.068 (in 3 folds),0.256 +/- 0.050 (in 3 folds),0.060 +/- 0.000 (in 1 folds),0.358,0.231,0.018,Unknown


/users/maximz/code/boyd-immune-repertoire-classification/out/convergent_clusters/TCR/age_group_healthy_only/train_smaller_model.compare_model_scores.test_set_performance.tsv


GeneLocus.TCR TargetObsColumnEnum.age_group_binary_healthy_only --> /users/maximz/code/boyd-immune-repertoire-classification/out/convergent_clusters/TCR/age_group_binary_healthy_only


Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,ROC-AUC (weighted OvO) per fold with abstention,ROC-AUC (macro OvO) per fold with abstention,...,Unknown/abstention proportion per fold with abstention,Accuracy global with abstention,MCC global with abstention,Unknown/abstention proportion global with abstention,Abstention label global with abstention,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
ridge_cv,0.715 +/- 0.105 (in 3 folds),0.715 +/- 0.105 (in 3 folds),0.850 +/- 0.076 (in 3 folds),0.850 +/- 0.076 (in 3 folds),0.671 +/- 0.086 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.651,0.0,,,...,0.232 +/- 0.341 (in 3 folds),0.497,0.004,0.236,Unknown,126,39,165,0.236364,True
ridge_cv.decision_thresholds_tuned,0.715 +/- 0.105 (in 3 folds),0.715 +/- 0.105 (in 3 folds),0.850 +/- 0.076 (in 3 folds),0.850 +/- 0.076 (in 3 folds),0.631 +/- 0.149 (in 3 folds),-0.061 +/- 0.106 (in 3 folds),0.603,-0.068,,,...,0.232 +/- 0.341 (in 3 folds),0.461,-0.028,0.236,Unknown,126,39,165,0.236364,False
lasso_cv,0.710 +/- 0.101 (in 3 folds),0.710 +/- 0.101 (in 3 folds),0.847 +/- 0.074 (in 3 folds),0.847 +/- 0.074 (in 3 folds),0.631 +/- 0.149 (in 3 folds),-0.061 +/- 0.106 (in 3 folds),0.603,-0.068,,,...,0.232 +/- 0.341 (in 3 folds),0.461,-0.028,0.236,Unknown,126,39,165,0.236364,False
lasso_cv.decision_thresholds_tuned,0.710 +/- 0.101 (in 3 folds),0.710 +/- 0.101 (in 3 folds),0.847 +/- 0.074 (in 3 folds),0.847 +/- 0.074 (in 3 folds),0.571 +/- 0.165 (in 3 folds),0.036 +/- 0.240 (in 3 folds),0.524,0.035,,,...,0.232 +/- 0.341 (in 3 folds),0.4,0.023,0.236,Unknown,126,39,165,0.236364,False
elasticnet_cv,0.708 +/- 0.097 (in 3 folds),0.708 +/- 0.097 (in 3 folds),0.840 +/- 0.077 (in 3 folds),0.840 +/- 0.077 (in 3 folds),0.651 +/- 0.116 (in 3 folds),-0.034 +/- 0.059 (in 3 folds),0.627,-0.032,,,...,0.232 +/- 0.341 (in 3 folds),0.479,-0.009,0.236,Unknown,126,39,165,0.236364,False
elasticnet_cv.decision_thresholds_tuned,0.708 +/- 0.097 (in 3 folds),0.708 +/- 0.097 (in 3 folds),0.840 +/- 0.077 (in 3 folds),0.840 +/- 0.077 (in 3 folds),0.565 +/- 0.170 (in 3 folds),0.029 +/- 0.228 (in 3 folds),0.516,0.023,,,...,0.232 +/- 0.341 (in 3 folds),0.394,0.016,0.236,Unknown,126,39,165,0.236364,False
linearsvm_ovr,0.705 +/- 0.095 (in 3 folds),0.705 +/- 0.095 (in 3 folds),0.840 +/- 0.077 (in 3 folds),0.840 +/- 0.077 (in 3 folds),0.635 +/- 0.147 (in 3 folds),0.168 +/- 0.309 (in 3 folds),0.642,0.178,0.778 +/- 0.000 (in 1 folds),0.778 +/- 0.000 (in 1 folds),...,0.027 +/- 0.010 (in 2 folds),0.63,0.17,0.018,Unknown,162,3,165,0.018182,False
linearsvm_ovr.decision_thresholds_tuned,0.705 +/- 0.095 (in 3 folds),0.705 +/- 0.095 (in 3 folds),0.840 +/- 0.077 (in 3 folds),0.840 +/- 0.077 (in 3 folds),0.593 +/- 0.122 (in 3 folds),0.144 +/- 0.289 (in 3 folds),0.599,0.145,0.778 +/- 0.000 (in 1 folds),0.778 +/- 0.000 (in 1 folds),...,0.027 +/- 0.010 (in 2 folds),0.588,0.14,0.018,Unknown,162,3,165,0.018182,False
lasso_multiclass,0.673 +/- 0.092 (in 3 folds),0.673 +/- 0.092 (in 3 folds),0.818 +/- 0.079 (in 3 folds),0.818 +/- 0.079 (in 3 folds),0.643 +/- 0.099 (in 3 folds),0.187 +/- 0.227 (in 3 folds),0.648,0.195,0.711 +/- 0.000 (in 1 folds),0.711 +/- 0.000 (in 1 folds),...,0.027 +/- 0.010 (in 2 folds),0.636,0.187,0.018,Unknown,162,3,165,0.018182,False
lasso_multiclass.decision_thresholds_tuned,0.673 +/- 0.092 (in 3 folds),0.673 +/- 0.092 (in 3 folds),0.818 +/- 0.079 (in 3 folds),0.818 +/- 0.079 (in 3 folds),0.552 +/- 0.071 (in 3 folds),0.110 +/- 0.254 (in 3 folds),0.556,0.101,0.711 +/- 0.000 (in 1 folds),0.711 +/- 0.000 (in 1 folds),...,0.027 +/- 0.010 (in 2 folds),0.545,0.098,0.018,Unknown,162,3,165,0.018182,False


/users/maximz/code/boyd-immune-repertoire-classification/out/convergent_clusters/TCR/age_group_binary_healthy_only/train_smaller_model.compare_model_scores.test_set_performance.tsv


GeneLocus.TCR TargetObsColumnEnum.sex_healthy_only --> /users/maximz/code/boyd-immune-repertoire-classification/out/convergent_clusters/TCR/sex_healthy_only


Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,Accuracy per fold with abstention,MCC per fold with abstention,...,au-PRC (macro OvO) per fold with abstention,Accuracy global with abstention,MCC global with abstention,Unknown/abstention proportion global with abstention,Abstention label global with abstention,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
ridge_cv,0.590 +/- 0.065 (in 3 folds),0.590 +/- 0.065 (in 3 folds),0.630 +/- 0.092 (in 3 folds),0.630 +/- 0.092 (in 3 folds),0.549 +/- 0.062 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.547,0.071,0.537 +/- 0.075 (in 3 folds),0.001 +/- 0.001 (in 3 folds),...,0.683 +/- 0.015 (in 2 folds),0.533,0.068,0.024,Unknown,161,4,165,0.024242,False
ridge_cv.decision_thresholds_tuned,0.590 +/- 0.065 (in 3 folds),0.590 +/- 0.065 (in 3 folds),0.630 +/- 0.092 (in 3 folds),0.630 +/- 0.092 (in 3 folds),0.531 +/- 0.077 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.528,0.033,0.520 +/- 0.088 (in 3 folds),-0.001 +/- 0.001 (in 3 folds),...,0.683 +/- 0.015 (in 2 folds),0.515,0.032,0.024,Unknown,161,4,165,0.024242,False
linearsvm_ovr,0.548 +/- 0.095 (in 3 folds),0.548 +/- 0.095 (in 3 folds),0.614 +/- 0.067 (in 3 folds),0.614 +/- 0.067 (in 3 folds),0.594 +/- 0.085 (in 3 folds),0.154 +/- 0.158 (in 3 folds),0.593,0.158,0.585 +/- 0.099 (in 3 folds),0.162 +/- 0.144 (in 3 folds),...,0.643 +/- 0.065 (in 2 folds),0.582,0.161,0.018,Unknown,162,3,165,0.018182,False
linearsvm_ovr.decision_thresholds_tuned,0.548 +/- 0.095 (in 3 folds),0.548 +/- 0.095 (in 3 folds),0.614 +/- 0.067 (in 3 folds),0.614 +/- 0.067 (in 3 folds),0.592 +/- 0.051 (in 3 folds),0.177 +/- 0.133 (in 3 folds),0.593,0.16,0.580 +/- 0.035 (in 3 folds),0.176 +/- 0.131 (in 3 folds),...,0.643 +/- 0.065 (in 2 folds),0.582,0.161,0.018,Unknown,162,3,165,0.018182,False
lasso_multiclass,0.510 +/- 0.074 (in 3 folds),0.510 +/- 0.074 (in 3 folds),0.587 +/- 0.095 (in 3 folds),0.587 +/- 0.095 (in 3 folds),0.546 +/- 0.064 (in 3 folds),0.025 +/- 0.047 (in 3 folds),0.545,0.055,0.520 +/- 0.088 (in 3 folds),0.030 +/- 0.037 (in 3 folds),...,0.693 +/- 0.000 (in 1 folds),0.515,0.06,0.055,Unknown,156,9,165,0.054545,False
lasso_multiclass.decision_thresholds_tuned,0.510 +/- 0.074 (in 3 folds),0.510 +/- 0.074 (in 3 folds),0.587 +/- 0.095 (in 3 folds),0.587 +/- 0.095 (in 3 folds),0.590 +/- 0.048 (in 3 folds),0.217 +/- 0.071 (in 3 folds),0.59,0.14,0.560 +/- 0.060 (in 3 folds),0.196 +/- 0.083 (in 3 folds),...,0.693 +/- 0.000 (in 1 folds),0.558,0.142,0.055,Unknown,156,9,165,0.054545,False
elasticnet_cv,0.505 +/- 0.087 (in 3 folds),0.505 +/- 0.087 (in 3 folds),0.604 +/- 0.101 (in 3 folds),0.604 +/- 0.101 (in 3 folds),0.498 +/- 0.027 (in 3 folds),-0.016 +/- 0.049 (in 3 folds),0.5,-0.028,0.472 +/- 0.041 (in 3 folds),-0.017 +/- 0.041 (in 3 folds),...,0.706 +/- 0.000 (in 1 folds),0.473,-0.022,0.055,Unknown,156,9,165,0.054545,False
elasticnet_cv.decision_thresholds_tuned,0.505 +/- 0.087 (in 3 folds),0.505 +/- 0.087 (in 3 folds),0.604 +/- 0.101 (in 3 folds),0.604 +/- 0.101 (in 3 folds),0.520 +/- 0.017 (in 3 folds),-0.053 +/- 0.169 (in 3 folds),0.519,-0.096,0.492 +/- 0.015 (in 3 folds),-0.057 +/- 0.136 (in 3 folds),...,0.706 +/- 0.000 (in 1 folds),0.491,-0.05,0.055,Unknown,156,9,165,0.054545,False
lasso_cv,0.477 +/- 0.056 (in 3 folds),0.477 +/- 0.056 (in 3 folds),0.563 +/- 0.036 (in 3 folds),0.563 +/- 0.036 (in 3 folds),0.526 +/- 0.051 (in 3 folds),0.034 +/- 0.114 (in 3 folds),0.529,0.05,0.494 +/- 0.047 (in 3 folds),0.055 +/- 0.103 (in 3 folds),...,,0.497,0.046,0.061,Unknown,155,10,165,0.060606,False
lasso_cv.decision_thresholds_tuned,0.477 +/- 0.056 (in 3 folds),0.477 +/- 0.056 (in 3 folds),0.563 +/- 0.036 (in 3 folds),0.563 +/- 0.036 (in 3 folds),0.551 +/- 0.078 (in 3 folds),0.108 +/- 0.160 (in 3 folds),0.555,0.112,0.518 +/- 0.075 (in 3 folds),0.102 +/- 0.155 (in 3 folds),...,,0.521,0.099,0.061,Unknown,155,10,165,0.060606,False


/users/maximz/code/boyd-immune-repertoire-classification/out/convergent_clusters/TCR/sex_healthy_only/train_smaller_model.compare_model_scores.test_set_performance.tsv
