# Tune "train-smaller" repertoire stats model decision thresholds on validation set, and report performance (with and without tuning) on test set

This notebook runs on the train-smaller + validation + test splits, not on the train + test splits.

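Tuning and evaluation are done through the trained-model wrapper API (`RepertoireClassifier`) and the helpers in `malid.train.training_utils`.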

In [1]:
from malid import config
from malid.train.training_utils import (
    evaluate_original_and_tuned_on_test_set,
    tune_on_validation_set,
)
from malid.trained_model_wrappers import RepertoireClassifier
from malid.datamodels import (
    combine_classification_option_names,
)

In [2]:
# Run: for each gene locus, call tune_on_validation_set and hand the resulting
# classifiers to evaluate_original_and_tuned_on_test_set.
model_names_to_tune = (
    "lasso_multiclass",
    "lasso_cv",
    "ridge_cv",
    "elasticnet_cv",
    "rf_multiclass",
    "xgboost",
    "linearsvm_ovr",
)

for gene_locus in config.gene_loci_used:
    # Map every classification target to its own output directory, nested
    # under this locus. The output base dir should already exist.
    map_targets_to_output_dir = {}
    for target in config.classification_targets:
        map_targets_to_output_dir[target] = (
            config.paths.repertoire_stats_classifier_output_dir
            / gene_locus.name
            / combine_classification_option_names(target)
        )
    print(gene_locus)

    clfs = tune_on_validation_set(
        gene_locus=gene_locus,
        targets=map_targets_to_output_dir,
        # Pass a fresh list on every call so no state is shared across loci.
        model_names=list(model_names_to_tune),
        model_class=RepertoireClassifier,
    )
    evaluate_original_and_tuned_on_test_set(
        clfs=clfs,
        gene_locus=gene_locus,
        targets=map_targets_to_output_dir,
    )

2022-12-30 23:37:26,740 - malid.external.scratch_cache - INFO - Reading network file from local machine cache: /users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/embedded/unirep_fine_tuned/anndatas_scaled/BCR/fold.0.validation.h5ad -> /srv/scratch/maximz/cache/1a7cd102c4a71eb472da3636203a91984ec407adbc0812ffba2c07c5.0.validation.h5ad


GeneLocus.BCR
Only considering the two last: ['.validation', '.h5ad'].


Only considering the two last: ['.validation', '.h5ad'].








2022-12-30 23:45:37,324 - malid.helpers - INFO - Target TargetObsColumnEnum.covid_vs_healthy: filtering to specimens from diseases ['Covid19', 'Healthy/Background'] only; removed 46 specimens




2022-12-30 23:47:39,640 - malid.helpers - INFO - Target TargetObsColumnEnum.hiv_vs_healthy: filtering to specimens from diseases ['HIV', 'Healthy/Background'] only; removed 40 specimens




2022-12-30 23:49:59,990 - malid.helpers - INFO - Target TargetObsColumnEnum.lupus_vs_healthy: filtering to specimens from diseases ['Lupus', 'Healthy/Background'] only; removed 36 specimens




2022-12-30 23:52:35,148 - malid.helpers - INFO - Target TargetObsColumnEnum.ethnicity_condensed_healthy_only: filtered to specimens with defined ethnicity_condensed column - removed 12 specimens (365758 rows)


2022-12-30 23:52:45,023 - malid.helpers - INFO - Target TargetObsColumnEnum.ethnicity_condensed_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 56 specimens




2022-12-30 23:54:49,562 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_healthy_only: filtered to specimens with defined age_group column - removed 2 specimens (20035 rows)


2022-12-30 23:55:00,505 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 60 specimens




2022-12-30 23:57:38,971 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_binary_healthy_only: filtered to specimens with defined age_group_binary column - removed 2 specimens (20035 rows)


2022-12-30 23:57:49,488 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_binary_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 60 specimens




2022-12-30 23:59:48,891 - malid.helpers - INFO - Target TargetObsColumnEnum.sex_healthy_only: filtered to specimens with defined sex column - removed 1 specimens (13078 rows)


2022-12-30 23:59:59,716 - malid.helpers - INFO - Target TargetObsColumnEnum.sex_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 61 specimens


2022-12-31 00:01:15,877 - malid.external.scratch_cache - INFO - Reading network file from local machine cache: /users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/embedded/unirep_fine_tuned/anndatas_scaled/BCR/fold.1.validation.h5ad -> /srv/scratch/maximz/cache/9c85c2a266a883a684e8c5d509b8321d4689380ae1339b1d3a20c9e8.1.validation.h5ad


Only considering the two last: ['.validation', '.h5ad'].


Only considering the two last: ['.validation', '.h5ad'].








2022-12-31 00:08:47,479 - malid.helpers - INFO - Target TargetObsColumnEnum.covid_vs_healthy: filtering to specimens from diseases ['Covid19', 'Healthy/Background'] only; removed 42 specimens




2022-12-31 00:10:47,056 - malid.helpers - INFO - Target TargetObsColumnEnum.hiv_vs_healthy: filtering to specimens from diseases ['HIV', 'Healthy/Background'] only; removed 33 specimens




2022-12-31 00:13:12,604 - malid.helpers - INFO - Target TargetObsColumnEnum.lupus_vs_healthy: filtering to specimens from diseases ['Lupus', 'Healthy/Background'] only; removed 35 specimens




2022-12-31 00:16:25,796 - malid.helpers - INFO - Target TargetObsColumnEnum.ethnicity_condensed_healthy_only: filtered to specimens with defined ethnicity_condensed column - removed 11 specimens (332120 rows)


2022-12-31 00:16:36,196 - malid.helpers - INFO - Target TargetObsColumnEnum.ethnicity_condensed_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 48 specimens




2022-12-31 00:18:43,009 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_healthy_only: filtered to specimens with defined age_group column - removed 1 specimens (5035 rows)


2022-12-31 00:18:53,964 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 54 specimens




2022-12-31 00:21:29,247 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_binary_healthy_only: filtered to specimens with defined age_group_binary column - removed 1 specimens (5035 rows)


2022-12-31 00:21:39,584 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_binary_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 54 specimens




2022-12-31 00:23:30,839 - malid.helpers - INFO - Target TargetObsColumnEnum.sex_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 55 specimens


2022-12-31 00:24:41,600 - malid.external.scratch_cache - INFO - Reading network file from local machine cache: /users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/embedded/unirep_fine_tuned/anndatas_scaled/BCR/fold.2.validation.h5ad -> /srv/scratch/maximz/cache/08c1068072d49c0e446bca7b2515cc6904c1583e869886f65b95c2db.2.validation.h5ad


Only considering the two last: ['.validation', '.h5ad'].


Only considering the two last: ['.validation', '.h5ad'].








2022-12-31 00:32:53,332 - malid.helpers - INFO - Target TargetObsColumnEnum.covid_vs_healthy: filtering to specimens from diseases ['Covid19', 'Healthy/Background'] only; removed 44 specimens




2022-12-31 00:35:14,302 - malid.helpers - INFO - Target TargetObsColumnEnum.hiv_vs_healthy: filtering to specimens from diseases ['HIV', 'Healthy/Background'] only; removed 37 specimens




2022-12-31 00:37:42,925 - malid.helpers - INFO - Target TargetObsColumnEnum.lupus_vs_healthy: filtering to specimens from diseases ['Lupus', 'Healthy/Background'] only; removed 35 specimens




2022-12-31 00:40:34,602 - malid.helpers - INFO - Target TargetObsColumnEnum.ethnicity_condensed_healthy_only: filtered to specimens with defined ethnicity_condensed column - removed 13 specimens (345033 rows)


2022-12-31 00:40:51,416 - malid.helpers - INFO - Target TargetObsColumnEnum.ethnicity_condensed_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 51 specimens




2022-12-31 00:44:05,529 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_healthy_only: filtered to specimens with defined age_group column - removed 3 specimens (59403 rows)


2022-12-31 00:44:18,899 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 56 specimens




2022-12-31 00:48:33,497 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_binary_healthy_only: filtered to specimens with defined age_group_binary column - removed 3 specimens (59403 rows)


2022-12-31 00:48:46,344 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_binary_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 56 specimens




2022-12-31 00:51:09,466 - malid.helpers - INFO - Target TargetObsColumnEnum.sex_healthy_only: filtered to specimens with defined sex column - removed 2 specimens (35834 rows)


2022-12-31 00:51:22,354 - malid.helpers - INFO - Target TargetObsColumnEnum.sex_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 57 specimens


2022-12-31 00:52:47,898 - malid.external.scratch_cache - INFO - Reading network file from local machine cache: /users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/embedded/unirep_fine_tuned/anndatas_scaled/BCR/fold.-1.validation.h5ad -> /srv/scratch/maximz/cache/d12efe0f72cdefa66ff3f9089960fc16b89c64c2837b4b81d55fb8ed.-1.validation.h5ad


Only considering the two last: ['.validation', '.h5ad'].


Only considering the two last: ['.validation', '.h5ad'].








2022-12-31 01:05:08,593 - malid.helpers - INFO - Target TargetObsColumnEnum.covid_vs_healthy: filtering to specimens from diseases ['Covid19', 'Healthy/Background'] only; removed 66 specimens




2022-12-31 01:07:47,272 - malid.helpers - INFO - Target TargetObsColumnEnum.hiv_vs_healthy: filtering to specimens from diseases ['HIV', 'Healthy/Background'] only; removed 53 specimens




2022-12-31 01:10:12,607 - malid.helpers - INFO - Target TargetObsColumnEnum.lupus_vs_healthy: filtering to specimens from diseases ['Lupus', 'Healthy/Background'] only; removed 53 specimens




2022-12-31 01:12:58,580 - malid.helpers - INFO - Target TargetObsColumnEnum.ethnicity_condensed_healthy_only: filtered to specimens with defined ethnicity_condensed column - removed 20 specimens (485965 rows)


2022-12-31 01:16:34,518 - malid.helpers - INFO - Target TargetObsColumnEnum.ethnicity_condensed_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 75 specimens
IOStream.flush timed out




2022-12-31 01:28:47,510 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_healthy_only: filtered to specimens with defined age_group column - removed 2 specimens (35185 rows)


2022-12-31 01:29:08,576 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 84 specimens




2022-12-31 01:40:06,417 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_binary_healthy_only: filtered to specimens with defined age_group_binary column - removed 2 specimens (35185 rows)


2022-12-31 01:40:27,227 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_binary_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 84 specimens




2022-12-31 01:43:29,498 - malid.helpers - INFO - Target TargetObsColumnEnum.sex_healthy_only: filtered to specimens with defined sex column - removed 1 specimens (11616 rows)


2022-12-31 01:43:50,176 - malid.helpers - INFO - Target TargetObsColumnEnum.sex_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 85 specimens


GeneLocus.BCR TargetObsColumnEnum.disease


Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
lasso_multiclass,0.938 +/- 0.014 (in 3 folds),0.940 +/- 0.016 (in 3 folds),0.937 +/- 0.017 (in 3 folds),0.941 +/- 0.018 (in 3 folds),0.805 +/- 0.023 (in 3 folds),0.719 +/- 0.031 (in 3 folds),0.805,0.718,323,0,323,0.0,False
lasso_multiclass.decision_thresholds_tuned,0.938 +/- 0.014 (in 3 folds),0.940 +/- 0.016 (in 3 folds),0.937 +/- 0.017 (in 3 folds),0.941 +/- 0.018 (in 3 folds),0.845 +/- 0.002 (in 3 folds),0.776 +/- 0.006 (in 3 folds),0.845,0.773,323,0,323,0.0,False
rf_multiclass,0.922 +/- 0.008 (in 3 folds),0.923 +/- 0.009 (in 3 folds),0.929 +/- 0.008 (in 3 folds),0.932 +/- 0.010 (in 3 folds),0.768 +/- 0.051 (in 3 folds),0.659 +/- 0.068 (in 3 folds),0.768,0.658,323,0,323,0.0,False
rf_multiclass.decision_thresholds_tuned,0.922 +/- 0.008 (in 3 folds),0.923 +/- 0.009 (in 3 folds),0.929 +/- 0.008 (in 3 folds),0.932 +/- 0.010 (in 3 folds),0.839 +/- 0.020 (in 3 folds),0.767 +/- 0.028 (in 3 folds),0.839,0.765,323,0,323,0.0,False
linearsvm_ovr,0.918 +/- 0.010 (in 3 folds),0.918 +/- 0.014 (in 3 folds),0.916 +/- 0.014 (in 3 folds),0.920 +/- 0.016 (in 3 folds),0.783 +/- 0.005 (in 3 folds),0.685 +/- 0.011 (in 3 folds),0.783,0.683,323,0,323,0.0,False
linearsvm_ovr.decision_thresholds_tuned,0.918 +/- 0.010 (in 3 folds),0.918 +/- 0.014 (in 3 folds),0.916 +/- 0.014 (in 3 folds),0.920 +/- 0.016 (in 3 folds),0.830 +/- 0.005 (in 3 folds),0.754 +/- 0.007 (in 3 folds),0.83,0.75,323,0,323,0.0,False
xgboost,0.910 +/- 0.029 (in 3 folds),0.909 +/- 0.031 (in 3 folds),0.918 +/- 0.029 (in 3 folds),0.922 +/- 0.031 (in 3 folds),0.783 +/- 0.019 (in 3 folds),0.682 +/- 0.031 (in 3 folds),0.783,0.681,323,0,323,0.0,False
xgboost.decision_thresholds_tuned,0.910 +/- 0.029 (in 3 folds),0.909 +/- 0.031 (in 3 folds),0.918 +/- 0.029 (in 3 folds),0.922 +/- 0.031 (in 3 folds),0.823 +/- 0.010 (in 3 folds),0.740 +/- 0.014 (in 3 folds),0.824,0.739,323,0,323,0.0,False
ridge_cv,0.907 +/- 0.019 (in 3 folds),0.900 +/- 0.024 (in 3 folds),0.907 +/- 0.022 (in 3 folds),0.906 +/- 0.027 (in 3 folds),0.575 +/- 0.202 (in 3 folds),0.238 +/- 0.412 (in 3 folds),0.576,0.358,323,0,323,0.0,False
ridge_cv.decision_thresholds_tuned,0.907 +/- 0.019 (in 3 folds),0.900 +/- 0.024 (in 3 folds),0.907 +/- 0.022 (in 3 folds),0.906 +/- 0.027 (in 3 folds),0.793 +/- 0.083 (in 3 folds),0.698 +/- 0.114 (in 3 folds),0.793,0.695,323,0,323,0.0,False


GeneLocus.BCR TargetObsColumnEnum.disease_all_demographics_present


Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
lasso_multiclass,0.938 +/- 0.012 (in 3 folds),0.939 +/- 0.012 (in 3 folds),0.938 +/- 0.015 (in 3 folds),0.941 +/- 0.014 (in 3 folds),0.800 +/- 0.008 (in 3 folds),0.708 +/- 0.007 (in 3 folds),0.8,0.707,285,0,285,0.0,False
lasso_multiclass.decision_thresholds_tuned,0.938 +/- 0.012 (in 3 folds),0.939 +/- 0.012 (in 3 folds),0.938 +/- 0.015 (in 3 folds),0.941 +/- 0.014 (in 3 folds),0.842 +/- 0.029 (in 3 folds),0.775 +/- 0.034 (in 3 folds),0.842,0.769,285,0,285,0.0,False
rf_multiclass,0.918 +/- 0.004 (in 3 folds),0.918 +/- 0.006 (in 3 folds),0.923 +/- 0.004 (in 3 folds),0.926 +/- 0.003 (in 3 folds),0.748 +/- 0.062 (in 3 folds),0.629 +/- 0.075 (in 3 folds),0.747,0.626,285,0,285,0.0,False
rf_multiclass.decision_thresholds_tuned,0.918 +/- 0.004 (in 3 folds),0.918 +/- 0.006 (in 3 folds),0.923 +/- 0.004 (in 3 folds),0.926 +/- 0.003 (in 3 folds),0.818 +/- 0.042 (in 3 folds),0.742 +/- 0.037 (in 3 folds),0.818,0.733,285,0,285,0.0,False
xgboost,0.913 +/- 0.018 (in 3 folds),0.911 +/- 0.018 (in 3 folds),0.925 +/- 0.015 (in 3 folds),0.927 +/- 0.014 (in 3 folds),0.754 +/- 0.032 (in 3 folds),0.640 +/- 0.038 (in 3 folds),0.754,0.635,285,0,285,0.0,False
xgboost.decision_thresholds_tuned,0.913 +/- 0.018 (in 3 folds),0.911 +/- 0.018 (in 3 folds),0.925 +/- 0.015 (in 3 folds),0.927 +/- 0.014 (in 3 folds),0.824 +/- 0.008 (in 3 folds),0.742 +/- 0.018 (in 3 folds),0.825,0.74,285,0,285,0.0,False
linearsvm_ovr,0.912 +/- 0.010 (in 3 folds),0.910 +/- 0.010 (in 3 folds),0.908 +/- 0.007 (in 3 folds),0.910 +/- 0.010 (in 3 folds),0.772 +/- 0.048 (in 3 folds),0.668 +/- 0.064 (in 3 folds),0.772,0.664,285,0,285,0.0,False
linearsvm_ovr.decision_thresholds_tuned,0.912 +/- 0.010 (in 3 folds),0.910 +/- 0.010 (in 3 folds),0.908 +/- 0.007 (in 3 folds),0.910 +/- 0.010 (in 3 folds),0.814 +/- 0.029 (in 3 folds),0.735 +/- 0.033 (in 3 folds),0.814,0.724,285,0,285,0.0,False
ridge_cv,0.910 +/- 0.015 (in 3 folds),0.903 +/- 0.022 (in 3 folds),0.911 +/- 0.018 (in 3 folds),0.910 +/- 0.024 (in 3 folds),0.654 +/- 0.159 (in 3 folds),0.421 +/- 0.375 (in 3 folds),0.656,0.498,285,0,285,0.0,False
ridge_cv.decision_thresholds_tuned,0.910 +/- 0.015 (in 3 folds),0.903 +/- 0.022 (in 3 folds),0.911 +/- 0.018 (in 3 folds),0.910 +/- 0.024 (in 3 folds),0.720 +/- 0.197 (in 3 folds),0.507 +/- 0.440 (in 3 folds),0.723,0.586,285,0,285,0.0,False


GeneLocus.BCR TargetObsColumnEnum.covid_vs_healthy


Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
lasso_multiclass,0.963 +/- 0.007 (in 3 folds),0.963 +/- 0.007 (in 3 folds),0.986 +/- 0.004 (in 3 folds),0.986 +/- 0.004 (in 3 folds),0.948 +/- 0.010 (in 3 folds),0.844 +/- 0.040 (in 3 folds),0.948,0.844,191,0,191,0.0,False
lasso_multiclass.decision_thresholds_tuned,0.963 +/- 0.007 (in 3 folds),0.963 +/- 0.007 (in 3 folds),0.986 +/- 0.004 (in 3 folds),0.986 +/- 0.004 (in 3 folds),0.974 +/- 0.009 (in 3 folds),0.923 +/- 0.027 (in 3 folds),0.974,0.923,191,0,191,0.0,False
elasticnet_cv,0.954 +/- 0.023 (in 3 folds),0.954 +/- 0.023 (in 3 folds),0.983 +/- 0.011 (in 3 folds),0.983 +/- 0.011 (in 3 folds),0.822 +/- 0.058 (in 3 folds),0.227 +/- 0.394 (in 3 folds),0.822,0.394,191,0,191,0.0,False
elasticnet_cv.decision_thresholds_tuned,0.954 +/- 0.023 (in 3 folds),0.954 +/- 0.023 (in 3 folds),0.983 +/- 0.011 (in 3 folds),0.983 +/- 0.011 (in 3 folds),0.953 +/- 0.016 (in 3 folds),0.861 +/- 0.055 (in 3 folds),0.953,0.86,191,0,191,0.0,False
linearsvm_ovr,0.950 +/- 0.024 (in 3 folds),0.950 +/- 0.024 (in 3 folds),0.980 +/- 0.012 (in 3 folds),0.980 +/- 0.012 (in 3 folds),0.947 +/- 0.025 (in 3 folds),0.843 +/- 0.084 (in 3 folds),0.948,0.844,191,0,191,0.0,False
linearsvm_ovr.decision_thresholds_tuned,0.950 +/- 0.024 (in 3 folds),0.950 +/- 0.024 (in 3 folds),0.980 +/- 0.012 (in 3 folds),0.980 +/- 0.012 (in 3 folds),0.953 +/- 0.028 (in 3 folds),0.862 +/- 0.084 (in 3 folds),0.953,0.864,191,0,191,0.0,False
rf_multiclass,0.948 +/- 0.031 (in 3 folds),0.948 +/- 0.031 (in 3 folds),0.972 +/- 0.019 (in 3 folds),0.972 +/- 0.019 (in 3 folds),0.921 +/- 0.017 (in 3 folds),0.760 +/- 0.061 (in 3 folds),0.921,0.762,191,0,191,0.0,False
rf_multiclass.decision_thresholds_tuned,0.948 +/- 0.031 (in 3 folds),0.948 +/- 0.031 (in 3 folds),0.972 +/- 0.019 (in 3 folds),0.972 +/- 0.019 (in 3 folds),0.958 +/- 0.010 (in 3 folds),0.880 +/- 0.026 (in 3 folds),0.958,0.88,191,0,191,0.0,False
xgboost,0.946 +/- 0.026 (in 3 folds),0.946 +/- 0.026 (in 3 folds),0.967 +/- 0.035 (in 3 folds),0.967 +/- 0.035 (in 3 folds),0.942 +/- 0.010 (in 3 folds),0.829 +/- 0.031 (in 3 folds),0.942,0.827,191,0,191,0.0,False
xgboost.decision_thresholds_tuned,0.946 +/- 0.026 (in 3 folds),0.946 +/- 0.026 (in 3 folds),0.967 +/- 0.035 (in 3 folds),0.967 +/- 0.035 (in 3 folds),0.958 +/- 0.025 (in 3 folds),0.878 +/- 0.074 (in 3 folds),0.958,0.878,191,0,191,0.0,False


GeneLocus.BCR TargetObsColumnEnum.hiv_vs_healthy


Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
xgboost,0.966 +/- 0.010 (in 3 folds),0.966 +/- 0.010 (in 3 folds),0.987 +/- 0.003 (in 3 folds),0.987 +/- 0.003 (in 3 folds),0.897 +/- 0.014 (in 3 folds),0.753 +/- 0.037 (in 3 folds),0.897,0.752,213,0,213,0.0,False
xgboost.decision_thresholds_tuned,0.966 +/- 0.010 (in 3 folds),0.966 +/- 0.010 (in 3 folds),0.987 +/- 0.003 (in 3 folds),0.987 +/- 0.003 (in 3 folds),0.920 +/- 0.006 (in 3 folds),0.819 +/- 0.011 (in 3 folds),0.92,0.818,213,0,213,0.0,False
lasso_cv,0.965 +/- 0.027 (in 3 folds),0.965 +/- 0.027 (in 3 folds),0.986 +/- 0.010 (in 3 folds),0.986 +/- 0.010 (in 3 folds),0.907 +/- 0.052 (in 3 folds),0.771 +/- 0.134 (in 3 folds),0.906,0.772,213,0,213,0.0,False
lasso_cv.decision_thresholds_tuned,0.965 +/- 0.027 (in 3 folds),0.965 +/- 0.027 (in 3 folds),0.986 +/- 0.010 (in 3 folds),0.986 +/- 0.010 (in 3 folds),0.935 +/- 0.040 (in 3 folds),0.849 +/- 0.095 (in 3 folds),0.934,0.845,213,0,213,0.0,False
rf_multiclass,0.964 +/- 0.016 (in 3 folds),0.964 +/- 0.016 (in 3 folds),0.986 +/- 0.004 (in 3 folds),0.986 +/- 0.004 (in 3 folds),0.902 +/- 0.012 (in 3 folds),0.761 +/- 0.033 (in 3 folds),0.901,0.761,213,0,213,0.0,False
rf_multiclass.decision_thresholds_tuned,0.964 +/- 0.016 (in 3 folds),0.964 +/- 0.016 (in 3 folds),0.986 +/- 0.004 (in 3 folds),0.986 +/- 0.004 (in 3 folds),0.906 +/- 0.020 (in 3 folds),0.802 +/- 0.026 (in 3 folds),0.906,0.798,213,0,213,0.0,False
elasticnet_cv,0.963 +/- 0.024 (in 3 folds),0.963 +/- 0.024 (in 3 folds),0.985 +/- 0.009 (in 3 folds),0.985 +/- 0.009 (in 3 folds),0.902 +/- 0.036 (in 3 folds),0.759 +/- 0.096 (in 3 folds),0.901,0.76,213,0,213,0.0,False
elasticnet_cv.decision_thresholds_tuned,0.963 +/- 0.024 (in 3 folds),0.963 +/- 0.024 (in 3 folds),0.985 +/- 0.009 (in 3 folds),0.985 +/- 0.009 (in 3 folds),0.925 +/- 0.044 (in 3 folds),0.831 +/- 0.093 (in 3 folds),0.925,0.823,213,0,213,0.0,False
lasso_multiclass,0.961 +/- 0.030 (in 3 folds),0.961 +/- 0.030 (in 3 folds),0.984 +/- 0.013 (in 3 folds),0.984 +/- 0.013 (in 3 folds),0.925 +/- 0.031 (in 3 folds),0.824 +/- 0.073 (in 3 folds),0.925,0.823,213,0,213,0.0,False
lasso_multiclass.decision_thresholds_tuned,0.961 +/- 0.030 (in 3 folds),0.961 +/- 0.030 (in 3 folds),0.984 +/- 0.013 (in 3 folds),0.984 +/- 0.013 (in 3 folds),0.939 +/- 0.021 (in 3 folds),0.855 +/- 0.053 (in 3 folds),0.939,0.856,213,0,213,0.0,False


GeneLocus.BCR TargetObsColumnEnum.lupus_vs_healthy


Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
lasso_multiclass,0.938 +/- 0.027 (in 3 folds),0.938 +/- 0.027 (in 3 folds),0.904 +/- 0.040 (in 3 folds),0.904 +/- 0.040 (in 3 folds),0.885 +/- 0.008 (in 3 folds),0.734 +/- 0.012 (in 3 folds),0.885,0.733,217,0,217,0.0,False
lasso_multiclass.decision_thresholds_tuned,0.938 +/- 0.027 (in 3 folds),0.938 +/- 0.027 (in 3 folds),0.904 +/- 0.040 (in 3 folds),0.904 +/- 0.040 (in 3 folds),0.908 +/- 0.022 (in 3 folds),0.788 +/- 0.046 (in 3 folds),0.908,0.784,217,0,217,0.0,False
linearsvm_ovr,0.936 +/- 0.030 (in 3 folds),0.936 +/- 0.030 (in 3 folds),0.893 +/- 0.048 (in 3 folds),0.893 +/- 0.048 (in 3 folds),0.876 +/- 0.025 (in 3 folds),0.717 +/- 0.043 (in 3 folds),0.876,0.715,217,0,217,0.0,False
linearsvm_ovr.decision_thresholds_tuned,0.936 +/- 0.030 (in 3 folds),0.936 +/- 0.030 (in 3 folds),0.893 +/- 0.048 (in 3 folds),0.893 +/- 0.048 (in 3 folds),0.890 +/- 0.047 (in 3 folds),0.762 +/- 0.072 (in 3 folds),0.889,0.75,217,0,217,0.0,False
elasticnet_cv,0.934 +/- 0.022 (in 3 folds),0.934 +/- 0.022 (in 3 folds),0.905 +/- 0.036 (in 3 folds),0.905 +/- 0.036 (in 3 folds),0.885 +/- 0.021 (in 3 folds),0.725 +/- 0.044 (in 3 folds),0.885,0.725,217,0,217,0.0,False
elasticnet_cv.decision_thresholds_tuned,0.934 +/- 0.022 (in 3 folds),0.934 +/- 0.022 (in 3 folds),0.905 +/- 0.036 (in 3 folds),0.905 +/- 0.036 (in 3 folds),0.908 +/- 0.028 (in 3 folds),0.787 +/- 0.059 (in 3 folds),0.908,0.782,217,0,217,0.0,False
ridge_cv,0.933 +/- 0.028 (in 3 folds),0.933 +/- 0.028 (in 3 folds),0.894 +/- 0.062 (in 3 folds),0.894 +/- 0.062 (in 3 folds),0.812 +/- 0.134 (in 3 folds),0.491 +/- 0.426 (in 3 folds),0.811,0.558,217,0,217,0.0,False
ridge_cv.decision_thresholds_tuned,0.933 +/- 0.028 (in 3 folds),0.933 +/- 0.028 (in 3 folds),0.894 +/- 0.062 (in 3 folds),0.894 +/- 0.062 (in 3 folds),0.840 +/- 0.158 (in 3 folds),0.556 +/- 0.483 (in 3 folds),0.839,0.622,217,0,217,0.0,False
lasso_cv,0.930 +/- 0.023 (in 3 folds),0.930 +/- 0.023 (in 3 folds),0.894 +/- 0.040 (in 3 folds),0.894 +/- 0.040 (in 3 folds),0.880 +/- 0.015 (in 3 folds),0.715 +/- 0.027 (in 3 folds),0.88,0.715,217,0,217,0.0,False
lasso_cv.decision_thresholds_tuned,0.930 +/- 0.023 (in 3 folds),0.930 +/- 0.023 (in 3 folds),0.894 +/- 0.040 (in 3 folds),0.894 +/- 0.040 (in 3 folds),0.903 +/- 0.028 (in 3 folds),0.771 +/- 0.064 (in 3 folds),0.903,0.771,217,0,217,0.0,False


GeneLocus.BCR TargetObsColumnEnum.ethnicity_condensed_healthy_only


Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
elasticnet_cv,0.746 +/- 0.009 (in 3 folds),0.739 +/- 0.009 (in 3 folds),0.771 +/- 0.012 (in 3 folds),0.769 +/- 0.006 (in 3 folds),0.460 +/- 0.112 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.462,0.0,132,0,132,0.0,True
elasticnet_cv.decision_thresholds_tuned,0.746 +/- 0.009 (in 3 folds),0.739 +/- 0.009 (in 3 folds),0.771 +/- 0.012 (in 3 folds),0.769 +/- 0.006 (in 3 folds),0.709 +/- 0.087 (in 3 folds),0.589 +/- 0.074 (in 3 folds),0.712,0.588,132,0,132,0.0,True
lasso_cv,0.741 +/- 0.009 (in 3 folds),0.735 +/- 0.010 (in 3 folds),0.772 +/- 0.015 (in 3 folds),0.772 +/- 0.008 (in 3 folds),0.460 +/- 0.112 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.462,0.0,132,0,132,0.0,True
lasso_cv.decision_thresholds_tuned,0.741 +/- 0.009 (in 3 folds),0.735 +/- 0.010 (in 3 folds),0.772 +/- 0.015 (in 3 folds),0.772 +/- 0.008 (in 3 folds),0.717 +/- 0.085 (in 3 folds),0.599 +/- 0.073 (in 3 folds),0.72,0.599,132,0,132,0.0,True
linearsvm_ovr,0.716 +/- 0.111 (in 3 folds),0.691 +/- 0.127 (in 3 folds),0.719 +/- 0.089 (in 3 folds),0.698 +/- 0.099 (in 3 folds),0.637 +/- 0.051 (in 3 folds),0.454 +/- 0.125 (in 3 folds),0.636,0.435,132,0,132,0.0,False
linearsvm_ovr.decision_thresholds_tuned,0.716 +/- 0.111 (in 3 folds),0.691 +/- 0.127 (in 3 folds),0.719 +/- 0.089 (in 3 folds),0.698 +/- 0.099 (in 3 folds),0.733 +/- 0.048 (in 3 folds),0.600 +/- 0.082 (in 3 folds),0.735,0.613,132,0,132,0.0,True
lasso_multiclass,0.696 +/- 0.143 (in 3 folds),0.671 +/- 0.165 (in 3 folds),0.738 +/- 0.113 (in 3 folds),0.721 +/- 0.133 (in 3 folds),0.542 +/- 0.126 (in 3 folds),0.288 +/- 0.201 (in 3 folds),0.545,0.309,132,0,132,0.0,False
lasso_multiclass.decision_thresholds_tuned,0.696 +/- 0.143 (in 3 folds),0.671 +/- 0.165 (in 3 folds),0.738 +/- 0.113 (in 3 folds),0.721 +/- 0.133 (in 3 folds),0.733 +/- 0.044 (in 3 folds),0.612 +/- 0.056 (in 3 folds),0.735,0.62,132,0,132,0.0,True
rf_multiclass,0.670 +/- 0.036 (in 3 folds),0.616 +/- 0.022 (in 3 folds),0.692 +/- 0.008 (in 3 folds),0.653 +/- 0.006 (in 3 folds),0.658 +/- 0.094 (in 3 folds),0.517 +/- 0.069 (in 3 folds),0.659,0.513,132,0,132,0.0,True
rf_multiclass.decision_thresholds_tuned,0.670 +/- 0.036 (in 3 folds),0.616 +/- 0.022 (in 3 folds),0.692 +/- 0.008 (in 3 folds),0.653 +/- 0.006 (in 3 folds),0.748 +/- 0.061 (in 3 folds),0.640 +/- 0.040 (in 3 folds),0.75,0.641,132,0,132,0.0,True














GeneLocus.BCR TargetObsColumnEnum.age_group_healthy_only






































































































































































































































































































































Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
elasticnet_cv,0.647 +/- 0.043 (in 3 folds),0.644 +/- 0.043 (in 3 folds),0.690 +/- 0.040 (in 3 folds),0.688 +/- 0.041 (in 3 folds),0.191 +/- 0.047 (in 3 folds),0.148 +/- 0.070 (in 3 folds),0.189,0.019,132,0,132,0.0,True
elasticnet_cv.decision_thresholds_tuned,0.647 +/- 0.043 (in 3 folds),0.644 +/- 0.043 (in 3 folds),0.690 +/- 0.040 (in 3 folds),0.688 +/- 0.041 (in 3 folds),0.434 +/- 0.096 (in 3 folds),0.348 +/- 0.111 (in 3 folds),0.432,0.331,132,0,132,0.0,True
lasso_cv,0.642 +/- 0.036 (in 3 folds),0.638 +/- 0.038 (in 3 folds),0.688 +/- 0.035 (in 3 folds),0.685 +/- 0.038 (in 3 folds),0.214 +/- 0.058 (in 3 folds),0.166 +/- 0.083 (in 3 folds),0.212,0.051,132,0,132,0.0,True
lasso_cv.decision_thresholds_tuned,0.642 +/- 0.036 (in 3 folds),0.638 +/- 0.038 (in 3 folds),0.688 +/- 0.035 (in 3 folds),0.685 +/- 0.038 (in 3 folds),0.426 +/- 0.088 (in 3 folds),0.338 +/- 0.102 (in 3 folds),0.424,0.321,132,0,132,0.0,True
ridge_cv,0.633 +/- 0.065 (in 3 folds),0.628 +/- 0.072 (in 3 folds),0.680 +/- 0.047 (in 3 folds),0.675 +/- 0.051 (in 3 folds),0.152 +/- 0.020 (in 3 folds),-0.003 +/- 0.006 (in 3 folds),0.152,-0.045,132,0,132,0.0,True
ridge_cv.decision_thresholds_tuned,0.633 +/- 0.065 (in 3 folds),0.628 +/- 0.072 (in 3 folds),0.680 +/- 0.047 (in 3 folds),0.675 +/- 0.051 (in 3 folds),0.380 +/- 0.049 (in 3 folds),0.322 +/- 0.021 (in 3 folds),0.379,0.252,132,0,132,0.0,True
lasso_multiclass,0.624 +/- 0.062 (in 3 folds),0.616 +/- 0.076 (in 3 folds),0.677 +/- 0.059 (in 3 folds),0.669 +/- 0.070 (in 3 folds),0.281 +/- 0.059 (in 3 folds),0.148 +/- 0.063 (in 3 folds),0.28,0.144,132,0,132,0.0,False
lasso_multiclass.decision_thresholds_tuned,0.624 +/- 0.062 (in 3 folds),0.616 +/- 0.076 (in 3 folds),0.677 +/- 0.059 (in 3 folds),0.669 +/- 0.070 (in 3 folds),0.426 +/- 0.050 (in 3 folds),0.328 +/- 0.045 (in 3 folds),0.424,0.321,132,0,132,0.0,True
rf_multiclass,0.610 +/- 0.038 (in 3 folds),0.604 +/- 0.037 (in 3 folds),0.669 +/- 0.035 (in 3 folds),0.665 +/- 0.038 (in 3 folds),0.260 +/- 0.061 (in 3 folds),0.133 +/- 0.069 (in 3 folds),0.258,0.106,132,0,132,0.0,True
rf_multiclass.decision_thresholds_tuned,0.610 +/- 0.038 (in 3 folds),0.604 +/- 0.037 (in 3 folds),0.669 +/- 0.035 (in 3 folds),0.665 +/- 0.038 (in 3 folds),0.434 +/- 0.067 (in 3 folds),0.351 +/- 0.066 (in 3 folds),0.432,0.326,132,0,132,0.0,True


GeneLocus.BCR TargetObsColumnEnum.age_group_binary_healthy_only


Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
rf_multiclass,0.684 +/- 0.097 (in 3 folds),0.684 +/- 0.097 (in 3 folds),0.793 +/- 0.104 (in 3 folds),0.793 +/- 0.104 (in 3 folds),0.691 +/- 0.071 (in 3 folds),0.274 +/- 0.255 (in 3 folds),0.689,0.247,132,0,132,0.0,False
rf_multiclass.decision_thresholds_tuned,0.684 +/- 0.097 (in 3 folds),0.684 +/- 0.097 (in 3 folds),0.793 +/- 0.104 (in 3 folds),0.793 +/- 0.104 (in 3 folds),0.714 +/- 0.055 (in 3 folds),0.406 +/- 0.145 (in 3 folds),0.712,0.353,132,0,132,0.0,False
xgboost,0.673 +/- 0.077 (in 3 folds),0.673 +/- 0.077 (in 3 folds),0.802 +/- 0.073 (in 3 folds),0.802 +/- 0.073 (in 3 folds),0.685 +/- 0.074 (in 3 folds),0.276 +/- 0.162 (in 3 folds),0.682,0.263,132,0,132,0.0,False
xgboost.decision_thresholds_tuned,0.673 +/- 0.077 (in 3 folds),0.673 +/- 0.077 (in 3 folds),0.802 +/- 0.073 (in 3 folds),0.802 +/- 0.073 (in 3 folds),0.687 +/- 0.164 (in 3 folds),0.456 +/- 0.142 (in 3 folds),0.682,0.359,132,0,132,0.0,False
lasso_multiclass,0.621 +/- 0.062 (in 3 folds),0.621 +/- 0.062 (in 3 folds),0.765 +/- 0.100 (in 3 folds),0.765 +/- 0.100 (in 3 folds),0.576 +/- 0.097 (in 3 folds),0.137 +/- 0.193 (in 3 folds),0.576,0.115,132,0,132,0.0,False
lasso_multiclass.decision_thresholds_tuned,0.621 +/- 0.062 (in 3 folds),0.621 +/- 0.062 (in 3 folds),0.765 +/- 0.100 (in 3 folds),0.765 +/- 0.100 (in 3 folds),0.640 +/- 0.102 (in 3 folds),0.328 +/- 0.049 (in 3 folds),0.636,0.337,132,0,132,0.0,False
linearsvm_ovr,0.593 +/- 0.059 (in 3 folds),0.593 +/- 0.059 (in 3 folds),0.768 +/- 0.090 (in 3 folds),0.768 +/- 0.090 (in 3 folds),0.547 +/- 0.061 (in 3 folds),0.023 +/- 0.123 (in 3 folds),0.545,0.01,132,0,132,0.0,False
linearsvm_ovr.decision_thresholds_tuned,0.593 +/- 0.059 (in 3 folds),0.593 +/- 0.059 (in 3 folds),0.768 +/- 0.090 (in 3 folds),0.768 +/- 0.090 (in 3 folds),0.605 +/- 0.023 (in 3 folds),0.285 +/- 0.124 (in 3 folds),0.606,0.239,132,0,132,0.0,False
elasticnet_cv,0.539 +/- 0.080 (in 3 folds),0.539 +/- 0.080 (in 3 folds),0.706 +/- 0.070 (in 3 folds),0.706 +/- 0.070 (in 3 folds),0.654 +/- 0.077 (in 3 folds),0.037 +/- 0.142 (in 3 folds),0.652,0.025,132,0,132,0.0,False
elasticnet_cv.decision_thresholds_tuned,0.539 +/- 0.080 (in 3 folds),0.539 +/- 0.080 (in 3 folds),0.706 +/- 0.070 (in 3 folds),0.706 +/- 0.070 (in 3 folds),0.624 +/- 0.124 (in 3 folds),0.164 +/- 0.187 (in 3 folds),0.621,0.231,132,0,132,0.0,False


GeneLocus.BCR TargetObsColumnEnum.sex_healthy_only


Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
lasso_cv,0.516 +/- 0.123 (in 3 folds),0.516 +/- 0.123 (in 3 folds),0.502 +/- 0.213 (in 3 folds),0.502 +/- 0.213 (in 3 folds),0.441 +/- 0.063 (in 3 folds),0.045 +/- 0.084 (in 3 folds),0.439,-0.101,132,0,132,0.0,False
lasso_cv.decision_thresholds_tuned,0.516 +/- 0.123 (in 3 folds),0.516 +/- 0.123 (in 3 folds),0.502 +/- 0.213 (in 3 folds),0.502 +/- 0.213 (in 3 folds),0.556 +/- 0.209 (in 3 folds),0.222 +/- 0.225 (in 3 folds),0.553,0.148,132,0,132,0.0,False
xgboost,0.514 +/- 0.139 (in 3 folds),0.514 +/- 0.139 (in 3 folds),0.475 +/- 0.175 (in 3 folds),0.475 +/- 0.175 (in 3 folds),0.513 +/- 0.096 (in 3 folds),0.058 +/- 0.179 (in 3 folds),0.515,0.049,132,0,132,0.0,False
xgboost.decision_thresholds_tuned,0.514 +/- 0.139 (in 3 folds),0.514 +/- 0.139 (in 3 folds),0.475 +/- 0.175 (in 3 folds),0.475 +/- 0.175 (in 3 folds),0.581 +/- 0.101 (in 3 folds),0.282 +/- 0.118 (in 3 folds),0.583,0.233,132,0,132,0.0,False
rf_multiclass,0.507 +/- 0.142 (in 3 folds),0.507 +/- 0.142 (in 3 folds),0.499 +/- 0.203 (in 3 folds),0.499 +/- 0.203 (in 3 folds),0.468 +/- 0.060 (in 3 folds),0.007 +/- 0.157 (in 3 folds),0.47,-0.043,132,0,132,0.0,False
rf_multiclass.decision_thresholds_tuned,0.507 +/- 0.142 (in 3 folds),0.507 +/- 0.142 (in 3 folds),0.499 +/- 0.203 (in 3 folds),0.499 +/- 0.203 (in 3 folds),0.562 +/- 0.127 (in 3 folds),0.234 +/- 0.114 (in 3 folds),0.561,0.12,132,0,132,0.0,False
ridge_cv,0.480 +/- 0.034 (in 3 folds),0.480 +/- 0.034 (in 3 folds),0.454 +/- 0.151 (in 3 folds),0.454 +/- 0.151 (in 3 folds),0.418 +/- 0.039 (in 3 folds),-0.015 +/- 0.026 (in 3 folds),0.417,-0.157,132,0,132,0.0,False
ridge_cv.decision_thresholds_tuned,0.480 +/- 0.034 (in 3 folds),0.480 +/- 0.034 (in 3 folds),0.454 +/- 0.151 (in 3 folds),0.454 +/- 0.151 (in 3 folds),0.470 +/- 0.126 (in 3 folds),0.035 +/- 0.060 (in 3 folds),0.47,0.081,132,0,132,0.0,False
lasso_multiclass,0.475 +/- 0.125 (in 3 folds),0.475 +/- 0.125 (in 3 folds),0.496 +/- 0.214 (in 3 folds),0.496 +/- 0.214 (in 3 folds),0.491 +/- 0.114 (in 3 folds),0.002 +/- 0.207 (in 3 folds),0.492,-0.001,132,0,132,0.0,False
lasso_multiclass.decision_thresholds_tuned,0.475 +/- 0.125 (in 3 folds),0.475 +/- 0.125 (in 3 folds),0.496 +/- 0.214 (in 3 folds),0.496 +/- 0.214 (in 3 folds),0.518 +/- 0.149 (in 3 folds),0.207 +/- 0.091 (in 3 folds),0.515,0.032,132,0,132,0.0,False


2022-12-31 01:47:06,452 - malid.external.scratch_cache - INFO - Reading network file from local machine cache: /users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/embedded/unirep_fine_tuned/anndatas_scaled/BCR/fold.0.test.h5ad -> /srv/scratch/maximz/cache/d23bdbcb1cb8d1c3007da595727fbbab8cc86779ab8967868314f2da.0.test.h5ad


Only considering the two last: ['.test', '.h5ad'].


Only considering the two last: ['.test', '.h5ad'].








2022-12-31 01:58:32,369 - malid.helpers - INFO - Target TargetObsColumnEnum.covid_vs_healthy: filtering to specimens from diseases ['Covid19', 'Healthy/Background'] only; removed 66 specimens




2022-12-31 02:01:30,904 - malid.helpers - INFO - Target TargetObsColumnEnum.hiv_vs_healthy: filtering to specimens from diseases ['HIV', 'Healthy/Background'] only; removed 53 specimens




2022-12-31 02:05:03,053 - malid.helpers - INFO - Target TargetObsColumnEnum.lupus_vs_healthy: filtering to specimens from diseases ['Lupus', 'Healthy/Background'] only; removed 53 specimens




2022-12-31 02:09:48,993 - malid.helpers - INFO - Target TargetObsColumnEnum.ethnicity_condensed_healthy_only: filtered to specimens with defined ethnicity_condensed column - removed 20 specimens (485965 rows)


2022-12-31 02:13:21,066 - malid.helpers - INFO - Target TargetObsColumnEnum.ethnicity_condensed_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 75 specimens




2022-12-31 02:37:54,381 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_healthy_only: filtered to specimens with defined age_group column - removed 2 specimens (35185 rows)


2022-12-31 02:41:11,820 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 84 specimens




2022-12-31 02:48:34,919 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_binary_healthy_only: filtered to specimens with defined age_group_binary column - removed 2 specimens (35185 rows)
IOStream.flush timed out
2022-12-31 02:49:06,543 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_binary_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 84 specimens
IOStream.flush timed out




2022-12-31 02:56:14,761 - malid.helpers - INFO - Target TargetObsColumnEnum.sex_healthy_only: filtered to specimens with defined sex column - removed 1 specimens (11616 rows)


2022-12-31 02:56:37,463 - malid.helpers - INFO - Target TargetObsColumnEnum.sex_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 85 specimens


2022-12-31 02:58:34,967 - malid.external.scratch_cache - INFO - Reading network file from local machine cache: /users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/embedded/unirep_fine_tuned/anndatas_scaled/BCR/fold.1.test.h5ad -> /srv/scratch/maximz/cache/ed1f2608e168c24c508b6bfbbe3a18ba1a4680e5c010e34cd184cae6.1.test.h5ad


Only considering the two last: ['.test', '.h5ad'].


Only considering the two last: ['.test', '.h5ad'].








2022-12-31 03:07:55,895 - malid.helpers - INFO - Target TargetObsColumnEnum.covid_vs_healthy: filtering to specimens from diseases ['Covid19', 'Healthy/Background'] only; removed 67 specimens




2022-12-31 03:10:26,705 - malid.helpers - INFO - Target TargetObsColumnEnum.hiv_vs_healthy: filtering to specimens from diseases ['HIV', 'Healthy/Background'] only; removed 56 specimens




2022-12-31 03:13:27,266 - malid.helpers - INFO - Target TargetObsColumnEnum.lupus_vs_healthy: filtering to specimens from diseases ['Lupus', 'Healthy/Background'] only; removed 55 specimens




2022-12-31 03:16:32,417 - malid.helpers - INFO - Target TargetObsColumnEnum.ethnicity_condensed_healthy_only: filtered to specimens with defined ethnicity_condensed column - removed 23 specimens (507703 rows)


2022-12-31 03:18:19,185 - malid.helpers - INFO - Target TargetObsColumnEnum.ethnicity_condensed_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 82 specimens




2022-12-31 03:24:22,378 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_healthy_only: filtered to specimens with defined age_group column - removed 3 specimens (42791 rows)


2022-12-31 03:25:15,164 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 87 specimens




2022-12-31 03:35:07,531 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_binary_healthy_only: filtered to specimens with defined age_group_binary column - removed 3 specimens (42791 rows)


2022-12-31 03:35:25,494 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_binary_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 87 specimens




2022-12-31 03:38:15,273 - malid.helpers - INFO - Target TargetObsColumnEnum.sex_healthy_only: filtered to specimens with defined sex column - removed 2 specimens (35834 rows)


2022-12-31 03:38:31,917 - malid.helpers - INFO - Target TargetObsColumnEnum.sex_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 88 specimens


2022-12-31 03:40:24,769 - malid.external.scratch_cache - INFO - Reading network file from local machine cache: /users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/embedded/unirep_fine_tuned/anndatas_scaled/BCR/fold.2.test.h5ad -> /srv/scratch/maximz/cache/83dcd409138574af7b7b712ce14967e926c14170bff7801b141edb49.2.test.h5ad


Only considering the two last: ['.test', '.h5ad'].


Only considering the two last: ['.test', '.h5ad'].








2022-12-31 03:51:39,937 - malid.helpers - INFO - Target TargetObsColumnEnum.covid_vs_healthy: filtering to specimens from diseases ['Covid19', 'Healthy/Background'] only; removed 63 specimens




2022-12-31 03:54:21,026 - malid.helpers - INFO - Target TargetObsColumnEnum.hiv_vs_healthy: filtering to specimens from diseases ['HIV', 'Healthy/Background'] only; removed 52 specimens




2022-12-31 03:57:11,703 - malid.helpers - INFO - Target TargetObsColumnEnum.lupus_vs_healthy: filtering to specimens from diseases ['Lupus', 'Healthy/Background'] only; removed 53 specimens




2022-12-31 04:00:14,509 - malid.helpers - INFO - Target TargetObsColumnEnum.ethnicity_condensed_healthy_only: filtered to specimens with defined ethnicity_condensed column - removed 14 specimens (363854 rows)


2022-12-31 04:02:54,833 - malid.helpers - INFO - Target TargetObsColumnEnum.ethnicity_condensed_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 74 specimens




2022-12-31 04:09:11,987 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_healthy_only: filtered to specimens with defined age_group column - removed 2 specimens (10728 rows)


2022-12-31 04:09:37,228 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 83 specimens




2022-12-31 04:19:25,665 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_binary_healthy_only: filtered to specimens with defined age_group_binary column - removed 2 specimens (10728 rows)


2022-12-31 04:19:43,823 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_binary_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 83 specimens




2022-12-31 04:25:09,687 - malid.helpers - INFO - Target TargetObsColumnEnum.sex_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 84 specimens


GeneLocus.BCR TargetObsColumnEnum.disease --> /users/maximz/code/boyd-immune-repertoire-classification/out/repertoire_stats/BCR/disease


Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,Global evaluation column name global,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
lasso_multiclass,0.939 +/- 0.014 (in 3 folds),0.942 +/- 0.016 (in 3 folds),0.938 +/- 0.015 (in 3 folds),0.943 +/- 0.015 (in 3 folds),0.812 +/- 0.010 (in 3 folds),0.728 +/- 0.015 (in 3 folds),0.812,0.728,disease.separate_past_exposures,480,0,480,0.0,False
lasso_multiclass.decision_thresholds_tuned,0.939 +/- 0.014 (in 3 folds),0.942 +/- 0.016 (in 3 folds),0.938 +/- 0.015 (in 3 folds),0.943 +/- 0.015 (in 3 folds),0.800 +/- 0.015 (in 3 folds),0.707 +/- 0.023 (in 3 folds),0.8,0.705,disease.separate_past_exposures,480,0,480,0.0,False
linearsvm_ovr,0.932 +/- 0.023 (in 3 folds),0.933 +/- 0.027 (in 3 folds),0.931 +/- 0.024 (in 3 folds),0.935 +/- 0.027 (in 3 folds),0.806 +/- 0.042 (in 3 folds),0.718 +/- 0.061 (in 3 folds),0.806,0.717,disease.separate_past_exposures,480,0,480,0.0,False
linearsvm_ovr.decision_thresholds_tuned,0.932 +/- 0.023 (in 3 folds),0.933 +/- 0.027 (in 3 folds),0.931 +/- 0.024 (in 3 folds),0.935 +/- 0.027 (in 3 folds),0.793 +/- 0.037 (in 3 folds),0.700 +/- 0.059 (in 3 folds),0.794,0.699,disease.separate_past_exposures,480,0,480,0.0,False
rf_multiclass,0.926 +/- 0.015 (in 3 folds),0.926 +/- 0.016 (in 3 folds),0.930 +/- 0.013 (in 3 folds),0.933 +/- 0.013 (in 3 folds),0.777 +/- 0.014 (in 3 folds),0.675 +/- 0.025 (in 3 folds),0.777,0.673,disease.separate_past_exposures,480,0,480,0.0,False
rf_multiclass.decision_thresholds_tuned,0.926 +/- 0.015 (in 3 folds),0.926 +/- 0.016 (in 3 folds),0.930 +/- 0.013 (in 3 folds),0.933 +/- 0.013 (in 3 folds),0.773 +/- 0.054 (in 3 folds),0.680 +/- 0.065 (in 3 folds),0.773,0.667,disease.separate_past_exposures,480,0,480,0.0,False
xgboost,0.919 +/- 0.006 (in 3 folds),0.918 +/- 0.007 (in 3 folds),0.923 +/- 0.004 (in 3 folds),0.926 +/- 0.004 (in 3 folds),0.761 +/- 0.024 (in 3 folds),0.648 +/- 0.037 (in 3 folds),0.76,0.645,disease.separate_past_exposures,480,0,480,0.0,False
xgboost.decision_thresholds_tuned,0.919 +/- 0.006 (in 3 folds),0.918 +/- 0.007 (in 3 folds),0.923 +/- 0.004 (in 3 folds),0.926 +/- 0.004 (in 3 folds),0.790 +/- 0.005 (in 3 folds),0.690 +/- 0.005 (in 3 folds),0.79,0.689,disease.separate_past_exposures,480,0,480,0.0,False
elasticnet_cv,0.902 +/- 0.023 (in 3 folds),0.897 +/- 0.026 (in 3 folds),0.903 +/- 0.023 (in 3 folds),0.902 +/- 0.024 (in 3 folds),0.786 +/- 0.022 (in 3 folds),0.687 +/- 0.032 (in 3 folds),0.785,0.686,disease.separate_past_exposures,480,0,480,0.0,False
elasticnet_cv.decision_thresholds_tuned,0.902 +/- 0.023 (in 3 folds),0.897 +/- 0.026 (in 3 folds),0.903 +/- 0.023 (in 3 folds),0.902 +/- 0.024 (in 3 folds),0.750 +/- 0.038 (in 3 folds),0.646 +/- 0.038 (in 3 folds),0.75,0.637,disease.separate_past_exposures,480,0,480,0.0,False


/users/maximz/code/boyd-immune-repertoire-classification/out/repertoire_stats/BCR/disease/train_smaller_model.compare_model_scores.test_set_performance.tsv


GeneLocus.BCR TargetObsColumnEnum.disease_all_demographics_present --> /users/maximz/code/boyd-immune-repertoire-classification/out/repertoire_stats/BCR/disease_all_demographics_present


Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,Global evaluation column name global,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
lasso_multiclass,0.942 +/- 0.014 (in 3 folds),0.946 +/- 0.014 (in 3 folds),0.940 +/- 0.019 (in 3 folds),0.946 +/- 0.019 (in 3 folds),0.802 +/- 0.018 (in 3 folds),0.711 +/- 0.023 (in 3 folds),0.802,0.712,disease.separate_past_exposures,420,0,420,0.0,False
lasso_multiclass.decision_thresholds_tuned,0.942 +/- 0.014 (in 3 folds),0.946 +/- 0.014 (in 3 folds),0.940 +/- 0.019 (in 3 folds),0.946 +/- 0.019 (in 3 folds),0.786 +/- 0.019 (in 3 folds),0.690 +/- 0.023 (in 3 folds),0.786,0.688,disease.separate_past_exposures,420,0,420,0.0,False
linearsvm_ovr,0.922 +/- 0.027 (in 3 folds),0.918 +/- 0.033 (in 3 folds),0.921 +/- 0.031 (in 3 folds),0.922 +/- 0.035 (in 3 folds),0.786 +/- 0.020 (in 3 folds),0.688 +/- 0.036 (in 3 folds),0.786,0.688,disease.separate_past_exposures,420,0,420,0.0,False
linearsvm_ovr.decision_thresholds_tuned,0.922 +/- 0.027 (in 3 folds),0.918 +/- 0.033 (in 3 folds),0.921 +/- 0.031 (in 3 folds),0.922 +/- 0.035 (in 3 folds),0.778 +/- 0.030 (in 3 folds),0.685 +/- 0.024 (in 3 folds),0.779,0.678,disease.separate_past_exposures,420,0,420,0.0,False
rf_multiclass,0.915 +/- 0.012 (in 3 folds),0.915 +/- 0.012 (in 3 folds),0.923 +/- 0.012 (in 3 folds),0.926 +/- 0.012 (in 3 folds),0.783 +/- 0.019 (in 3 folds),0.684 +/- 0.018 (in 3 folds),0.783,0.684,disease.separate_past_exposures,420,0,420,0.0,False
rf_multiclass.decision_thresholds_tuned,0.915 +/- 0.012 (in 3 folds),0.915 +/- 0.012 (in 3 folds),0.923 +/- 0.012 (in 3 folds),0.926 +/- 0.012 (in 3 folds),0.745 +/- 0.063 (in 3 folds),0.650 +/- 0.059 (in 3 folds),0.745,0.631,disease.separate_past_exposures,420,0,420,0.0,False
xgboost,0.912 +/- 0.015 (in 3 folds),0.913 +/- 0.015 (in 3 folds),0.921 +/- 0.017 (in 3 folds),0.926 +/- 0.016 (in 3 folds),0.779 +/- 0.019 (in 3 folds),0.674 +/- 0.024 (in 3 folds),0.779,0.674,disease.separate_past_exposures,420,0,420,0.0,False
xgboost.decision_thresholds_tuned,0.912 +/- 0.015 (in 3 folds),0.913 +/- 0.015 (in 3 folds),0.921 +/- 0.017 (in 3 folds),0.926 +/- 0.016 (in 3 folds),0.755 +/- 0.046 (in 3 folds),0.656 +/- 0.057 (in 3 folds),0.755,0.638,disease.separate_past_exposures,420,0,420,0.0,False
elasticnet_cv,0.907 +/- 0.013 (in 3 folds),0.903 +/- 0.019 (in 3 folds),0.910 +/- 0.018 (in 3 folds),0.910 +/- 0.023 (in 3 folds),0.802 +/- 0.023 (in 3 folds),0.711 +/- 0.029 (in 3 folds),0.802,0.71,disease.separate_past_exposures,420,0,420,0.0,False
elasticnet_cv.decision_thresholds_tuned,0.907 +/- 0.013 (in 3 folds),0.903 +/- 0.019 (in 3 folds),0.910 +/- 0.018 (in 3 folds),0.910 +/- 0.023 (in 3 folds),0.760 +/- 0.038 (in 3 folds),0.659 +/- 0.038 (in 3 folds),0.76,0.652,disease.separate_past_exposures,420,0,420,0.0,False


/users/maximz/code/boyd-immune-repertoire-classification/out/repertoire_stats/BCR/disease_all_demographics_present/train_smaller_model.compare_model_scores.test_set_performance.tsv


GeneLocus.BCR TargetObsColumnEnum.covid_vs_healthy --> /users/maximz/code/boyd-immune-repertoire-classification/out/repertoire_stats/BCR/covid_vs_healthy


Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,Global evaluation column name global,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
rf_multiclass,0.971 +/- 0.026 (in 3 folds),0.971 +/- 0.026 (in 3 folds),0.988 +/- 0.012 (in 3 folds),0.988 +/- 0.012 (in 3 folds),0.943 +/- 0.025 (in 3 folds),0.832 +/- 0.078 (in 3 folds),0.944,0.833,disease.separate_past_exposures,284,0,284,0.0,False
rf_multiclass.decision_thresholds_tuned,0.971 +/- 0.026 (in 3 folds),0.971 +/- 0.026 (in 3 folds),0.988 +/- 0.012 (in 3 folds),0.988 +/- 0.012 (in 3 folds),0.936 +/- 0.037 (in 3 folds),0.813 +/- 0.114 (in 3 folds),0.937,0.816,disease.separate_past_exposures,284,0,284,0.0,False
xgboost,0.964 +/- 0.034 (in 3 folds),0.964 +/- 0.034 (in 3 folds),0.987 +/- 0.014 (in 3 folds),0.987 +/- 0.014 (in 3 folds),0.919 +/- 0.040 (in 3 folds),0.770 +/- 0.105 (in 3 folds),0.919,0.762,disease.separate_past_exposures,284,0,284,0.0,False
xgboost.decision_thresholds_tuned,0.964 +/- 0.034 (in 3 folds),0.964 +/- 0.034 (in 3 folds),0.987 +/- 0.014 (in 3 folds),0.987 +/- 0.014 (in 3 folds),0.929 +/- 0.043 (in 3 folds),0.805 +/- 0.115 (in 3 folds),0.93,0.801,disease.separate_past_exposures,284,0,284,0.0,False
lasso_multiclass,0.960 +/- 0.037 (in 3 folds),0.960 +/- 0.037 (in 3 folds),0.985 +/- 0.014 (in 3 folds),0.985 +/- 0.014 (in 3 folds),0.957 +/- 0.039 (in 3 folds),0.872 +/- 0.117 (in 3 folds),0.958,0.875,disease.separate_past_exposures,284,0,284,0.0,False
lasso_multiclass.decision_thresholds_tuned,0.960 +/- 0.037 (in 3 folds),0.960 +/- 0.037 (in 3 folds),0.985 +/- 0.014 (in 3 folds),0.985 +/- 0.014 (in 3 folds),0.950 +/- 0.027 (in 3 folds),0.852 +/- 0.083 (in 3 folds),0.951,0.854,disease.separate_past_exposures,284,0,284,0.0,False
lasso_cv,0.956 +/- 0.039 (in 3 folds),0.956 +/- 0.039 (in 3 folds),0.976 +/- 0.026 (in 3 folds),0.976 +/- 0.026 (in 3 folds),0.778 +/- 0.010 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.778,0.0,disease.separate_past_exposures,284,0,284,0.0,True
lasso_cv.decision_thresholds_tuned,0.956 +/- 0.039 (in 3 folds),0.956 +/- 0.039 (in 3 folds),0.976 +/- 0.026 (in 3 folds),0.976 +/- 0.026 (in 3 folds),0.915 +/- 0.056 (in 3 folds),0.758 +/- 0.159 (in 3 folds),0.915,0.755,disease.separate_past_exposures,284,0,284,0.0,False
elasticnet_cv,0.956 +/- 0.039 (in 3 folds),0.956 +/- 0.039 (in 3 folds),0.982 +/- 0.016 (in 3 folds),0.982 +/- 0.016 (in 3 folds),0.813 +/- 0.071 (in 3 folds),0.221 +/- 0.383 (in 3 folds),0.813,0.358,disease.separate_past_exposures,284,0,284,0.0,False
elasticnet_cv.decision_thresholds_tuned,0.956 +/- 0.039 (in 3 folds),0.956 +/- 0.039 (in 3 folds),0.982 +/- 0.016 (in 3 folds),0.982 +/- 0.016 (in 3 folds),0.940 +/- 0.038 (in 3 folds),0.819 +/- 0.115 (in 3 folds),0.94,0.823,disease.separate_past_exposures,284,0,284,0.0,False


/users/maximz/code/boyd-immune-repertoire-classification/out/repertoire_stats/BCR/covid_vs_healthy/train_smaller_model.compare_model_scores.test_set_performance.tsv


GeneLocus.BCR TargetObsColumnEnum.hiv_vs_healthy --> /users/maximz/code/boyd-immune-repertoire-classification/out/repertoire_stats/BCR/hiv_vs_healthy


Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,Global evaluation column name global,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
lasso_multiclass,0.982 +/- 0.009 (in 3 folds),0.982 +/- 0.009 (in 3 folds),0.992 +/- 0.003 (in 3 folds),0.992 +/- 0.003 (in 3 folds),0.938 +/- 0.018 (in 3 folds),0.855 +/- 0.040 (in 3 folds),0.937,0.854,disease.separate_past_exposures,319,0,319,0.0,False
lasso_multiclass.decision_thresholds_tuned,0.982 +/- 0.009 (in 3 folds),0.982 +/- 0.009 (in 3 folds),0.992 +/- 0.003 (in 3 folds),0.992 +/- 0.003 (in 3 folds),0.931 +/- 0.013 (in 3 folds),0.840 +/- 0.027 (in 3 folds),0.931,0.839,disease.separate_past_exposures,319,0,319,0.0,False
lasso_cv,0.979 +/- 0.005 (in 3 folds),0.979 +/- 0.005 (in 3 folds),0.991 +/- 0.002 (in 3 folds),0.991 +/- 0.002 (in 3 folds),0.931 +/- 0.016 (in 3 folds),0.836 +/- 0.038 (in 3 folds),0.931,0.836,disease.separate_past_exposures,319,0,319,0.0,False
lasso_cv.decision_thresholds_tuned,0.979 +/- 0.005 (in 3 folds),0.979 +/- 0.005 (in 3 folds),0.991 +/- 0.002 (in 3 folds),0.991 +/- 0.002 (in 3 folds),0.915 +/- 0.032 (in 3 folds),0.809 +/- 0.061 (in 3 folds),0.915,0.804,disease.separate_past_exposures,319,0,319,0.0,False
elasticnet_cv,0.978 +/- 0.007 (in 3 folds),0.978 +/- 0.007 (in 3 folds),0.990 +/- 0.003 (in 3 folds),0.990 +/- 0.003 (in 3 folds),0.928 +/- 0.015 (in 3 folds),0.828 +/- 0.037 (in 3 folds),0.928,0.828,disease.separate_past_exposures,319,0,319,0.0,False
elasticnet_cv.decision_thresholds_tuned,0.978 +/- 0.007 (in 3 folds),0.978 +/- 0.007 (in 3 folds),0.990 +/- 0.003 (in 3 folds),0.990 +/- 0.003 (in 3 folds),0.919 +/- 0.023 (in 3 folds),0.814 +/- 0.049 (in 3 folds),0.918,0.81,disease.separate_past_exposures,319,0,319,0.0,False
rf_multiclass,0.968 +/- 0.009 (in 3 folds),0.968 +/- 0.009 (in 3 folds),0.985 +/- 0.004 (in 3 folds),0.985 +/- 0.004 (in 3 folds),0.915 +/- 0.015 (in 3 folds),0.800 +/- 0.036 (in 3 folds),0.915,0.799,disease.separate_past_exposures,319,0,319,0.0,False
rf_multiclass.decision_thresholds_tuned,0.968 +/- 0.009 (in 3 folds),0.968 +/- 0.009 (in 3 folds),0.985 +/- 0.004 (in 3 folds),0.985 +/- 0.004 (in 3 folds),0.893 +/- 0.021 (in 3 folds),0.772 +/- 0.015 (in 3 folds),0.893,0.765,disease.separate_past_exposures,319,0,319,0.0,False
linearsvm_ovr,0.967 +/- 0.016 (in 3 folds),0.967 +/- 0.016 (in 3 folds),0.985 +/- 0.007 (in 3 folds),0.985 +/- 0.007 (in 3 folds),0.913 +/- 0.031 (in 3 folds),0.800 +/- 0.068 (in 3 folds),0.912,0.798,disease.separate_past_exposures,319,0,319,0.0,False
linearsvm_ovr.decision_thresholds_tuned,0.967 +/- 0.016 (in 3 folds),0.967 +/- 0.016 (in 3 folds),0.985 +/- 0.007 (in 3 folds),0.985 +/- 0.007 (in 3 folds),0.903 +/- 0.062 (in 3 folds),0.804 +/- 0.095 (in 3 folds),0.903,0.783,disease.separate_past_exposures,319,0,319,0.0,False


/users/maximz/code/boyd-immune-repertoire-classification/out/repertoire_stats/BCR/hiv_vs_healthy/train_smaller_model.compare_model_scores.test_set_performance.tsv


GeneLocus.BCR TargetObsColumnEnum.lupus_vs_healthy --> /users/maximz/code/boyd-immune-repertoire-classification/out/repertoire_stats/BCR/lupus_vs_healthy


Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,Global evaluation column name global,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
elasticnet_cv,0.914 +/- 0.015 (in 3 folds),0.914 +/- 0.015 (in 3 folds),0.873 +/- 0.019 (in 3 folds),0.873 +/- 0.019 (in 3 folds),0.871 +/- 0.008 (in 3 folds),0.688 +/- 0.025 (in 3 folds),0.871,0.688,disease.separate_past_exposures,319,0,319,0.0,False
elasticnet_cv.decision_thresholds_tuned,0.914 +/- 0.015 (in 3 folds),0.914 +/- 0.015 (in 3 folds),0.873 +/- 0.019 (in 3 folds),0.873 +/- 0.019 (in 3 folds),0.859 +/- 0.013 (in 3 folds),0.658 +/- 0.037 (in 3 folds),0.859,0.656,disease.separate_past_exposures,319,0,319,0.0,False
lasso_multiclass,0.914 +/- 0.010 (in 3 folds),0.914 +/- 0.010 (in 3 folds),0.867 +/- 0.017 (in 3 folds),0.867 +/- 0.017 (in 3 folds),0.850 +/- 0.014 (in 3 folds),0.655 +/- 0.022 (in 3 folds),0.85,0.653,disease.separate_past_exposures,319,0,319,0.0,False
lasso_multiclass.decision_thresholds_tuned,0.914 +/- 0.010 (in 3 folds),0.914 +/- 0.010 (in 3 folds),0.867 +/- 0.017 (in 3 folds),0.867 +/- 0.017 (in 3 folds),0.843 +/- 0.019 (in 3 folds),0.629 +/- 0.041 (in 3 folds),0.843,0.626,disease.separate_past_exposures,319,0,319,0.0,False
ridge_cv,0.905 +/- 0.008 (in 3 folds),0.905 +/- 0.008 (in 3 folds),0.864 +/- 0.006 (in 3 folds),0.864 +/- 0.006 (in 3 folds),0.797 +/- 0.089 (in 3 folds),0.427 +/- 0.370 (in 3 folds),0.796,0.505,disease.separate_past_exposures,319,0,319,0.0,False
ridge_cv.decision_thresholds_tuned,0.905 +/- 0.008 (in 3 folds),0.905 +/- 0.008 (in 3 folds),0.864 +/- 0.006 (in 3 folds),0.864 +/- 0.006 (in 3 folds),0.807 +/- 0.097 (in 3 folds),0.445 +/- 0.386 (in 3 folds),0.806,0.515,disease.separate_past_exposures,319,0,319,0.0,False
lasso_cv,0.903 +/- 0.005 (in 3 folds),0.903 +/- 0.005 (in 3 folds),0.855 +/- 0.017 (in 3 folds),0.855 +/- 0.017 (in 3 folds),0.849 +/- 0.035 (in 3 folds),0.632 +/- 0.091 (in 3 folds),0.85,0.634,disease.separate_past_exposures,319,0,319,0.0,False
lasso_cv.decision_thresholds_tuned,0.903 +/- 0.005 (in 3 folds),0.903 +/- 0.005 (in 3 folds),0.855 +/- 0.017 (in 3 folds),0.855 +/- 0.017 (in 3 folds),0.846 +/- 0.029 (in 3 folds),0.623 +/- 0.080 (in 3 folds),0.846,0.624,disease.separate_past_exposures,319,0,319,0.0,False
linearsvm_ovr,0.899 +/- 0.004 (in 3 folds),0.899 +/- 0.004 (in 3 folds),0.848 +/- 0.013 (in 3 folds),0.848 +/- 0.013 (in 3 folds),0.834 +/- 0.009 (in 3 folds),0.615 +/- 0.017 (in 3 folds),0.834,0.613,disease.separate_past_exposures,319,0,319,0.0,False
linearsvm_ovr.decision_thresholds_tuned,0.899 +/- 0.004 (in 3 folds),0.899 +/- 0.004 (in 3 folds),0.848 +/- 0.013 (in 3 folds),0.848 +/- 0.013 (in 3 folds),0.825 +/- 0.026 (in 3 folds),0.625 +/- 0.049 (in 3 folds),0.824,0.601,disease.separate_past_exposures,319,0,319,0.0,False


/users/maximz/code/boyd-immune-repertoire-classification/out/repertoire_stats/BCR/lupus_vs_healthy/train_smaller_model.compare_model_scores.test_set_performance.tsv


GeneLocus.BCR TargetObsColumnEnum.ethnicity_condensed_healthy_only --> /users/maximz/code/boyd-immune-repertoire-classification/out/repertoire_stats/BCR/ethnicity_condensed_healthy_only


Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
lasso_multiclass,0.758 +/- 0.043 (in 3 folds),0.764 +/- 0.025 (in 3 folds),0.736 +/- 0.029 (in 3 folds),0.737 +/- 0.023 (in 3 folds),0.624 +/- 0.016 (in 3 folds),0.375 +/- 0.049 (in 3 folds),0.623,0.375,191,0,191,0.0,False
lasso_multiclass.decision_thresholds_tuned,0.758 +/- 0.043 (in 3 folds),0.764 +/- 0.025 (in 3 folds),0.736 +/- 0.029 (in 3 folds),0.737 +/- 0.023 (in 3 folds),0.700 +/- 0.030 (in 3 folds),0.457 +/- 0.024 (in 3 folds),0.702,0.463,191,0,191,0.0,False
elasticnet_cv,0.729 +/- 0.017 (in 3 folds),0.737 +/- 0.006 (in 3 folds),0.735 +/- 0.016 (in 3 folds),0.747 +/- 0.006 (in 3 folds),0.567 +/- 0.081 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.571,0.0,191,0,191,0.0,True
elasticnet_cv.decision_thresholds_tuned,0.729 +/- 0.017 (in 3 folds),0.737 +/- 0.006 (in 3 folds),0.735 +/- 0.016 (in 3 folds),0.747 +/- 0.006 (in 3 folds),0.714 +/- 0.066 (in 3 folds),0.498 +/- 0.106 (in 3 folds),0.717,0.497,191,0,191,0.0,True
lasso_cv,0.723 +/- 0.028 (in 3 folds),0.725 +/- 0.021 (in 3 folds),0.730 +/- 0.030 (in 3 folds),0.738 +/- 0.022 (in 3 folds),0.567 +/- 0.081 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.571,0.0,191,0,191,0.0,True
lasso_cv.decision_thresholds_tuned,0.723 +/- 0.028 (in 3 folds),0.725 +/- 0.021 (in 3 folds),0.730 +/- 0.030 (in 3 folds),0.738 +/- 0.022 (in 3 folds),0.720 +/- 0.044 (in 3 folds),0.505 +/- 0.082 (in 3 folds),0.723,0.508,191,0,191,0.0,True
rf_multiclass,0.712 +/- 0.028 (in 3 folds),0.704 +/- 0.079 (in 3 folds),0.729 +/- 0.054 (in 3 folds),0.723 +/- 0.078 (in 3 folds),0.705 +/- 0.038 (in 3 folds),0.479 +/- 0.026 (in 3 folds),0.707,0.483,191,0,191,0.0,True
rf_multiclass.decision_thresholds_tuned,0.712 +/- 0.028 (in 3 folds),0.704 +/- 0.079 (in 3 folds),0.729 +/- 0.054 (in 3 folds),0.723 +/- 0.078 (in 3 folds),0.738 +/- 0.031 (in 3 folds),0.536 +/- 0.108 (in 3 folds),0.738,0.531,191,0,191,0.0,True
linearsvm_ovr,0.700 +/- 0.050 (in 3 folds),0.689 +/- 0.017 (in 3 folds),0.703 +/- 0.016 (in 3 folds),0.687 +/- 0.018 (in 3 folds),0.624 +/- 0.029 (in 3 folds),0.377 +/- 0.086 (in 3 folds),0.623,0.376,191,0,191,0.0,False
linearsvm_ovr.decision_thresholds_tuned,0.700 +/- 0.050 (in 3 folds),0.689 +/- 0.017 (in 3 folds),0.703 +/- 0.016 (in 3 folds),0.687 +/- 0.018 (in 3 folds),0.651 +/- 0.048 (in 3 folds),0.410 +/- 0.094 (in 3 folds),0.649,0.381,191,0,191,0.0,True


/users/maximz/code/boyd-immune-repertoire-classification/out/repertoire_stats/BCR/ethnicity_condensed_healthy_only/train_smaller_model.compare_model_scores.test_set_performance.tsv














GeneLocus.BCR TargetObsColumnEnum.age_group_healthy_only --> /users/maximz/code/boyd-immune-repertoire-classification/out/repertoire_stats/BCR/age_group_healthy_only






















































































































































































































Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
ridge_cv,0.665 +/- 0.050 (in 3 folds),0.661 +/- 0.045 (in 3 folds),0.690 +/- 0.016 (in 3 folds),0.680 +/- 0.005 (in 3 folds),0.160 +/- 0.060 (in 3 folds),0.033 +/- 0.057 (in 3 folds),0.157,-0.042,191,0,191,0.0,True
ridge_cv.decision_thresholds_tuned,0.665 +/- 0.050 (in 3 folds),0.661 +/- 0.045 (in 3 folds),0.690 +/- 0.016 (in 3 folds),0.680 +/- 0.005 (in 3 folds),0.357 +/- 0.124 (in 3 folds),0.224 +/- 0.133 (in 3 folds),0.351,0.213,191,0,191,0.0,True
lasso_multiclass,0.665 +/- 0.025 (in 3 folds),0.663 +/- 0.018 (in 3 folds),0.693 +/- 0.003 (in 3 folds),0.681 +/- 0.010 (in 3 folds),0.340 +/- 0.021 (in 3 folds),0.228 +/- 0.021 (in 3 folds),0.34,0.213,191,0,191,0.0,False
lasso_multiclass.decision_thresholds_tuned,0.665 +/- 0.025 (in 3 folds),0.663 +/- 0.018 (in 3 folds),0.693 +/- 0.003 (in 3 folds),0.681 +/- 0.010 (in 3 folds),0.324 +/- 0.044 (in 3 folds),0.207 +/- 0.060 (in 3 folds),0.325,0.189,191,0,191,0.0,True
linearsvm_ovr,0.645 +/- 0.004 (in 3 folds),0.642 +/- 0.003 (in 3 folds),0.677 +/- 0.005 (in 3 folds),0.671 +/- 0.012 (in 3 folds),0.288 +/- 0.043 (in 3 folds),0.165 +/- 0.046 (in 3 folds),0.288,0.147,191,0,191,0.0,False
linearsvm_ovr.decision_thresholds_tuned,0.645 +/- 0.004 (in 3 folds),0.642 +/- 0.003 (in 3 folds),0.677 +/- 0.005 (in 3 folds),0.671 +/- 0.012 (in 3 folds),0.320 +/- 0.029 (in 3 folds),0.206 +/- 0.060 (in 3 folds),0.319,0.203,191,0,191,0.0,False
rf_multiclass,0.627 +/- 0.028 (in 3 folds),0.622 +/- 0.022 (in 3 folds),0.670 +/- 0.013 (in 3 folds),0.662 +/- 0.006 (in 3 folds),0.292 +/- 0.076 (in 3 folds),0.188 +/- 0.068 (in 3 folds),0.288,0.138,191,0,191,0.0,True
rf_multiclass.decision_thresholds_tuned,0.627 +/- 0.028 (in 3 folds),0.622 +/- 0.022 (in 3 folds),0.670 +/- 0.013 (in 3 folds),0.662 +/- 0.006 (in 3 folds),0.252 +/- 0.024 (in 3 folds),0.149 +/- 0.040 (in 3 folds),0.251,0.104,191,0,191,0.0,True
elasticnet_cv,0.610 +/- 0.011 (in 3 folds),0.609 +/- 0.019 (in 3 folds),0.662 +/- 0.033 (in 3 folds),0.657 +/- 0.037 (in 3 folds),0.177 +/- 0.020 (in 3 folds),0.145 +/- 0.047 (in 3 folds),0.178,0.001,191,0,191,0.0,True
elasticnet_cv.decision_thresholds_tuned,0.610 +/- 0.011 (in 3 folds),0.609 +/- 0.019 (in 3 folds),0.662 +/- 0.033 (in 3 folds),0.657 +/- 0.037 (in 3 folds),0.244 +/- 0.048 (in 3 folds),0.099 +/- 0.047 (in 3 folds),0.246,0.091,191,0,191,0.0,True


/users/maximz/code/boyd-immune-repertoire-classification/out/repertoire_stats/BCR/age_group_healthy_only/train_smaller_model.compare_model_scores.test_set_performance.tsv


GeneLocus.BCR TargetObsColumnEnum.age_group_binary_healthy_only --> /users/maximz/code/boyd-immune-repertoire-classification/out/repertoire_stats/BCR/age_group_binary_healthy_only


Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
rf_multiclass,0.719 +/- 0.026 (in 3 folds),0.719 +/- 0.026 (in 3 folds),0.825 +/- 0.072 (in 3 folds),0.825 +/- 0.072 (in 3 folds),0.669 +/- 0.028 (in 3 folds),0.271 +/- 0.091 (in 3 folds),0.67,0.25,191,0,191,0.0,False
rf_multiclass.decision_thresholds_tuned,0.719 +/- 0.026 (in 3 folds),0.719 +/- 0.026 (in 3 folds),0.825 +/- 0.072 (in 3 folds),0.825 +/- 0.072 (in 3 folds),0.674 +/- 0.033 (in 3 folds),0.306 +/- 0.041 (in 3 folds),0.675,0.301,191,0,191,0.0,False
lasso_multiclass,0.679 +/- 0.042 (in 3 folds),0.679 +/- 0.042 (in 3 folds),0.810 +/- 0.074 (in 3 folds),0.810 +/- 0.074 (in 3 folds),0.675 +/- 0.006 (in 3 folds),0.341 +/- 0.032 (in 3 folds),0.675,0.333,191,0,191,0.0,False
lasso_multiclass.decision_thresholds_tuned,0.679 +/- 0.042 (in 3 folds),0.679 +/- 0.042 (in 3 folds),0.810 +/- 0.074 (in 3 folds),0.810 +/- 0.074 (in 3 folds),0.571 +/- 0.064 (in 3 folds),0.165 +/- 0.042 (in 3 folds),0.571,0.178,191,0,191,0.0,False
xgboost,0.676 +/- 0.007 (in 3 folds),0.676 +/- 0.007 (in 3 folds),0.804 +/- 0.039 (in 3 folds),0.804 +/- 0.039 (in 3 folds),0.654 +/- 0.015 (in 3 folds),0.258 +/- 0.006 (in 3 folds),0.654,0.256,191,0,191,0.0,False
xgboost.decision_thresholds_tuned,0.676 +/- 0.007 (in 3 folds),0.676 +/- 0.007 (in 3 folds),0.804 +/- 0.039 (in 3 folds),0.804 +/- 0.039 (in 3 folds),0.636 +/- 0.058 (in 3 folds),0.292 +/- 0.036 (in 3 folds),0.639,0.298,191,0,191,0.0,False
linearsvm_ovr,0.675 +/- 0.019 (in 3 folds),0.675 +/- 0.019 (in 3 folds),0.811 +/- 0.045 (in 3 folds),0.811 +/- 0.045 (in 3 folds),0.617 +/- 0.044 (in 3 folds),0.208 +/- 0.063 (in 3 folds),0.618,0.194,191,0,191,0.0,False
linearsvm_ovr.decision_thresholds_tuned,0.675 +/- 0.019 (in 3 folds),0.675 +/- 0.019 (in 3 folds),0.811 +/- 0.045 (in 3 folds),0.811 +/- 0.045 (in 3 folds),0.562 +/- 0.087 (in 3 folds),0.235 +/- 0.100 (in 3 folds),0.56,0.175,191,0,191,0.0,False
elasticnet_cv,0.599 +/- 0.086 (in 3 folds),0.599 +/- 0.086 (in 3 folds),0.729 +/- 0.050 (in 3 folds),0.729 +/- 0.050 (in 3 folds),0.620 +/- 0.065 (in 3 folds),-0.036 +/- 0.080 (in 3 folds),0.623,-0.035,191,0,191,0.0,False
elasticnet_cv.decision_thresholds_tuned,0.599 +/- 0.086 (in 3 folds),0.599 +/- 0.086 (in 3 folds),0.729 +/- 0.050 (in 3 folds),0.729 +/- 0.050 (in 3 folds),0.556 +/- 0.132 (in 3 folds),0.100 +/- 0.086 (in 3 folds),0.555,0.107,191,0,191,0.0,False


/users/maximz/code/boyd-immune-repertoire-classification/out/repertoire_stats/BCR/age_group_binary_healthy_only/train_smaller_model.compare_model_scores.test_set_performance.tsv


GeneLocus.BCR TargetObsColumnEnum.sex_healthy_only --> /users/maximz/code/boyd-immune-repertoire-classification/out/repertoire_stats/BCR/sex_healthy_only


Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
rf_multiclass,0.555 +/- 0.036 (in 3 folds),0.555 +/- 0.036 (in 3 folds),0.554 +/- 0.085 (in 3 folds),0.554 +/- 0.085 (in 3 folds),0.548 +/- 0.076 (in 3 folds),0.105 +/- 0.110 (in 3 folds),0.545,0.099,191,0,191,0.0,False
rf_multiclass.decision_thresholds_tuned,0.555 +/- 0.036 (in 3 folds),0.555 +/- 0.036 (in 3 folds),0.554 +/- 0.085 (in 3 folds),0.554 +/- 0.085 (in 3 folds),0.541 +/- 0.042 (in 3 folds),0.040 +/- 0.047 (in 3 folds),0.539,0.08,191,0,191,0.0,False
lasso_multiclass,0.519 +/- 0.022 (in 3 folds),0.519 +/- 0.022 (in 3 folds),0.544 +/- 0.052 (in 3 folds),0.544 +/- 0.052 (in 3 folds),0.504 +/- 0.033 (in 3 folds),0.022 +/- 0.049 (in 3 folds),0.503,0.011,191,0,191,0.0,False
lasso_multiclass.decision_thresholds_tuned,0.519 +/- 0.022 (in 3 folds),0.519 +/- 0.022 (in 3 folds),0.544 +/- 0.052 (in 3 folds),0.544 +/- 0.052 (in 3 folds),0.551 +/- 0.052 (in 3 folds),0.095 +/- 0.100 (in 3 folds),0.55,0.098,191,0,191,0.0,False
xgboost,0.517 +/- 0.067 (in 3 folds),0.517 +/- 0.067 (in 3 folds),0.524 +/- 0.043 (in 3 folds),0.524 +/- 0.043 (in 3 folds),0.525 +/- 0.041 (in 3 folds),0.058 +/- 0.098 (in 3 folds),0.524,0.056,191,0,191,0.0,False
xgboost.decision_thresholds_tuned,0.517 +/- 0.067 (in 3 folds),0.517 +/- 0.067 (in 3 folds),0.524 +/- 0.043 (in 3 folds),0.524 +/- 0.043 (in 3 folds),0.480 +/- 0.063 (in 3 folds),-0.015 +/- 0.093 (in 3 folds),0.476,-0.032,191,0,191,0.0,False
linearsvm_ovr,0.515 +/- 0.030 (in 3 folds),0.515 +/- 0.030 (in 3 folds),0.541 +/- 0.069 (in 3 folds),0.541 +/- 0.069 (in 3 folds),0.488 +/- 0.036 (in 3 folds),-0.017 +/- 0.073 (in 3 folds),0.487,-0.024,191,0,191,0.0,False
linearsvm_ovr.decision_thresholds_tuned,0.515 +/- 0.030 (in 3 folds),0.515 +/- 0.030 (in 3 folds),0.541 +/- 0.069 (in 3 folds),0.541 +/- 0.069 (in 3 folds),0.495 +/- 0.053 (in 3 folds),-0.028 +/- 0.083 (in 3 folds),0.492,-0.01,191,0,191,0.0,False
ridge_cv,0.512 +/- 0.021 (in 3 folds),0.512 +/- 0.021 (in 3 folds),0.498 +/- 0.082 (in 3 folds),0.498 +/- 0.082 (in 3 folds),0.498 +/- 0.052 (in 3 folds),0.001 +/- 0.001 (in 3 folds),0.497,-0.002,191,0,191,0.0,False
ridge_cv.decision_thresholds_tuned,0.512 +/- 0.021 (in 3 folds),0.512 +/- 0.021 (in 3 folds),0.498 +/- 0.082 (in 3 folds),0.498 +/- 0.082 (in 3 folds),0.490 +/- 0.069 (in 3 folds),0.049 +/- 0.085 (in 3 folds),0.487,0.07,191,0,191,0.0,False


/users/maximz/code/boyd-immune-repertoire-classification/out/repertoire_stats/BCR/sex_healthy_only/train_smaller_model.compare_model_scores.test_set_performance.tsv


2022-12-31 04:27:23,178 - malid.external.scratch_cache - INFO - Reading network file from local machine cache: /users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/embedded/unirep_fine_tuned/anndatas_scaled/TCR/fold.0.validation.h5ad -> /srv/scratch/maximz/cache/45c3001c6b505500991147d20f972274565d8728487b87ce1a92bfe9.0.validation.h5ad


GeneLocus.TCR
Only considering the two last: ['.validation', '.h5ad'].


Only considering the two last: ['.validation', '.h5ad'].








2022-12-31 04:36:20,268 - malid.helpers - INFO - Target TargetObsColumnEnum.covid_vs_healthy: filtering to specimens from diseases ['Covid19', 'Healthy/Background'] only; removed 35 specimens




2022-12-31 04:38:56,095 - malid.helpers - INFO - Target TargetObsColumnEnum.hiv_vs_healthy: filtering to specimens from diseases ['HIV', 'Healthy/Background'] only; removed 27 specimens




2022-12-31 04:41:48,456 - malid.helpers - INFO - Target TargetObsColumnEnum.lupus_vs_healthy: filtering to specimens from diseases ['Lupus', 'Healthy/Background'] only; removed 34 specimens




2022-12-31 04:44:58,152 - malid.helpers - INFO - Target TargetObsColumnEnum.ethnicity_condensed_healthy_only: filtered to specimens with defined ethnicity_condensed column - removed 10 specimens (413445 rows)


2022-12-31 04:45:12,779 - malid.helpers - INFO - Target TargetObsColumnEnum.ethnicity_condensed_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 44 specimens




2022-12-31 04:48:00,670 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_healthy_only: filtered to specimens with defined age_group column - removed 1 specimens (11386 rows)


2022-12-31 04:48:16,902 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 47 specimens




2022-12-31 04:52:00,447 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_binary_healthy_only: filtered to specimens with defined age_group_binary column - removed 1 specimens (11386 rows)


2022-12-31 04:52:20,104 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_binary_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 47 specimens
IOStream.flush timed out




2022-12-31 04:55:47,066 - malid.helpers - INFO - Target TargetObsColumnEnum.sex_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 48 specimens


2022-12-31 04:57:43,078 - malid.external.scratch_cache - INFO - Reading network file from local machine cache: /users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/embedded/unirep_fine_tuned/anndatas_scaled/TCR/fold.1.validation.h5ad -> /srv/scratch/maximz/cache/282f72b2420811c056ecfc2ef1dcbf10523046eb9569d7ff2d7c8263.1.validation.h5ad


Only considering the two last: ['.validation', '.h5ad'].


Only considering the two last: ['.validation', '.h5ad'].








2022-12-31 05:07:27,415 - malid.helpers - INFO - Target TargetObsColumnEnum.covid_vs_healthy: filtering to specimens from diseases ['Covid19', 'Healthy/Background'] only; removed 36 specimens




2022-12-31 05:10:09,702 - malid.helpers - INFO - Target TargetObsColumnEnum.hiv_vs_healthy: filtering to specimens from diseases ['HIV', 'Healthy/Background'] only; removed 26 specimens




2022-12-31 05:13:19,166 - malid.helpers - INFO - Target TargetObsColumnEnum.lupus_vs_healthy: filtering to specimens from diseases ['Lupus', 'Healthy/Background'] only; removed 34 specimens




2022-12-31 05:16:34,643 - malid.helpers - INFO - Target TargetObsColumnEnum.ethnicity_condensed_healthy_only: filtered to specimens with defined ethnicity_condensed column - removed 11 specimens (475392 rows)


2022-12-31 05:17:06,529 - malid.helpers - INFO - Target TargetObsColumnEnum.ethnicity_condensed_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 41 specimens




2022-12-31 05:22:26,435 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_healthy_only: filtered to specimens with defined age_group column - removed 1 specimens (18790 rows)


2022-12-31 05:22:46,712 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 47 specimens




2022-12-31 05:26:09,556 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_binary_healthy_only: filtered to specimens with defined age_group_binary column - removed 1 specimens (18790 rows)


2022-12-31 05:26:27,620 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_binary_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 47 specimens




2022-12-31 05:29:14,148 - malid.helpers - INFO - Target TargetObsColumnEnum.sex_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 48 specimens


2022-12-31 05:30:59,428 - malid.external.scratch_cache - INFO - Reading network file from local machine cache: /users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/embedded/unirep_fine_tuned/anndatas_scaled/TCR/fold.2.validation.h5ad -> /srv/scratch/maximz/cache/1ca7b8d5a7e7747e7f0bda4a4f3cb1e09d543670afe9d48fe77350c1.2.validation.h5ad


Only considering the two last: ['.validation', '.h5ad'].


Only considering the two last: ['.validation', '.h5ad'].






2022-12-31 05:36:36,338 - malid.train.training_utils - INFO - Skipping lasso_cv from 2 because file not found: [Errno 2] No such file or directory: '/users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/repertoire_stats/TCR/disease_all_demographics_present/train_smaller_model.lasso_cv.2.joblib'




2022-12-31 05:39:29,356 - malid.helpers - INFO - Target TargetObsColumnEnum.covid_vs_healthy: filtering to specimens from diseases ['Covid19', 'Healthy/Background'] only; removed 35 specimens




2022-12-31 05:42:44,187 - malid.helpers - INFO - Target TargetObsColumnEnum.hiv_vs_healthy: filtering to specimens from diseases ['HIV', 'Healthy/Background'] only; removed 27 specimens




2022-12-31 05:46:12,287 - malid.helpers - INFO - Target TargetObsColumnEnum.lupus_vs_healthy: filtering to specimens from diseases ['Lupus', 'Healthy/Background'] only; removed 34 specimens




2022-12-31 05:49:24,157 - malid.helpers - INFO - Target TargetObsColumnEnum.ethnicity_condensed_healthy_only: filtered to specimens with defined ethnicity_condensed column - removed 11 specimens (476014 rows)


2022-12-31 05:49:40,928 - malid.helpers - INFO - Target TargetObsColumnEnum.ethnicity_condensed_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 42 specimens




2022-12-31 05:52:39,600 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_healthy_only: filtered to specimens with defined age_group column - removed 1 specimens (6847 rows)


2022-12-31 05:52:57,664 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 47 specimens




2022-12-31 05:57:50,945 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_binary_healthy_only: filtered to specimens with defined age_group_binary column - removed 1 specimens (6847 rows)


2022-12-31 05:58:09,255 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_binary_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 47 specimens




2022-12-31 06:00:45,797 - malid.helpers - INFO - Target TargetObsColumnEnum.sex_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 48 specimens


2022-12-31 06:02:24,815 - malid.external.scratch_cache - INFO - Reading network file from local machine cache: /users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/embedded/unirep_fine_tuned/anndatas_scaled/TCR/fold.-1.validation.h5ad -> /srv/scratch/maximz/cache/1985239f55fdf391d2f6c78098bab25182948ad31b330c01c26cb651.-1.validation.h5ad


Only considering the two last: ['.validation', '.h5ad'].


Only considering the two last: ['.validation', '.h5ad'].








2022-12-31 06:30:56,669 - malid.helpers - INFO - Target TargetObsColumnEnum.covid_vs_healthy: filtering to specimens from diseases ['Covid19', 'Healthy/Background'] only; removed 55 specimens




2022-12-31 06:41:16,573 - malid.helpers - INFO - Target TargetObsColumnEnum.hiv_vs_healthy: filtering to specimens from diseases ['HIV', 'Healthy/Background'] only; removed 41 specimens




2022-12-31 06:53:47,411 - malid.helpers - INFO - Target TargetObsColumnEnum.lupus_vs_healthy: filtering to specimens from diseases ['Lupus', 'Healthy/Background'] only; removed 52 specimens




2022-12-31 07:08:51,231 - malid.helpers - INFO - Target TargetObsColumnEnum.ethnicity_condensed_healthy_only: filtered to specimens with defined ethnicity_condensed column - removed 19 specimens (862171 rows)


2022-12-31 07:11:59,170 - malid.helpers - INFO - Target TargetObsColumnEnum.ethnicity_condensed_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 64 specimens




2022-12-31 07:33:12,661 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_healthy_only: filtered to specimens with defined age_group column - removed 1 specimens (6847 rows)


2022-12-31 07:40:25,886 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 73 specimens




2022-12-31 07:59:06,746 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_binary_healthy_only: filtered to specimens with defined age_group_binary column - removed 1 specimens (6847 rows)


2022-12-31 08:00:43,698 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_binary_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 73 specimens




2022-12-31 08:12:47,763 - malid.helpers - INFO - Target TargetObsColumnEnum.sex_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 74 specimens


GeneLocus.TCR TargetObsColumnEnum.disease


Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
lasso_multiclass,0.945 +/- 0.008 (in 3 folds),0.946 +/- 0.006 (in 3 folds),0.934 +/- 0.008 (in 3 folds),0.937 +/- 0.005 (in 3 folds),0.759 +/- 0.036 (in 3 folds),0.669 +/- 0.047 (in 3 folds),0.759,0.667,274,0,274,0.0,False
lasso_multiclass.decision_thresholds_tuned,0.945 +/- 0.008 (in 3 folds),0.946 +/- 0.006 (in 3 folds),0.934 +/- 0.008 (in 3 folds),0.937 +/- 0.005 (in 3 folds),0.821 +/- 0.022 (in 3 folds),0.748 +/- 0.030 (in 3 folds),0.821,0.747,274,0,274,0.0,False
ridge_cv,0.944 +/- 0.018 (in 3 folds),0.945 +/- 0.016 (in 3 folds),0.928 +/- 0.016 (in 3 folds),0.934 +/- 0.012 (in 3 folds),0.474 +/- 0.003 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.474,0.0,274,0,274,0.0,True
ridge_cv.decision_thresholds_tuned,0.944 +/- 0.018 (in 3 folds),0.945 +/- 0.016 (in 3 folds),0.928 +/- 0.016 (in 3 folds),0.934 +/- 0.012 (in 3 folds),0.556 +/- 0.353 (in 3 folds),0.448 +/- 0.393 (in 3 folds),0.555,0.444,274,0,274,0.0,False
linearsvm_ovr,0.943 +/- 0.016 (in 3 folds),0.941 +/- 0.015 (in 3 folds),0.932 +/- 0.013 (in 3 folds),0.932 +/- 0.010 (in 3 folds),0.777 +/- 0.031 (in 3 folds),0.686 +/- 0.043 (in 3 folds),0.777,0.684,274,0,274,0.0,False
linearsvm_ovr.decision_thresholds_tuned,0.943 +/- 0.016 (in 3 folds),0.941 +/- 0.015 (in 3 folds),0.932 +/- 0.013 (in 3 folds),0.932 +/- 0.010 (in 3 folds),0.832 +/- 0.044 (in 3 folds),0.764 +/- 0.055 (in 3 folds),0.832,0.754,274,0,274,0.0,False
elasticnet_cv,0.941 +/- 0.015 (in 3 folds),0.941 +/- 0.013 (in 3 folds),0.912 +/- 0.010 (in 3 folds),0.917 +/- 0.007 (in 3 folds),0.730 +/- 0.060 (in 3 folds),0.595 +/- 0.103 (in 3 folds),0.73,0.594,274,0,274,0.0,False
elasticnet_cv.decision_thresholds_tuned,0.941 +/- 0.015 (in 3 folds),0.941 +/- 0.013 (in 3 folds),0.912 +/- 0.010 (in 3 folds),0.917 +/- 0.007 (in 3 folds),0.825 +/- 0.039 (in 3 folds),0.760 +/- 0.052 (in 3 folds),0.825,0.758,274,0,274,0.0,False
rf_multiclass,0.936 +/- 0.013 (in 3 folds),0.938 +/- 0.011 (in 3 folds),0.926 +/- 0.009 (in 3 folds),0.931 +/- 0.008 (in 3 folds),0.752 +/- 0.040 (in 3 folds),0.629 +/- 0.059 (in 3 folds),0.752,0.627,274,0,274,0.0,False
rf_multiclass.decision_thresholds_tuned,0.936 +/- 0.013 (in 3 folds),0.938 +/- 0.011 (in 3 folds),0.926 +/- 0.009 (in 3 folds),0.931 +/- 0.008 (in 3 folds),0.825 +/- 0.022 (in 3 folds),0.751 +/- 0.029 (in 3 folds),0.825,0.749,274,0,274,0.0,False


2022-12-31 08:14:14,140 - malid.external.model_evaluation - INFO - Removing ('lasso_cv', 0) because lasso_cv is incomplete.


2022-12-31 08:14:14,142 - malid.external.model_evaluation - INFO - Removing ('lasso_cv', 1) because lasso_cv is incomplete.


2022-12-31 08:14:14,143 - malid.external.model_evaluation - INFO - Removing ('lasso_cv.decision_thresholds_tuned', 0) because lasso_cv.decision_thresholds_tuned is incomplete.


2022-12-31 08:14:14,144 - malid.external.model_evaluation - INFO - Removing ('lasso_cv.decision_thresholds_tuned', 1) because lasso_cv.decision_thresholds_tuned is incomplete.


GeneLocus.TCR TargetObsColumnEnum.disease_all_demographics_present


Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
linearsvm_ovr,0.946 +/- 0.027 (in 3 folds),0.947 +/- 0.028 (in 3 folds),0.942 +/- 0.027 (in 3 folds),0.944 +/- 0.026 (in 3 folds),0.808 +/- 0.033 (in 3 folds),0.723 +/- 0.057 (in 3 folds),0.808,0.724,240,0,240,0.0,False
linearsvm_ovr.decision_thresholds_tuned,0.946 +/- 0.027 (in 3 folds),0.947 +/- 0.028 (in 3 folds),0.942 +/- 0.027 (in 3 folds),0.944 +/- 0.026 (in 3 folds),0.858 +/- 0.027 (in 3 folds),0.806 +/- 0.033 (in 3 folds),0.858,0.804,240,0,240,0.0,False
ridge_cv,0.944 +/- 0.026 (in 3 folds),0.944 +/- 0.025 (in 3 folds),0.932 +/- 0.029 (in 3 folds),0.936 +/- 0.028 (in 3 folds),0.483 +/- 0.009 (in 3 folds),0.039 +/- 0.068 (in 3 folds),0.483,0.07,240,0,240,0.0,True
ridge_cv.decision_thresholds_tuned,0.944 +/- 0.026 (in 3 folds),0.944 +/- 0.025 (in 3 folds),0.932 +/- 0.029 (in 3 folds),0.936 +/- 0.028 (in 3 folds),0.772 +/- 0.160 (in 3 folds),0.678 +/- 0.227 (in 3 folds),0.771,0.675,240,0,240,0.0,False
lasso_multiclass,0.944 +/- 0.024 (in 3 folds),0.946 +/- 0.022 (in 3 folds),0.940 +/- 0.016 (in 3 folds),0.944 +/- 0.015 (in 3 folds),0.817 +/- 0.033 (in 3 folds),0.741 +/- 0.051 (in 3 folds),0.817,0.741,240,0,240,0.0,False
lasso_multiclass.decision_thresholds_tuned,0.944 +/- 0.024 (in 3 folds),0.946 +/- 0.022 (in 3 folds),0.940 +/- 0.016 (in 3 folds),0.944 +/- 0.015 (in 3 folds),0.854 +/- 0.020 (in 3 folds),0.799 +/- 0.025 (in 3 folds),0.854,0.798,240,0,240,0.0,False
elasticnet_cv,0.936 +/- 0.031 (in 3 folds),0.938 +/- 0.029 (in 3 folds),0.922 +/- 0.029 (in 3 folds),0.926 +/- 0.028 (in 3 folds),0.758 +/- 0.065 (in 3 folds),0.634 +/- 0.118 (in 3 folds),0.758,0.636,240,0,240,0.0,False
elasticnet_cv.decision_thresholds_tuned,0.936 +/- 0.031 (in 3 folds),0.938 +/- 0.029 (in 3 folds),0.922 +/- 0.029 (in 3 folds),0.926 +/- 0.028 (in 3 folds),0.837 +/- 0.022 (in 3 folds),0.777 +/- 0.032 (in 3 folds),0.838,0.777,240,0,240,0.0,False
rf_multiclass,0.925 +/- 0.029 (in 3 folds),0.928 +/- 0.024 (in 3 folds),0.910 +/- 0.030 (in 3 folds),0.918 +/- 0.025 (in 3 folds),0.771 +/- 0.052 (in 3 folds),0.655 +/- 0.085 (in 3 folds),0.771,0.656,240,0,240,0.0,False
rf_multiclass.decision_thresholds_tuned,0.925 +/- 0.029 (in 3 folds),0.928 +/- 0.024 (in 3 folds),0.910 +/- 0.030 (in 3 folds),0.918 +/- 0.025 (in 3 folds),0.821 +/- 0.048 (in 3 folds),0.753 +/- 0.063 (in 3 folds),0.821,0.75,240,0,240,0.0,False


GeneLocus.TCR TargetObsColumnEnum.covid_vs_healthy


Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
ridge_cv,0.997 +/- 0.003 (in 3 folds),0.997 +/- 0.003 (in 3 folds),0.999 +/- 0.001 (in 3 folds),0.999 +/- 0.001 (in 3 folds),0.803 +/- 0.049 (in 3 folds),0.190 +/- 0.329 (in 3 folds),0.804,0.324,168,0,168,0.0,False
ridge_cv.decision_thresholds_tuned,0.997 +/- 0.003 (in 3 folds),0.997 +/- 0.003 (in 3 folds),0.999 +/- 0.001 (in 3 folds),0.999 +/- 0.001 (in 3 folds),0.982 +/- 0.018 (in 3 folds),0.949 +/- 0.053 (in 3 folds),0.982,0.95,168,0,168,0.0,False
lasso_multiclass,0.991 +/- 0.005 (in 3 folds),0.991 +/- 0.005 (in 3 folds),0.997 +/- 0.001 (in 3 folds),0.997 +/- 0.001 (in 3 folds),0.952 +/- 0.028 (in 3 folds),0.861 +/- 0.086 (in 3 folds),0.952,0.862,168,0,168,0.0,False
lasso_multiclass.decision_thresholds_tuned,0.991 +/- 0.005 (in 3 folds),0.991 +/- 0.005 (in 3 folds),0.997 +/- 0.001 (in 3 folds),0.997 +/- 0.001 (in 3 folds),0.964 +/- 0.018 (in 3 folds),0.907 +/- 0.044 (in 3 folds),0.964,0.904,168,0,168,0.0,False
rf_multiclass,0.990 +/- 0.004 (in 3 folds),0.990 +/- 0.004 (in 3 folds),0.997 +/- 0.001 (in 3 folds),0.997 +/- 0.001 (in 3 folds),0.868 +/- 0.069 (in 3 folds),0.578 +/- 0.233 (in 3 folds),0.869,0.595,168,0,168,0.0,False
rf_multiclass.decision_thresholds_tuned,0.990 +/- 0.004 (in 3 folds),0.990 +/- 0.004 (in 3 folds),0.997 +/- 0.001 (in 3 folds),0.997 +/- 0.001 (in 3 folds),0.970 +/- 0.010 (in 3 folds),0.918 +/- 0.025 (in 3 folds),0.97,0.914,168,0,168,0.0,False
elasticnet_cv,0.988 +/- 0.012 (in 3 folds),0.988 +/- 0.012 (in 3 folds),0.997 +/- 0.003 (in 3 folds),0.997 +/- 0.003 (in 3 folds),0.874 +/- 0.084 (in 3 folds),0.577 +/- 0.320 (in 3 folds),0.875,0.613,168,0,168,0.0,False
elasticnet_cv.decision_thresholds_tuned,0.988 +/- 0.012 (in 3 folds),0.988 +/- 0.012 (in 3 folds),0.997 +/- 0.003 (in 3 folds),0.997 +/- 0.003 (in 3 folds),0.964 +/- 0.019 (in 3 folds),0.905 +/- 0.045 (in 3 folds),0.964,0.904,168,0,168,0.0,False
xgboost,0.981 +/- 0.020 (in 3 folds),0.981 +/- 0.020 (in 3 folds),0.995 +/- 0.006 (in 3 folds),0.995 +/- 0.006 (in 3 folds),0.910 +/- 0.048 (in 3 folds),0.727 +/- 0.156 (in 3 folds),0.911,0.732,168,0,168,0.0,False
xgboost.decision_thresholds_tuned,0.981 +/- 0.020 (in 3 folds),0.981 +/- 0.020 (in 3 folds),0.995 +/- 0.006 (in 3 folds),0.995 +/- 0.006 (in 3 folds),0.958 +/- 0.027 (in 3 folds),0.880 +/- 0.081 (in 3 folds),0.958,0.88,168,0,168,0.0,False


GeneLocus.TCR TargetObsColumnEnum.hiv_vs_healthy


Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
lasso_multiclass,0.932 +/- 0.036 (in 3 folds),0.932 +/- 0.036 (in 3 folds),0.972 +/- 0.015 (in 3 folds),0.972 +/- 0.015 (in 3 folds),0.851 +/- 0.017 (in 3 folds),0.698 +/- 0.055 (in 3 folds),0.851,0.695,194,0,194,0.0,False
lasso_multiclass.decision_thresholds_tuned,0.932 +/- 0.036 (in 3 folds),0.932 +/- 0.036 (in 3 folds),0.972 +/- 0.015 (in 3 folds),0.972 +/- 0.015 (in 3 folds),0.887 +/- 0.046 (in 3 folds),0.779 +/- 0.069 (in 3 folds),0.887,0.766,194,0,194,0.0,False
linearsvm_ovr,0.932 +/- 0.028 (in 3 folds),0.932 +/- 0.028 (in 3 folds),0.971 +/- 0.012 (in 3 folds),0.971 +/- 0.012 (in 3 folds),0.861 +/- 0.030 (in 3 folds),0.709 +/- 0.078 (in 3 folds),0.861,0.708,194,0,194,0.0,False
linearsvm_ovr.decision_thresholds_tuned,0.932 +/- 0.028 (in 3 folds),0.932 +/- 0.028 (in 3 folds),0.971 +/- 0.012 (in 3 folds),0.971 +/- 0.012 (in 3 folds),0.866 +/- 0.038 (in 3 folds),0.726 +/- 0.060 (in 3 folds),0.866,0.722,194,0,194,0.0,False
lasso_cv,0.924 +/- 0.022 (in 3 folds),0.924 +/- 0.022 (in 3 folds),0.968 +/- 0.009 (in 3 folds),0.968 +/- 0.009 (in 3 folds),0.845 +/- 0.014 (in 3 folds),0.680 +/- 0.056 (in 3 folds),0.845,0.677,194,0,194,0.0,False
lasso_cv.decision_thresholds_tuned,0.924 +/- 0.022 (in 3 folds),0.924 +/- 0.022 (in 3 folds),0.968 +/- 0.009 (in 3 folds),0.968 +/- 0.009 (in 3 folds),0.861 +/- 0.026 (in 3 folds),0.742 +/- 0.030 (in 3 folds),0.861,0.74,194,0,194,0.0,False
elasticnet_cv,0.922 +/- 0.026 (in 3 folds),0.922 +/- 0.026 (in 3 folds),0.967 +/- 0.011 (in 3 folds),0.967 +/- 0.011 (in 3 folds),0.845 +/- 0.014 (in 3 folds),0.680 +/- 0.056 (in 3 folds),0.845,0.677,194,0,194,0.0,False
elasticnet_cv.decision_thresholds_tuned,0.922 +/- 0.026 (in 3 folds),0.922 +/- 0.026 (in 3 folds),0.967 +/- 0.011 (in 3 folds),0.967 +/- 0.011 (in 3 folds),0.856 +/- 0.031 (in 3 folds),0.733 +/- 0.056 (in 3 folds),0.856,0.732,194,0,194,0.0,False
ridge_cv,0.921 +/- 0.036 (in 3 folds),0.921 +/- 0.036 (in 3 folds),0.967 +/- 0.014 (in 3 folds),0.967 +/- 0.014 (in 3 folds),0.753 +/- 0.081 (in 3 folds),0.348 +/- 0.304 (in 3 folds),0.753,0.4,194,0,194,0.0,False
ridge_cv.decision_thresholds_tuned,0.921 +/- 0.036 (in 3 folds),0.921 +/- 0.036 (in 3 folds),0.967 +/- 0.014 (in 3 folds),0.967 +/- 0.014 (in 3 folds),0.815 +/- 0.136 (in 3 folds),0.507 +/- 0.445 (in 3 folds),0.814,0.563,194,0,194,0.0,False


GeneLocus.TCR TargetObsColumnEnum.lupus_vs_healthy


Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
elasticnet_cv,0.985 +/- 0.010 (in 3 folds),0.985 +/- 0.010 (in 3 folds),0.960 +/- 0.023 (in 3 folds),0.960 +/- 0.023 (in 3 folds),0.918 +/- 0.037 (in 3 folds),0.773 +/- 0.105 (in 3 folds),0.919,0.773,172,0,172,0.0,False
elasticnet_cv.decision_thresholds_tuned,0.985 +/- 0.010 (in 3 folds),0.985 +/- 0.010 (in 3 folds),0.960 +/- 0.023 (in 3 folds),0.960 +/- 0.023 (in 3 folds),0.953 +/- 0.020 (in 3 folds),0.877 +/- 0.057 (in 3 folds),0.953,0.876,172,0,172,0.0,False
rf_multiclass,0.984 +/- 0.013 (in 3 folds),0.984 +/- 0.013 (in 3 folds),0.962 +/- 0.029 (in 3 folds),0.962 +/- 0.029 (in 3 folds),0.913 +/- 0.047 (in 3 folds),0.755 +/- 0.135 (in 3 folds),0.913,0.756,172,0,172,0.0,False
rf_multiclass.decision_thresholds_tuned,0.984 +/- 0.013 (in 3 folds),0.984 +/- 0.013 (in 3 folds),0.962 +/- 0.029 (in 3 folds),0.962 +/- 0.029 (in 3 folds),0.965 +/- 0.018 (in 3 folds),0.905 +/- 0.050 (in 3 folds),0.965,0.904,172,0,172,0.0,False
lasso_cv,0.984 +/- 0.008 (in 3 folds),0.984 +/- 0.008 (in 3 folds),0.954 +/- 0.022 (in 3 folds),0.954 +/- 0.022 (in 3 folds),0.913 +/- 0.047 (in 3 folds),0.753 +/- 0.143 (in 3 folds),0.913,0.755,172,0,172,0.0,False
lasso_cv.decision_thresholds_tuned,0.984 +/- 0.008 (in 3 folds),0.984 +/- 0.008 (in 3 folds),0.954 +/- 0.022 (in 3 folds),0.954 +/- 0.022 (in 3 folds),0.959 +/- 0.010 (in 3 folds),0.889 +/- 0.029 (in 3 folds),0.959,0.888,172,0,172,0.0,False
ridge_cv,0.983 +/- 0.008 (in 3 folds),0.983 +/- 0.008 (in 3 folds),0.959 +/- 0.012 (in 3 folds),0.959 +/- 0.012 (in 3 folds),0.872 +/- 0.103 (in 3 folds),0.537 +/- 0.468 (in 3 folds),0.872,0.633,172,0,172,0.0,False
ridge_cv.decision_thresholds_tuned,0.983 +/- 0.008 (in 3 folds),0.983 +/- 0.008 (in 3 folds),0.959 +/- 0.012 (in 3 folds),0.959 +/- 0.012 (in 3 folds),0.889 +/- 0.117 (in 3 folds),0.588 +/- 0.509 (in 3 folds),0.89,0.687,172,0,172,0.0,False
lasso_multiclass,0.979 +/- 0.009 (in 3 folds),0.979 +/- 0.009 (in 3 folds),0.944 +/- 0.026 (in 3 folds),0.944 +/- 0.026 (in 3 folds),0.924 +/- 0.009 (in 3 folds),0.796 +/- 0.021 (in 3 folds),0.924,0.794,172,0,172,0.0,False
lasso_multiclass.decision_thresholds_tuned,0.979 +/- 0.009 (in 3 folds),0.979 +/- 0.009 (in 3 folds),0.944 +/- 0.026 (in 3 folds),0.944 +/- 0.026 (in 3 folds),0.959 +/- 0.010 (in 3 folds),0.889 +/- 0.029 (in 3 folds),0.959,0.888,172,0,172,0.0,False


GeneLocus.TCR TargetObsColumnEnum.ethnicity_condensed_healthy_only


Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
lasso_cv,0.726 +/- 0.021 (in 3 folds),0.745 +/- 0.033 (in 3 folds),0.761 +/- 0.004 (in 3 folds),0.776 +/- 0.010 (in 3 folds),0.618 +/- 0.169 (in 3 folds),0.375 +/- 0.326 (in 3 folds),0.617,0.415,115,0,115,0.0,True
lasso_cv.decision_thresholds_tuned,0.726 +/- 0.021 (in 3 folds),0.745 +/- 0.033 (in 3 folds),0.761 +/- 0.004 (in 3 folds),0.776 +/- 0.010 (in 3 folds),0.686 +/- 0.072 (in 3 folds),0.551 +/- 0.036 (in 3 folds),0.687,0.549,115,0,115,0.0,True
ridge_cv,0.723 +/- 0.009 (in 3 folds),0.750 +/- 0.018 (in 3 folds),0.746 +/- 0.021 (in 3 folds),0.762 +/- 0.032 (in 3 folds),0.504 +/- 0.098 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.504,0.0,115,0,115,0.0,True
ridge_cv.decision_thresholds_tuned,0.723 +/- 0.009 (in 3 folds),0.750 +/- 0.018 (in 3 folds),0.746 +/- 0.021 (in 3 folds),0.762 +/- 0.032 (in 3 folds),0.482 +/- 0.254 (in 3 folds),0.176 +/- 0.304 (in 3 folds),0.487,0.19,115,0,115,0.0,True
elasticnet_cv,0.721 +/- 0.017 (in 3 folds),0.738 +/- 0.018 (in 3 folds),0.759 +/- 0.007 (in 3 folds),0.775 +/- 0.006 (in 3 folds),0.567 +/- 0.114 (in 3 folds),0.178 +/- 0.308 (in 3 folds),0.565,0.296,115,0,115,0.0,True
elasticnet_cv.decision_thresholds_tuned,0.721 +/- 0.017 (in 3 folds),0.738 +/- 0.018 (in 3 folds),0.759 +/- 0.007 (in 3 folds),0.775 +/- 0.006 (in 3 folds),0.686 +/- 0.072 (in 3 folds),0.551 +/- 0.036 (in 3 folds),0.687,0.549,115,0,115,0.0,True
lasso_multiclass,0.689 +/- 0.033 (in 3 folds),0.713 +/- 0.045 (in 3 folds),0.731 +/- 0.022 (in 3 folds),0.750 +/- 0.039 (in 3 folds),0.592 +/- 0.114 (in 3 folds),0.370 +/- 0.119 (in 3 folds),0.591,0.362,115,0,115,0.0,False
lasso_multiclass.decision_thresholds_tuned,0.689 +/- 0.033 (in 3 folds),0.713 +/- 0.045 (in 3 folds),0.731 +/- 0.022 (in 3 folds),0.750 +/- 0.039 (in 3 folds),0.695 +/- 0.066 (in 3 folds),0.561 +/- 0.032 (in 3 folds),0.696,0.561,115,0,115,0.0,True
linearsvm_ovr,0.683 +/- 0.019 (in 3 folds),0.704 +/- 0.028 (in 3 folds),0.726 +/- 0.019 (in 3 folds),0.744 +/- 0.041 (in 3 folds),0.584 +/- 0.110 (in 3 folds),0.326 +/- 0.170 (in 3 folds),0.583,0.32,115,0,115,0.0,False
linearsvm_ovr.decision_thresholds_tuned,0.683 +/- 0.019 (in 3 folds),0.704 +/- 0.028 (in 3 folds),0.726 +/- 0.019 (in 3 folds),0.744 +/- 0.041 (in 3 folds),0.713 +/- 0.066 (in 3 folds),0.578 +/- 0.046 (in 3 folds),0.713,0.578,115,0,115,0.0,True














GeneLocus.TCR TargetObsColumnEnum.age_group_healthy_only






















































































































































































































Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
lasso_multiclass,0.699 +/- 0.066 (in 3 folds),0.677 +/- 0.089 (in 3 folds),0.731 +/- 0.069 (in 3 folds),0.715 +/- 0.086 (in 3 folds),0.427 +/- 0.038 (in 3 folds),0.316 +/- 0.048 (in 3 folds),0.426,0.315,115,0,115,0.0,True
lasso_multiclass.decision_thresholds_tuned,0.699 +/- 0.066 (in 3 folds),0.677 +/- 0.089 (in 3 folds),0.731 +/- 0.069 (in 3 folds),0.715 +/- 0.086 (in 3 folds),0.557 +/- 0.061 (in 3 folds),0.486 +/- 0.079 (in 3 folds),0.557,0.468,115,0,115,0.0,False
linearsvm_ovr,0.692 +/- 0.066 (in 3 folds),0.668 +/- 0.093 (in 3 folds),0.730 +/- 0.064 (in 3 folds),0.713 +/- 0.084 (in 3 folds),0.427 +/- 0.053 (in 3 folds),0.313 +/- 0.058 (in 3 folds),0.426,0.309,115,0,115,0.0,True
linearsvm_ovr.decision_thresholds_tuned,0.692 +/- 0.066 (in 3 folds),0.668 +/- 0.093 (in 3 folds),0.730 +/- 0.064 (in 3 folds),0.713 +/- 0.084 (in 3 folds),0.557 +/- 0.041 (in 3 folds),0.495 +/- 0.032 (in 3 folds),0.557,0.473,115,0,115,0.0,True
xgboost,0.689 +/- 0.053 (in 3 folds),0.675 +/- 0.057 (in 3 folds),0.722 +/- 0.057 (in 3 folds),0.709 +/- 0.063 (in 3 folds),0.384 +/- 0.067 (in 3 folds),0.272 +/- 0.075 (in 3 folds),0.383,0.258,115,0,115,0.0,True
xgboost.decision_thresholds_tuned,0.689 +/- 0.053 (in 3 folds),0.675 +/- 0.057 (in 3 folds),0.722 +/- 0.057 (in 3 folds),0.709 +/- 0.063 (in 3 folds),0.497 +/- 0.080 (in 3 folds),0.463 +/- 0.047 (in 3 folds),0.496,0.427,115,0,115,0.0,True
rf_multiclass,0.687 +/- 0.118 (in 3 folds),0.668 +/- 0.141 (in 3 folds),0.731 +/- 0.097 (in 3 folds),0.717 +/- 0.112 (in 3 folds),0.453 +/- 0.065 (in 3 folds),0.362 +/- 0.076 (in 3 folds),0.452,0.34,115,0,115,0.0,True
rf_multiclass.decision_thresholds_tuned,0.687 +/- 0.118 (in 3 folds),0.668 +/- 0.141 (in 3 folds),0.731 +/- 0.097 (in 3 folds),0.717 +/- 0.112 (in 3 folds),0.584 +/- 0.094 (in 3 folds),0.535 +/- 0.083 (in 3 folds),0.583,0.512,115,0,115,0.0,True
ridge_cv,0.672 +/- 0.151 (in 3 folds),0.669 +/- 0.149 (in 3 folds),0.698 +/- 0.172 (in 3 folds),0.696 +/- 0.170 (in 3 folds),0.225 +/- 0.034 (in 3 folds),0.046 +/- 0.080 (in 3 folds),0.226,0.047,115,0,115,0.0,True
ridge_cv.decision_thresholds_tuned,0.672 +/- 0.151 (in 3 folds),0.669 +/- 0.149 (in 3 folds),0.698 +/- 0.172 (in 3 folds),0.696 +/- 0.170 (in 3 folds),0.256 +/- 0.203 (in 3 folds),0.141 +/- 0.244 (in 3 folds),0.252,0.097,115,0,115,0.0,True


GeneLocus.TCR TargetObsColumnEnum.age_group_binary_healthy_only


Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
rf_multiclass,0.804 +/- 0.085 (in 3 folds),0.804 +/- 0.085 (in 3 folds),0.896 +/- 0.053 (in 3 folds),0.896 +/- 0.053 (in 3 folds),0.706 +/- 0.092 (in 3 folds),0.353 +/- 0.252 (in 3 folds),0.704,0.315,115,0,115,0.0,False
rf_multiclass.decision_thresholds_tuned,0.804 +/- 0.085 (in 3 folds),0.804 +/- 0.085 (in 3 folds),0.896 +/- 0.053 (in 3 folds),0.896 +/- 0.053 (in 3 folds),0.784 +/- 0.061 (in 3 folds),0.567 +/- 0.113 (in 3 folds),0.783,0.57,115,0,115,0.0,False
lasso_multiclass,0.786 +/- 0.136 (in 3 folds),0.786 +/- 0.136 (in 3 folds),0.893 +/- 0.067 (in 3 folds),0.893 +/- 0.067 (in 3 folds),0.705 +/- 0.059 (in 3 folds),0.393 +/- 0.164 (in 3 folds),0.704,0.373,115,0,115,0.0,False
lasso_multiclass.decision_thresholds_tuned,0.786 +/- 0.136 (in 3 folds),0.786 +/- 0.136 (in 3 folds),0.893 +/- 0.067 (in 3 folds),0.893 +/- 0.067 (in 3 folds),0.715 +/- 0.153 (in 3 folds),0.530 +/- 0.148 (in 3 folds),0.713,0.507,115,0,115,0.0,False
linearsvm_ovr,0.776 +/- 0.159 (in 3 folds),0.776 +/- 0.159 (in 3 folds),0.884 +/- 0.084 (in 3 folds),0.884 +/- 0.084 (in 3 folds),0.723 +/- 0.059 (in 3 folds),0.419 +/- 0.162 (in 3 folds),0.722,0.402,115,0,115,0.0,False
linearsvm_ovr.decision_thresholds_tuned,0.776 +/- 0.159 (in 3 folds),0.776 +/- 0.159 (in 3 folds),0.884 +/- 0.084 (in 3 folds),0.884 +/- 0.084 (in 3 folds),0.740 +/- 0.072 (in 3 folds),0.495 +/- 0.208 (in 3 folds),0.739,0.494,115,0,115,0.0,False
xgboost,0.734 +/- 0.117 (in 3 folds),0.734 +/- 0.117 (in 3 folds),0.850 +/- 0.069 (in 3 folds),0.850 +/- 0.069 (in 3 folds),0.671 +/- 0.051 (in 3 folds),0.270 +/- 0.139 (in 3 folds),0.67,0.239,115,0,115,0.0,False
xgboost.decision_thresholds_tuned,0.734 +/- 0.117 (in 3 folds),0.734 +/- 0.117 (in 3 folds),0.850 +/- 0.069 (in 3 folds),0.850 +/- 0.069 (in 3 folds),0.687 +/- 0.116 (in 3 folds),0.425 +/- 0.152 (in 3 folds),0.687,0.384,115,0,115,0.0,False
elasticnet_cv,0.721 +/- 0.123 (in 3 folds),0.721 +/- 0.123 (in 3 folds),0.869 +/- 0.046 (in 3 folds),0.869 +/- 0.046 (in 3 folds),0.670 +/- 0.031 (in 3 folds),0.093 +/- 0.161 (in 3 folds),0.67,0.182,115,0,115,0.0,False
elasticnet_cv.decision_thresholds_tuned,0.721 +/- 0.123 (in 3 folds),0.721 +/- 0.123 (in 3 folds),0.869 +/- 0.046 (in 3 folds),0.869 +/- 0.046 (in 3 folds),0.633 +/- 0.141 (in 3 folds),0.472 +/- 0.163 (in 3 folds),0.635,0.463,115,0,115,0.0,False


GeneLocus.TCR TargetObsColumnEnum.sex_healthy_only


Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
lasso_multiclass,0.569 +/- 0.023 (in 3 folds),0.569 +/- 0.023 (in 3 folds),0.613 +/- 0.148 (in 3 folds),0.613 +/- 0.148 (in 3 folds),0.496 +/- 0.053 (in 3 folds),0.003 +/- 0.063 (in 3 folds),0.496,-0.011,115,0,115,0.0,False
lasso_multiclass.decision_thresholds_tuned,0.569 +/- 0.023 (in 3 folds),0.569 +/- 0.023 (in 3 folds),0.613 +/- 0.148 (in 3 folds),0.613 +/- 0.148 (in 3 folds),0.566 +/- 0.143 (in 3 folds),0.292 +/- 0.059 (in 3 folds),0.565,0.147,115,0,115,0.0,False
rf_multiclass,0.558 +/- 0.046 (in 3 folds),0.558 +/- 0.046 (in 3 folds),0.590 +/- 0.197 (in 3 folds),0.590 +/- 0.197 (in 3 folds),0.539 +/- 0.001 (in 3 folds),0.153 +/- 0.072 (in 3 folds),0.539,0.075,115,0,115,0.0,False
rf_multiclass.decision_thresholds_tuned,0.558 +/- 0.046 (in 3 folds),0.558 +/- 0.046 (in 3 folds),0.590 +/- 0.197 (in 3 folds),0.590 +/- 0.197 (in 3 folds),0.558 +/- 0.067 (in 3 folds),0.250 +/- 0.017 (in 3 folds),0.557,0.119,115,0,115,0.0,False
linearsvm_ovr,0.552 +/- 0.023 (in 3 folds),0.552 +/- 0.023 (in 3 folds),0.607 +/- 0.158 (in 3 folds),0.607 +/- 0.158 (in 3 folds),0.496 +/- 0.054 (in 3 folds),-0.004 +/- 0.077 (in 3 folds),0.496,-0.012,115,0,115,0.0,False
linearsvm_ovr.decision_thresholds_tuned,0.552 +/- 0.023 (in 3 folds),0.552 +/- 0.023 (in 3 folds),0.607 +/- 0.158 (in 3 folds),0.607 +/- 0.158 (in 3 folds),0.565 +/- 0.128 (in 3 folds),0.285 +/- 0.028 (in 3 folds),0.565,0.144,115,0,115,0.0,False
lasso_cv,0.521 +/- 0.036 (in 3 folds),0.521 +/- 0.036 (in 3 folds),0.542 +/- 0.216 (in 3 folds),0.542 +/- 0.216 (in 3 folds),0.461 +/- 0.092 (in 3 folds),0.017 +/- 0.030 (in 3 folds),0.461,-0.132,115,0,115,0.0,False
lasso_cv.decision_thresholds_tuned,0.521 +/- 0.036 (in 3 folds),0.521 +/- 0.036 (in 3 folds),0.542 +/- 0.216 (in 3 folds),0.542 +/- 0.216 (in 3 folds),0.555 +/- 0.079 (in 3 folds),0.079 +/- 0.136 (in 3 folds),0.557,0.117,115,0,115,0.0,False
ridge_cv,0.519 +/- 0.032 (in 3 folds),0.519 +/- 0.032 (in 3 folds),0.536 +/- 0.207 (in 3 folds),0.536 +/- 0.207 (in 3 folds),0.384 +/- 0.092 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.383,-0.257,115,0,115,0.0,False
ridge_cv.decision_thresholds_tuned,0.519 +/- 0.032 (in 3 folds),0.519 +/- 0.032 (in 3 folds),0.536 +/- 0.207 (in 3 folds),0.536 +/- 0.207 (in 3 folds),0.513 +/- 0.168 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.513,0.0,115,0,115,0.0,True


2022-12-31 08:14:26,938 - malid.external.scratch_cache - INFO - Reading network file from local machine cache: /users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/embedded/unirep_fine_tuned/anndatas_scaled/TCR/fold.0.test.h5ad -> /srv/scratch/maximz/cache/a6c3ab8bb9960154ff8dbb5d04eaf7a1c395f034f82f9649aefc9d35.0.test.h5ad


Only considering the two last: ['.test', '.h5ad'].


Only considering the two last: ['.test', '.h5ad'].








2022-12-31 08:32:59,421 - malid.helpers - INFO - Target TargetObsColumnEnum.covid_vs_healthy: filtering to specimens from diseases ['Covid19', 'Healthy/Background'] only; removed 55 specimens




2022-12-31 08:40:40,994 - malid.helpers - INFO - Target TargetObsColumnEnum.hiv_vs_healthy: filtering to specimens from diseases ['HIV', 'Healthy/Background'] only; removed 41 specimens




2022-12-31 08:47:46,581 - malid.helpers - INFO - Target TargetObsColumnEnum.lupus_vs_healthy: filtering to specimens from diseases ['Lupus', 'Healthy/Background'] only; removed 52 specimens




2022-12-31 08:59:29,435 - malid.helpers - INFO - Target TargetObsColumnEnum.ethnicity_condensed_healthy_only: filtered to specimens with defined ethnicity_condensed column - removed 19 specimens (862171 rows)


2022-12-31 09:05:35,360 - malid.helpers - INFO - Target TargetObsColumnEnum.ethnicity_condensed_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 64 specimens




2022-12-31 09:17:08,470 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_healthy_only: filtered to specimens with defined age_group column - removed 1 specimens (6847 rows)


2022-12-31 09:23:31,699 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 73 specimens




2022-12-31 09:36:51,476 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_binary_healthy_only: filtered to specimens with defined age_group_binary column - removed 1 specimens (6847 rows)


2022-12-31 09:42:59,123 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_binary_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 73 specimens




2022-12-31 09:48:01,762 - malid.helpers - INFO - Target TargetObsColumnEnum.sex_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 74 specimens


2022-12-31 09:50:07,862 - malid.external.scratch_cache - INFO - Reading network file from local machine cache: /users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/embedded/unirep_fine_tuned/anndatas_scaled/TCR/fold.1.test.h5ad -> /srv/scratch/maximz/cache/d3eb18b805f6482478ad1ee75a5249a449864d796469d3e144db1326.1.test.h5ad


Only considering the two last: ['.test', '.h5ad'].


Only considering the two last: ['.test', '.h5ad'].








2022-12-31 10:11:33,702 - malid.helpers - INFO - Target TargetObsColumnEnum.covid_vs_healthy: filtering to specimens from diseases ['Covid19', 'Healthy/Background'] only; removed 54 specimens
IOStream.flush timed out




2022-12-31 10:16:29,900 - malid.helpers - INFO - Target TargetObsColumnEnum.hiv_vs_healthy: filtering to specimens from diseases ['HIV', 'Healthy/Background'] only; removed 41 specimens




2022-12-31 10:21:30,482 - malid.helpers - INFO - Target TargetObsColumnEnum.lupus_vs_healthy: filtering to specimens from diseases ['Lupus', 'Healthy/Background'] only; removed 53 specimens




2022-12-31 10:26:56,879 - malid.helpers - INFO - Target TargetObsColumnEnum.ethnicity_condensed_healthy_only: filtered to specimens with defined ethnicity_condensed column - removed 20 specimens (891618 rows)


2022-12-31 10:27:39,518 - malid.helpers - INFO - Target TargetObsColumnEnum.ethnicity_condensed_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 69 specimens




2022-12-31 10:31:15,565 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_healthy_only: filtered to specimens with defined age_group column - removed 1 specimens (11386 rows)


2022-12-31 10:35:31,199 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 73 specimens




2022-12-31 10:40:02,072 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_binary_healthy_only: filtered to specimens with defined age_group_binary column - removed 1 specimens (11386 rows)


2022-12-31 10:41:25,170 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_binary_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 73 specimens




2022-12-31 10:45:13,445 - malid.helpers - INFO - Target TargetObsColumnEnum.sex_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 74 specimens


2022-12-31 10:47:01,619 - malid.external.scratch_cache - INFO - Reading network file from local machine cache: /users/maximz/code/boyd-immune-repertoire-classification/data/data_v_20221224/embedded/unirep_fine_tuned/anndatas_scaled/TCR/fold.2.test.h5ad -> /srv/scratch/maximz/cache/d74a0f1a51ad1e35ec4654f627621ecdc4abf48e3481e399db8af384.2.test.h5ad


Only considering the two last: ['.test', '.h5ad'].


Only considering the two last: ['.test', '.h5ad'].








2022-12-31 11:12:25,195 - malid.helpers - INFO - Target TargetObsColumnEnum.covid_vs_healthy: filtering to specimens from diseases ['Covid19', 'Healthy/Background'] only; removed 53 specimens




2022-12-31 11:26:03,928 - malid.helpers - INFO - Target TargetObsColumnEnum.hiv_vs_healthy: filtering to specimens from diseases ['HIV', 'Healthy/Background'] only; removed 40 specimens




2022-12-31 11:35:03,860 - malid.helpers - INFO - Target TargetObsColumnEnum.lupus_vs_healthy: filtering to specimens from diseases ['Lupus', 'Healthy/Background'] only; removed 51 specimens




2022-12-31 11:48:44,467 - malid.helpers - INFO - Target TargetObsColumnEnum.ethnicity_condensed_healthy_only: filtered to specimens with defined ethnicity_condensed column - removed 14 specimens (388281 rows)


2022-12-31 11:53:29,580 - malid.helpers - INFO - Target TargetObsColumnEnum.ethnicity_condensed_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 62 specimens




2022-12-31 12:03:41,288 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_healthy_only: filtered to specimens with defined age_group column - removed 2 specimens (96214 rows)


2022-12-31 12:07:59,268 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 71 specimens




2022-12-31 12:14:41,081 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_binary_healthy_only: filtered to specimens with defined age_group_binary column - removed 2 specimens (96214 rows)


2022-12-31 12:17:51,979 - malid.helpers - INFO - Target TargetObsColumnEnum.age_group_binary_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 71 specimens




2022-12-31 12:22:05,212 - malid.helpers - INFO - Target TargetObsColumnEnum.sex_healthy_only: filtering to specimens from diseases ['Healthy/Background'] only; removed 72 specimens


GeneLocus.TCR TargetObsColumnEnum.disease --> /users/maximz/code/boyd-immune-repertoire-classification/out/repertoire_stats/TCR/disease


Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,Global evaluation column name global,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
lasso_multiclass,0.940 +/- 0.009 (in 3 folds),0.940 +/- 0.010 (in 3 folds),0.927 +/- 0.013 (in 3 folds),0.930 +/- 0.013 (in 3 folds),0.761 +/- 0.023 (in 3 folds),0.666 +/- 0.024 (in 3 folds),0.761,0.665,disease.separate_past_exposures,414,0,414,0.0,False
lasso_multiclass.decision_thresholds_tuned,0.940 +/- 0.009 (in 3 folds),0.940 +/- 0.010 (in 3 folds),0.927 +/- 0.013 (in 3 folds),0.930 +/- 0.013 (in 3 folds),0.771 +/- 0.028 (in 3 folds),0.672 +/- 0.034 (in 3 folds),0.771,0.669,disease.separate_past_exposures,414,0,414,0.0,False
rf_multiclass,0.940 +/- 0.008 (in 3 folds),0.941 +/- 0.005 (in 3 folds),0.931 +/- 0.006 (in 3 folds),0.934 +/- 0.003 (in 3 folds),0.761 +/- 0.010 (in 3 folds),0.642 +/- 0.014 (in 3 folds),0.761,0.641,disease.separate_past_exposures,414,0,414,0.0,False
rf_multiclass.decision_thresholds_tuned,0.940 +/- 0.008 (in 3 folds),0.941 +/- 0.005 (in 3 folds),0.931 +/- 0.006 (in 3 folds),0.934 +/- 0.003 (in 3 folds),0.756 +/- 0.045 (in 3 folds),0.660 +/- 0.061 (in 3 folds),0.756,0.656,disease.separate_past_exposures,414,0,414,0.0,False
linearsvm_ovr,0.937 +/- 0.014 (in 3 folds),0.934 +/- 0.016 (in 3 folds),0.921 +/- 0.017 (in 3 folds),0.923 +/- 0.019 (in 3 folds),0.766 +/- 0.043 (in 3 folds),0.666 +/- 0.053 (in 3 folds),0.766,0.664,disease.separate_past_exposures,414,0,414,0.0,False
linearsvm_ovr.decision_thresholds_tuned,0.937 +/- 0.014 (in 3 folds),0.934 +/- 0.016 (in 3 folds),0.921 +/- 0.017 (in 3 folds),0.923 +/- 0.019 (in 3 folds),0.723 +/- 0.050 (in 3 folds),0.618 +/- 0.046 (in 3 folds),0.722,0.6,disease.separate_past_exposures,414,0,414,0.0,False
xgboost,0.933 +/- 0.015 (in 3 folds),0.931 +/- 0.011 (in 3 folds),0.931 +/- 0.012 (in 3 folds),0.930 +/- 0.008 (in 3 folds),0.778 +/- 0.013 (in 3 folds),0.674 +/- 0.017 (in 3 folds),0.778,0.673,disease.separate_past_exposures,414,0,414,0.0,False
xgboost.decision_thresholds_tuned,0.933 +/- 0.015 (in 3 folds),0.931 +/- 0.011 (in 3 folds),0.931 +/- 0.012 (in 3 folds),0.930 +/- 0.008 (in 3 folds),0.773 +/- 0.037 (in 3 folds),0.680 +/- 0.050 (in 3 folds),0.773,0.678,disease.separate_past_exposures,414,0,414,0.0,False
ridge_cv,0.933 +/- 0.014 (in 3 folds),0.932 +/- 0.013 (in 3 folds),0.914 +/- 0.017 (in 3 folds),0.917 +/- 0.016 (in 3 folds),0.469 +/- 0.002 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.469,0.0,disease.separate_past_exposures,414,0,414,0.0,True
ridge_cv.decision_thresholds_tuned,0.933 +/- 0.014 (in 3 folds),0.932 +/- 0.013 (in 3 folds),0.914 +/- 0.017 (in 3 folds),0.917 +/- 0.016 (in 3 folds),0.478 +/- 0.284 (in 3 folds),0.352 +/- 0.313 (in 3 folds),0.481,0.357,disease.separate_past_exposures,414,0,414,0.0,False


/users/maximz/code/boyd-immune-repertoire-classification/out/repertoire_stats/TCR/disease/train_smaller_model.compare_model_scores.test_set_performance.tsv


2022-12-31 12:26:03,051 - malid.external.model_evaluation - INFO - Removing ('lasso_cv', 0) because lasso_cv is incomplete.


2022-12-31 12:26:03,054 - malid.external.model_evaluation - INFO - Removing ('lasso_cv', 1) because lasso_cv is incomplete.


2022-12-31 12:26:03,055 - malid.external.model_evaluation - INFO - Removing ('lasso_cv.decision_thresholds_tuned', 0) because lasso_cv.decision_thresholds_tuned is incomplete.


2022-12-31 12:26:03,056 - malid.external.model_evaluation - INFO - Removing ('lasso_cv.decision_thresholds_tuned', 1) because lasso_cv.decision_thresholds_tuned is incomplete.


GeneLocus.TCR TargetObsColumnEnum.disease_all_demographics_present --> /users/maximz/code/boyd-immune-repertoire-classification/out/repertoire_stats/TCR/disease_all_demographics_present


Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,Global evaluation column name global,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
linearsvm_ovr,0.947 +/- 0.013 (in 3 folds),0.947 +/- 0.017 (in 3 folds),0.939 +/- 0.021 (in 3 folds),0.942 +/- 0.023 (in 3 folds),0.796 +/- 0.038 (in 3 folds),0.707 +/- 0.051 (in 3 folds),0.796,0.706,disease.separate_past_exposures,358,0,358,0.0,False
linearsvm_ovr.decision_thresholds_tuned,0.947 +/- 0.013 (in 3 folds),0.947 +/- 0.017 (in 3 folds),0.939 +/- 0.021 (in 3 folds),0.942 +/- 0.023 (in 3 folds),0.774 +/- 0.046 (in 3 folds),0.687 +/- 0.070 (in 3 folds),0.774,0.683,disease.separate_past_exposures,358,0,358,0.0,False
lasso_multiclass,0.947 +/- 0.012 (in 3 folds),0.949 +/- 0.015 (in 3 folds),0.938 +/- 0.021 (in 3 folds),0.942 +/- 0.022 (in 3 folds),0.796 +/- 0.034 (in 3 folds),0.714 +/- 0.050 (in 3 folds),0.796,0.713,disease.separate_past_exposures,358,0,358,0.0,False
lasso_multiclass.decision_thresholds_tuned,0.947 +/- 0.012 (in 3 folds),0.949 +/- 0.015 (in 3 folds),0.938 +/- 0.021 (in 3 folds),0.942 +/- 0.022 (in 3 folds),0.785 +/- 0.026 (in 3 folds),0.705 +/- 0.021 (in 3 folds),0.785,0.702,disease.separate_past_exposures,358,0,358,0.0,False
rf_multiclass,0.942 +/- 0.006 (in 3 folds),0.943 +/- 0.006 (in 3 folds),0.934 +/- 0.007 (in 3 folds),0.937 +/- 0.007 (in 3 folds),0.796 +/- 0.032 (in 3 folds),0.699 +/- 0.045 (in 3 folds),0.796,0.697,disease.separate_past_exposures,358,0,358,0.0,False
rf_multiclass.decision_thresholds_tuned,0.942 +/- 0.006 (in 3 folds),0.943 +/- 0.006 (in 3 folds),0.934 +/- 0.007 (in 3 folds),0.937 +/- 0.007 (in 3 folds),0.754 +/- 0.021 (in 3 folds),0.662 +/- 0.029 (in 3 folds),0.754,0.659,disease.separate_past_exposures,358,0,358,0.0,False
ridge_cv,0.939 +/- 0.009 (in 3 folds),0.939 +/- 0.010 (in 3 folds),0.928 +/- 0.017 (in 3 folds),0.932 +/- 0.018 (in 3 folds),0.461 +/- 0.034 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.461,0.0,disease.separate_past_exposures,358,0,358,0.0,True
ridge_cv.decision_thresholds_tuned,0.939 +/- 0.009 (in 3 folds),0.939 +/- 0.010 (in 3 folds),0.928 +/- 0.017 (in 3 folds),0.932 +/- 0.018 (in 3 folds),0.710 +/- 0.052 (in 3 folds),0.592 +/- 0.096 (in 3 folds),0.709,0.584,disease.separate_past_exposures,358,0,358,0.0,False
xgboost,0.927 +/- 0.010 (in 3 folds),0.925 +/- 0.011 (in 3 folds),0.923 +/- 0.018 (in 3 folds),0.923 +/- 0.018 (in 3 folds),0.765 +/- 0.025 (in 3 folds),0.654 +/- 0.042 (in 3 folds),0.765,0.654,disease.separate_past_exposures,358,0,358,0.0,False
xgboost.decision_thresholds_tuned,0.927 +/- 0.010 (in 3 folds),0.925 +/- 0.011 (in 3 folds),0.923 +/- 0.018 (in 3 folds),0.923 +/- 0.018 (in 3 folds),0.774 +/- 0.047 (in 3 folds),0.679 +/- 0.074 (in 3 folds),0.774,0.679,disease.separate_past_exposures,358,0,358,0.0,False


/users/maximz/code/boyd-immune-repertoire-classification/out/repertoire_stats/TCR/disease_all_demographics_present/train_smaller_model.compare_model_scores.test_set_performance.tsv


GeneLocus.TCR TargetObsColumnEnum.covid_vs_healthy --> /users/maximz/code/boyd-immune-repertoire-classification/out/repertoire_stats/TCR/covid_vs_healthy


Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,Global evaluation column name global,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
elasticnet_cv,0.983 +/- 0.006 (in 3 folds),0.983 +/- 0.006 (in 3 folds),0.995 +/- 0.002 (in 3 folds),0.995 +/- 0.002 (in 3 folds),0.897 +/- 0.035 (in 3 folds),0.696 +/- 0.105 (in 3 folds),0.897,0.695,disease.separate_past_exposures,252,0,252,0.0,False
elasticnet_cv.decision_thresholds_tuned,0.983 +/- 0.006 (in 3 folds),0.983 +/- 0.006 (in 3 folds),0.995 +/- 0.002 (in 3 folds),0.995 +/- 0.002 (in 3 folds),0.933 +/- 0.014 (in 3 folds),0.820 +/- 0.037 (in 3 folds),0.933,0.82,disease.separate_past_exposures,252,0,252,0.0,False
ridge_cv,0.983 +/- 0.003 (in 3 folds),0.983 +/- 0.003 (in 3 folds),0.995 +/- 0.000 (in 3 folds),0.995 +/- 0.000 (in 3 folds),0.798 +/- 0.039 (in 3 folds),0.236 +/- 0.258 (in 3 folds),0.798,0.309,disease.separate_past_exposures,252,0,252,0.0,False
ridge_cv.decision_thresholds_tuned,0.983 +/- 0.003 (in 3 folds),0.983 +/- 0.003 (in 3 folds),0.995 +/- 0.000 (in 3 folds),0.995 +/- 0.000 (in 3 folds),0.940 +/- 0.024 (in 3 folds),0.835 +/- 0.069 (in 3 folds),0.94,0.835,disease.separate_past_exposures,252,0,252,0.0,False
lasso_multiclass,0.982 +/- 0.006 (in 3 folds),0.982 +/- 0.006 (in 3 folds),0.995 +/- 0.002 (in 3 folds),0.995 +/- 0.002 (in 3 folds),0.940 +/- 0.013 (in 3 folds),0.836 +/- 0.033 (in 3 folds),0.94,0.835,disease.separate_past_exposures,252,0,252,0.0,False
lasso_multiclass.decision_thresholds_tuned,0.982 +/- 0.006 (in 3 folds),0.982 +/- 0.006 (in 3 folds),0.995 +/- 0.002 (in 3 folds),0.995 +/- 0.002 (in 3 folds),0.913 +/- 0.026 (in 3 folds),0.778 +/- 0.039 (in 3 folds),0.913,0.772,disease.separate_past_exposures,252,0,252,0.0,False
rf_multiclass,0.980 +/- 0.012 (in 3 folds),0.980 +/- 0.012 (in 3 folds),0.994 +/- 0.004 (in 3 folds),0.994 +/- 0.004 (in 3 folds),0.897 +/- 0.018 (in 3 folds),0.697 +/- 0.057 (in 3 folds),0.897,0.698,disease.separate_past_exposures,252,0,252,0.0,False
rf_multiclass.decision_thresholds_tuned,0.980 +/- 0.012 (in 3 folds),0.980 +/- 0.012 (in 3 folds),0.994 +/- 0.004 (in 3 folds),0.994 +/- 0.004 (in 3 folds),0.928 +/- 0.021 (in 3 folds),0.801 +/- 0.064 (in 3 folds),0.929,0.798,disease.separate_past_exposures,252,0,252,0.0,False
lasso_cv,0.979 +/- 0.001 (in 3 folds),0.979 +/- 0.001 (in 3 folds),0.994 +/- 0.000 (in 3 folds),0.994 +/- 0.000 (in 3 folds),0.901 +/- 0.048 (in 3 folds),0.706 +/- 0.148 (in 3 folds),0.901,0.704,disease.separate_past_exposures,252,0,252,0.0,False
lasso_cv.decision_thresholds_tuned,0.979 +/- 0.001 (in 3 folds),0.979 +/- 0.001 (in 3 folds),0.994 +/- 0.000 (in 3 folds),0.994 +/- 0.000 (in 3 folds),0.917 +/- 0.020 (in 3 folds),0.762 +/- 0.056 (in 3 folds),0.917,0.761,disease.separate_past_exposures,252,0,252,0.0,False


/users/maximz/code/boyd-immune-repertoire-classification/out/repertoire_stats/TCR/covid_vs_healthy/train_smaller_model.compare_model_scores.test_set_performance.tsv


GeneLocus.TCR TargetObsColumnEnum.hiv_vs_healthy --> /users/maximz/code/boyd-immune-repertoire-classification/out/repertoire_stats/TCR/hiv_vs_healthy


Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,Global evaluation column name global,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
ridge_cv,0.934 +/- 0.016 (in 3 folds),0.934 +/- 0.016 (in 3 folds),0.972 +/- 0.007 (in 3 folds),0.972 +/- 0.007 (in 3 folds),0.747 +/- 0.073 (in 3 folds),0.335 +/- 0.291 (in 3 folds),0.747,0.392,disease.separate_past_exposures,292,0,292,0.0,False
ridge_cv.decision_thresholds_tuned,0.934 +/- 0.016 (in 3 folds),0.934 +/- 0.016 (in 3 folds),0.972 +/- 0.007 (in 3 folds),0.972 +/- 0.007 (in 3 folds),0.774 +/- 0.097 (in 3 folds),0.410 +/- 0.356 (in 3 folds),0.774,0.464,disease.separate_past_exposures,292,0,292,0.0,False
lasso_multiclass,0.930 +/- 0.014 (in 3 folds),0.930 +/- 0.014 (in 3 folds),0.970 +/- 0.007 (in 3 folds),0.970 +/- 0.007 (in 3 folds),0.857 +/- 0.056 (in 3 folds),0.714 +/- 0.099 (in 3 folds),0.856,0.71,disease.separate_past_exposures,292,0,292,0.0,False
lasso_multiclass.decision_thresholds_tuned,0.930 +/- 0.014 (in 3 folds),0.930 +/- 0.014 (in 3 folds),0.970 +/- 0.007 (in 3 folds),0.970 +/- 0.007 (in 3 folds),0.833 +/- 0.081 (in 3 folds),0.676 +/- 0.126 (in 3 folds),0.832,0.654,disease.separate_past_exposures,292,0,292,0.0,False
linearsvm_ovr,0.928 +/- 0.011 (in 3 folds),0.928 +/- 0.011 (in 3 folds),0.968 +/- 0.006 (in 3 folds),0.968 +/- 0.006 (in 3 folds),0.853 +/- 0.028 (in 3 folds),0.690 +/- 0.052 (in 3 folds),0.853,0.689,disease.separate_past_exposures,292,0,292,0.0,False
linearsvm_ovr.decision_thresholds_tuned,0.928 +/- 0.011 (in 3 folds),0.928 +/- 0.011 (in 3 folds),0.968 +/- 0.006 (in 3 folds),0.968 +/- 0.006 (in 3 folds),0.826 +/- 0.050 (in 3 folds),0.653 +/- 0.067 (in 3 folds),0.825,0.642,disease.separate_past_exposures,292,0,292,0.0,False
lasso_cv,0.927 +/- 0.026 (in 3 folds),0.927 +/- 0.026 (in 3 folds),0.969 +/- 0.011 (in 3 folds),0.969 +/- 0.011 (in 3 folds),0.863 +/- 0.035 (in 3 folds),0.706 +/- 0.071 (in 3 folds),0.863,0.705,disease.separate_past_exposures,292,0,292,0.0,False
lasso_cv.decision_thresholds_tuned,0.927 +/- 0.026 (in 3 folds),0.927 +/- 0.026 (in 3 folds),0.969 +/- 0.011 (in 3 folds),0.969 +/- 0.011 (in 3 folds),0.840 +/- 0.081 (in 3 folds),0.700 +/- 0.116 (in 3 folds),0.839,0.686,disease.separate_past_exposures,292,0,292,0.0,False
elasticnet_cv,0.927 +/- 0.023 (in 3 folds),0.927 +/- 0.023 (in 3 folds),0.968 +/- 0.010 (in 3 folds),0.968 +/- 0.010 (in 3 folds),0.832 +/- 0.005 (in 3 folds),0.628 +/- 0.017 (in 3 folds),0.832,0.627,disease.separate_past_exposures,292,0,292,0.0,False
elasticnet_cv.decision_thresholds_tuned,0.927 +/- 0.023 (in 3 folds),0.927 +/- 0.023 (in 3 folds),0.968 +/- 0.010 (in 3 folds),0.968 +/- 0.010 (in 3 folds),0.829 +/- 0.082 (in 3 folds),0.676 +/- 0.132 (in 3 folds),0.829,0.662,disease.separate_past_exposures,292,0,292,0.0,False


/users/maximz/code/boyd-immune-repertoire-classification/out/repertoire_stats/TCR/hiv_vs_healthy/train_smaller_model.compare_model_scores.test_set_performance.tsv


GeneLocus.TCR TargetObsColumnEnum.lupus_vs_healthy --> /users/maximz/code/boyd-immune-repertoire-classification/out/repertoire_stats/TCR/lupus_vs_healthy


Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,Global evaluation column name global,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
ridge_cv,0.976 +/- 0.010 (in 3 folds),0.976 +/- 0.010 (in 3 folds),0.930 +/- 0.017 (in 3 folds),0.930 +/- 0.017 (in 3 folds),0.857 +/- 0.097 (in 3 folds),0.504 +/- 0.439 (in 3 folds),0.857,0.591,disease.separate_past_exposures,258,0,258,0.0,False
ridge_cv.decision_thresholds_tuned,0.976 +/- 0.010 (in 3 folds),0.976 +/- 0.010 (in 3 folds),0.930 +/- 0.017 (in 3 folds),0.930 +/- 0.017 (in 3 folds),0.873 +/- 0.109 (in 3 folds),0.550 +/- 0.477 (in 3 folds),0.872,0.635,disease.separate_past_exposures,258,0,258,0.0,False
lasso_multiclass,0.976 +/- 0.002 (in 3 folds),0.976 +/- 0.002 (in 3 folds),0.927 +/- 0.008 (in 3 folds),0.927 +/- 0.008 (in 3 folds),0.919 +/- 0.011 (in 3 folds),0.791 +/- 0.015 (in 3 folds),0.919,0.788,disease.separate_past_exposures,258,0,258,0.0,False
lasso_multiclass.decision_thresholds_tuned,0.976 +/- 0.002 (in 3 folds),0.976 +/- 0.002 (in 3 folds),0.927 +/- 0.008 (in 3 folds),0.927 +/- 0.008 (in 3 folds),0.919 +/- 0.011 (in 3 folds),0.788 +/- 0.017 (in 3 folds),0.919,0.779,disease.separate_past_exposures,258,0,258,0.0,False
lasso_cv,0.975 +/- 0.004 (in 3 folds),0.975 +/- 0.004 (in 3 folds),0.924 +/- 0.026 (in 3 folds),0.924 +/- 0.026 (in 3 folds),0.919 +/- 0.011 (in 3 folds),0.774 +/- 0.035 (in 3 folds),0.919,0.774,disease.separate_past_exposures,258,0,258,0.0,False
lasso_cv.decision_thresholds_tuned,0.975 +/- 0.004 (in 3 folds),0.975 +/- 0.004 (in 3 folds),0.924 +/- 0.026 (in 3 folds),0.924 +/- 0.026 (in 3 folds),0.915 +/- 0.006 (in 3 folds),0.777 +/- 0.009 (in 3 folds),0.915,0.769,disease.separate_past_exposures,258,0,258,0.0,False
elasticnet_cv,0.975 +/- 0.003 (in 3 folds),0.975 +/- 0.003 (in 3 folds),0.923 +/- 0.024 (in 3 folds),0.923 +/- 0.024 (in 3 folds),0.888 +/- 0.023 (in 3 folds),0.683 +/- 0.065 (in 3 folds),0.888,0.682,disease.separate_past_exposures,258,0,258,0.0,False
elasticnet_cv.decision_thresholds_tuned,0.975 +/- 0.003 (in 3 folds),0.975 +/- 0.003 (in 3 folds),0.923 +/- 0.024 (in 3 folds),0.923 +/- 0.024 (in 3 folds),0.919 +/- 0.011 (in 3 folds),0.796 +/- 0.018 (in 3 folds),0.919,0.791,disease.separate_past_exposures,258,0,258,0.0,False
linearsvm_ovr,0.966 +/- 0.012 (in 3 folds),0.966 +/- 0.012 (in 3 folds),0.914 +/- 0.018 (in 3 folds),0.914 +/- 0.018 (in 3 folds),0.926 +/- 0.008 (in 3 folds),0.802 +/- 0.025 (in 3 folds),0.926,0.8,disease.separate_past_exposures,258,0,258,0.0,False
linearsvm_ovr.decision_thresholds_tuned,0.966 +/- 0.012 (in 3 folds),0.966 +/- 0.012 (in 3 folds),0.914 +/- 0.018 (in 3 folds),0.914 +/- 0.018 (in 3 folds),0.930 +/- 0.011 (in 3 folds),0.818 +/- 0.018 (in 3 folds),0.93,0.811,disease.separate_past_exposures,258,0,258,0.0,False


/users/maximz/code/boyd-immune-repertoire-classification/out/repertoire_stats/TCR/lupus_vs_healthy/train_smaller_model.compare_model_scores.test_set_performance.tsv


GeneLocus.TCR TargetObsColumnEnum.ethnicity_condensed_healthy_only --> /users/maximz/code/boyd-immune-repertoire-classification/out/repertoire_stats/TCR/ethnicity_condensed_healthy_only


Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
ridge_cv,0.751 +/- 0.030 (in 3 folds),0.766 +/- 0.021 (in 3 folds),0.747 +/- 0.028 (in 3 folds),0.764 +/- 0.028 (in 3 folds),0.584 +/- 0.083 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.588,0.0,165,0,165,0.0,True
ridge_cv.decision_thresholds_tuned,0.751 +/- 0.030 (in 3 folds),0.766 +/- 0.021 (in 3 folds),0.747 +/- 0.028 (in 3 folds),0.764 +/- 0.028 (in 3 folds),0.504 +/- 0.300 (in 3 folds),0.191 +/- 0.332 (in 3 folds),0.509,0.145,165,0,165,0.0,True
linearsvm_ovr,0.734 +/- 0.071 (in 3 folds),0.747 +/- 0.077 (in 3 folds),0.761 +/- 0.060 (in 3 folds),0.780 +/- 0.071 (in 3 folds),0.705 +/- 0.050 (in 3 folds),0.469 +/- 0.123 (in 3 folds),0.703,0.465,165,0,165,0.0,False
linearsvm_ovr.decision_thresholds_tuned,0.734 +/- 0.071 (in 3 folds),0.747 +/- 0.077 (in 3 folds),0.761 +/- 0.060 (in 3 folds),0.780 +/- 0.071 (in 3 folds),0.732 +/- 0.060 (in 3 folds),0.519 +/- 0.075 (in 3 folds),0.733,0.52,165,0,165,0.0,False
lasso_multiclass,0.733 +/- 0.058 (in 3 folds),0.762 +/- 0.065 (in 3 folds),0.753 +/- 0.046 (in 3 folds),0.786 +/- 0.052 (in 3 folds),0.592 +/- 0.067 (in 3 folds),0.341 +/- 0.131 (in 3 folds),0.588,0.33,165,0,165,0.0,False
lasso_multiclass.decision_thresholds_tuned,0.733 +/- 0.058 (in 3 folds),0.762 +/- 0.065 (in 3 folds),0.753 +/- 0.046 (in 3 folds),0.786 +/- 0.052 (in 3 folds),0.738 +/- 0.052 (in 3 folds),0.544 +/- 0.037 (in 3 folds),0.739,0.544,165,0,165,0.0,True
rf_multiclass,0.730 +/- 0.030 (in 3 folds),0.747 +/- 0.033 (in 3 folds),0.731 +/- 0.027 (in 3 folds),0.746 +/- 0.063 (in 3 folds),0.725 +/- 0.051 (in 3 folds),0.499 +/- 0.031 (in 3 folds),0.727,0.501,165,0,165,0.0,True
rf_multiclass.decision_thresholds_tuned,0.730 +/- 0.030 (in 3 folds),0.747 +/- 0.033 (in 3 folds),0.731 +/- 0.027 (in 3 folds),0.746 +/- 0.063 (in 3 folds),0.713 +/- 0.061 (in 3 folds),0.477 +/- 0.074 (in 3 folds),0.715,0.473,165,0,165,0.0,True
elasticnet_cv,0.695 +/- 0.011 (in 3 folds),0.714 +/- 0.030 (in 3 folds),0.721 +/- 0.027 (in 3 folds),0.736 +/- 0.045 (in 3 folds),0.631 +/- 0.097 (in 3 folds),0.168 +/- 0.290 (in 3 folds),0.636,0.294,165,0,165,0.0,True
elasticnet_cv.decision_thresholds_tuned,0.695 +/- 0.011 (in 3 folds),0.714 +/- 0.030 (in 3 folds),0.721 +/- 0.027 (in 3 folds),0.736 +/- 0.045 (in 3 folds),0.701 +/- 0.043 (in 3 folds),0.452 +/- 0.044 (in 3 folds),0.703,0.455,165,0,165,0.0,True


/users/maximz/code/boyd-immune-repertoire-classification/out/repertoire_stats/TCR/ethnicity_condensed_healthy_only/train_smaller_model.compare_model_scores.test_set_performance.tsv










GeneLocus.TCR TargetObsColumnEnum.age_group_healthy_only --> /users/maximz/code/boyd-immune-repertoire-classification/out/repertoire_stats/TCR/age_group_healthy_only


























































































































































































































Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
linearsvm_ovr,0.746 +/- 0.042 (in 3 folds),0.731 +/- 0.045 (in 3 folds),0.771 +/- 0.044 (in 3 folds),0.758 +/- 0.051 (in 3 folds),0.439 +/- 0.063 (in 3 folds),0.338 +/- 0.068 (in 3 folds),0.436,0.326,165,0,165,0.0,False
linearsvm_ovr.decision_thresholds_tuned,0.746 +/- 0.042 (in 3 folds),0.731 +/- 0.045 (in 3 folds),0.771 +/- 0.044 (in 3 folds),0.758 +/- 0.051 (in 3 folds),0.437 +/- 0.085 (in 3 folds),0.360 +/- 0.087 (in 3 folds),0.436,0.317,165,0,165,0.0,True
lasso_multiclass,0.731 +/- 0.040 (in 3 folds),0.716 +/- 0.039 (in 3 folds),0.763 +/- 0.043 (in 3 folds),0.750 +/- 0.050 (in 3 folds),0.475 +/- 0.075 (in 3 folds),0.378 +/- 0.089 (in 3 folds),0.473,0.372,165,0,165,0.0,False
lasso_multiclass.decision_thresholds_tuned,0.731 +/- 0.040 (in 3 folds),0.716 +/- 0.039 (in 3 folds),0.763 +/- 0.043 (in 3 folds),0.750 +/- 0.050 (in 3 folds),0.445 +/- 0.094 (in 3 folds),0.348 +/- 0.064 (in 3 folds),0.442,0.329,165,0,165,0.0,False
rf_multiclass,0.720 +/- 0.062 (in 3 folds),0.705 +/- 0.065 (in 3 folds),0.740 +/- 0.063 (in 3 folds),0.725 +/- 0.069 (in 3 folds),0.404 +/- 0.117 (in 3 folds),0.315 +/- 0.114 (in 3 folds),0.4,0.272,165,0,165,0.0,True
rf_multiclass.decision_thresholds_tuned,0.720 +/- 0.062 (in 3 folds),0.705 +/- 0.065 (in 3 folds),0.740 +/- 0.063 (in 3 folds),0.725 +/- 0.069 (in 3 folds),0.335 +/- 0.047 (in 3 folds),0.253 +/- 0.140 (in 3 folds),0.333,0.197,165,0,165,0.0,True
xgboost,0.713 +/- 0.046 (in 3 folds),0.701 +/- 0.039 (in 3 folds),0.746 +/- 0.040 (in 3 folds),0.736 +/- 0.041 (in 3 folds),0.389 +/- 0.061 (in 3 folds),0.290 +/- 0.070 (in 3 folds),0.388,0.265,165,0,165,0.0,False
xgboost.decision_thresholds_tuned,0.713 +/- 0.046 (in 3 folds),0.701 +/- 0.039 (in 3 folds),0.746 +/- 0.040 (in 3 folds),0.736 +/- 0.041 (in 3 folds),0.321 +/- 0.035 (in 3 folds),0.251 +/- 0.073 (in 3 folds),0.321,0.196,165,0,165,0.0,False
elasticnet_cv,0.676 +/- 0.033 (in 3 folds),0.663 +/- 0.024 (in 3 folds),0.719 +/- 0.023 (in 3 folds),0.708 +/- 0.031 (in 3 folds),0.308 +/- 0.088 (in 3 folds),0.268 +/- 0.082 (in 3 folds),0.309,0.162,165,0,165,0.0,True
elasticnet_cv.decision_thresholds_tuned,0.676 +/- 0.033 (in 3 folds),0.663 +/- 0.024 (in 3 folds),0.719 +/- 0.023 (in 3 folds),0.708 +/- 0.031 (in 3 folds),0.323 +/- 0.075 (in 3 folds),0.279 +/- 0.061 (in 3 folds),0.327,0.194,165,0,165,0.0,True


/users/maximz/code/boyd-immune-repertoire-classification/out/repertoire_stats/TCR/age_group_healthy_only/train_smaller_model.compare_model_scores.test_set_performance.tsv


GeneLocus.TCR TargetObsColumnEnum.age_group_binary_healthy_only --> /users/maximz/code/boyd-immune-repertoire-classification/out/repertoire_stats/TCR/age_group_binary_healthy_only


Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
linearsvm_ovr,0.779 +/- 0.046 (in 3 folds),0.779 +/- 0.046 (in 3 folds),0.886 +/- 0.010 (in 3 folds),0.886 +/- 0.010 (in 3 folds),0.695 +/- 0.098 (in 3 folds),0.375 +/- 0.201 (in 3 folds),0.691,0.366,165,0,165,0.0,False
linearsvm_ovr.decision_thresholds_tuned,0.779 +/- 0.046 (in 3 folds),0.779 +/- 0.046 (in 3 folds),0.886 +/- 0.010 (in 3 folds),0.886 +/- 0.010 (in 3 folds),0.661 +/- 0.047 (in 3 folds),0.350 +/- 0.111 (in 3 folds),0.661,0.342,165,0,165,0.0,False
lasso_multiclass,0.776 +/- 0.051 (in 3 folds),0.776 +/- 0.051 (in 3 folds),0.885 +/- 0.014 (in 3 folds),0.885 +/- 0.014 (in 3 folds),0.669 +/- 0.076 (in 3 folds),0.323 +/- 0.138 (in 3 folds),0.667,0.315,165,0,165,0.0,False
lasso_multiclass.decision_thresholds_tuned,0.776 +/- 0.051 (in 3 folds),0.776 +/- 0.051 (in 3 folds),0.885 +/- 0.014 (in 3 folds),0.885 +/- 0.014 (in 3 folds),0.636 +/- 0.099 (in 3 folds),0.382 +/- 0.139 (in 3 folds),0.63,0.362,165,0,165,0.0,False
rf_multiclass,0.774 +/- 0.058 (in 3 folds),0.774 +/- 0.058 (in 3 folds),0.882 +/- 0.017 (in 3 folds),0.882 +/- 0.017 (in 3 folds),0.671 +/- 0.050 (in 3 folds),0.258 +/- 0.076 (in 3 folds),0.673,0.23,165,0,165,0.0,False
rf_multiclass.decision_thresholds_tuned,0.774 +/- 0.058 (in 3 folds),0.774 +/- 0.058 (in 3 folds),0.882 +/- 0.017 (in 3 folds),0.882 +/- 0.017 (in 3 folds),0.694 +/- 0.057 (in 3 folds),0.380 +/- 0.182 (in 3 folds),0.691,0.38,165,0,165,0.0,False
xgboost,0.743 +/- 0.061 (in 3 folds),0.743 +/- 0.061 (in 3 folds),0.849 +/- 0.035 (in 3 folds),0.849 +/- 0.035 (in 3 folds),0.652 +/- 0.052 (in 3 folds),0.233 +/- 0.087 (in 3 folds),0.655,0.216,165,0,165,0.0,False
xgboost.decision_thresholds_tuned,0.743 +/- 0.061 (in 3 folds),0.743 +/- 0.061 (in 3 folds),0.849 +/- 0.035 (in 3 folds),0.849 +/- 0.035 (in 3 folds),0.707 +/- 0.082 (in 3 folds),0.429 +/- 0.135 (in 3 folds),0.703,0.412,165,0,165,0.0,False
elasticnet_cv,0.695 +/- 0.088 (in 3 folds),0.695 +/- 0.088 (in 3 folds),0.852 +/- 0.031 (in 3 folds),0.852 +/- 0.031 (in 3 folds),0.667 +/- 0.010 (in 3 folds),0.103 +/- 0.179 (in 3 folds),0.667,0.185,165,0,165,0.0,False
elasticnet_cv.decision_thresholds_tuned,0.695 +/- 0.088 (in 3 folds),0.695 +/- 0.088 (in 3 folds),0.852 +/- 0.031 (in 3 folds),0.852 +/- 0.031 (in 3 folds),0.607 +/- 0.120 (in 3 folds),0.425 +/- 0.118 (in 3 folds),0.6,0.408,165,0,165,0.0,False


/users/maximz/code/boyd-immune-repertoire-classification/out/repertoire_stats/TCR/age_group_binary_healthy_only/train_smaller_model.compare_model_scores.test_set_performance.tsv


GeneLocus.TCR TargetObsColumnEnum.sex_healthy_only --> /users/maximz/code/boyd-immune-repertoire-classification/out/repertoire_stats/TCR/sex_healthy_only


Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
lasso_cv,0.495 +/- 0.009 (in 3 folds),0.495 +/- 0.009 (in 3 folds),0.556 +/- 0.056 (in 3 folds),0.556 +/- 0.056 (in 3 folds),0.543 +/- 0.068 (in 3 folds),-0.005 +/- 0.008 (in 3 folds),0.539,0.033,165,0,165,0.0,False
lasso_cv.decision_thresholds_tuned,0.495 +/- 0.009 (in 3 folds),0.495 +/- 0.009 (in 3 folds),0.556 +/- 0.056 (in 3 folds),0.556 +/- 0.056 (in 3 folds),0.463 +/- 0.073 (in 3 folds),-0.006 +/- 0.011 (in 3 folds),0.467,-0.067,165,0,165,0.0,False
ridge_cv,0.490 +/- 0.017 (in 3 folds),0.490 +/- 0.017 (in 3 folds),0.554 +/- 0.057 (in 3 folds),0.554 +/- 0.057 (in 3 folds),0.549 +/- 0.062 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.545,0.072,165,0,165,0.0,False
ridge_cv.decision_thresholds_tuned,0.490 +/- 0.017 (in 3 folds),0.490 +/- 0.017 (in 3 folds),0.554 +/- 0.057 (in 3 folds),0.554 +/- 0.057 (in 3 folds),0.543 +/- 0.068 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.539,0.0,165,0,165,0.0,True
elasticnet_cv,0.467 +/- 0.045 (in 3 folds),0.467 +/- 0.045 (in 3 folds),0.536 +/- 0.022 (in 3 folds),0.536 +/- 0.022 (in 3 folds),0.537 +/- 0.075 (in 3 folds),-0.016 +/- 0.028 (in 3 folds),0.533,0.014,165,0,165,0.0,False
elasticnet_cv.decision_thresholds_tuned,0.467 +/- 0.045 (in 3 folds),0.467 +/- 0.045 (in 3 folds),0.536 +/- 0.022 (in 3 folds),0.536 +/- 0.022 (in 3 folds),0.456 +/- 0.085 (in 3 folds),-0.056 +/- 0.081 (in 3 folds),0.461,-0.082,165,0,165,0.0,False
linearsvm_ovr,0.464 +/- 0.033 (in 3 folds),0.464 +/- 0.033 (in 3 folds),0.534 +/- 0.061 (in 3 folds),0.534 +/- 0.061 (in 3 folds),0.445 +/- 0.048 (in 3 folds),-0.099 +/- 0.113 (in 3 folds),0.442,-0.11,165,0,165,0.0,False
linearsvm_ovr.decision_thresholds_tuned,0.464 +/- 0.033 (in 3 folds),0.464 +/- 0.033 (in 3 folds),0.534 +/- 0.061 (in 3 folds),0.534 +/- 0.061 (in 3 folds),0.440 +/- 0.079 (in 3 folds),-0.109 +/- 0.101 (in 3 folds),0.442,-0.104,165,0,165,0.0,False
lasso_multiclass,0.457 +/- 0.053 (in 3 folds),0.457 +/- 0.053 (in 3 folds),0.530 +/- 0.072 (in 3 folds),0.530 +/- 0.072 (in 3 folds),0.449 +/- 0.080 (in 3 folds),-0.090 +/- 0.173 (in 3 folds),0.448,-0.097,165,0,165,0.0,False
lasso_multiclass.decision_thresholds_tuned,0.457 +/- 0.053 (in 3 folds),0.457 +/- 0.053 (in 3 folds),0.530 +/- 0.072 (in 3 folds),0.530 +/- 0.072 (in 3 folds),0.452 +/- 0.063 (in 3 folds),-0.046 +/- 0.040 (in 3 folds),0.455,-0.079,165,0,165,0.0,False


/users/maximz/code/boyd-immune-repertoire-classification/out/repertoire_stats/TCR/sex_healthy_only/train_smaller_model.compare_model_scores.test_set_performance.tsv
