In [1]:
from summarynb import show, indexed_csv, table, chunks
from malid.external.summarynb_extras import plaintext, empty
from malid import config, helpers, logger
from malid.datamodels import (
    TargetObsColumnEnum,
    combine_classification_option_names,
)
import pandas as pd
from IPython.display import display, Markdown

# Convergent sequence cluster classifiers


### Distance thresholds

#### Clustering training set:

In [2]:
# Show the configured `cluster_amino_acids_across_patients` sequence identity
# thresholds (one value per gene locus). As the cell's last expression, the
# value is rendered as the cell output.
config.sequence_identity_thresholds.cluster_amino_acids_across_patients

{<GeneLocus.BCR: 1>: 0.85, <GeneLocus.TCR: 2>: 0.9}

#### Assigning test sequences to clusters:

In [3]:
# Show the configured `assign_test_sequences_to_clusters` sequence identity
# thresholds (one value per gene locus). As the cell's last expression, the
# value is rendered as the cell output.
config.sequence_identity_thresholds.assign_test_sequences_to_clusters

{<GeneLocus.BCR: 1>: 0.85, <GeneLocus.TCR: 2>: 0.9}

In [4]:
# Fetch the labels of the fold splits used for training and for validation;
# they are interpolated into the section headings rendered by the report loop.
fold_label_train, fold_label_validation = config.get_fold_split_labels()

In [5]:
def _show_model_comparison(
    scores_path, report_path_for, confusion_matrix_path_for, models_per_row=4
):
    """Render one evaluation section: a score table, then per-model details.

    Parameters
    ----------
    scores_path : str
        Path to a tab-separated model comparison table. Its first column is
        used as the index and supplies the model names.
    report_path_for : callable
        Maps a model name to the path of that model's classification report
        text file.
    confusion_matrix_path_for : callable
        Maps a model name to the path of that model's confusion matrix image.
    models_per_row : int, default 4
        Number of models laid out side by side in each `show` call.

    Notes
    -----
    A FileNotFoundError raised anywhere while rendering the section is logged
    as a warning instead of propagating, so a section whose output files are
    missing does not stop the rest of the notebook.
    """
    try:
        # All results in a table; the index holds the model names.
        all_results = pd.read_csv(scores_path, sep="\t", index_col=0)
        show(table(all_results), headers=["All results, sorted"])

        # Classification reports (top row) and confusion matrices (bottom row),
        # a few models at a time so each row stays readable.
        for model_names in chunks(all_results.index, models_per_row):
            show(
                [
                    [
                        plaintext(report_path_for(model_name))
                        for model_name in model_names
                    ],
                    [
                        confusion_matrix_path_for(model_name)
                        for model_name in model_names
                    ],
                ],
                headers=model_names,
                max_width=500,
            )
    except FileNotFoundError as err:
        logger.warning(f"Not run: {err}")


for gene_locus in config.gene_loci_used:
    # Map each classification target to its results output prefix.
    targets = {
        target: (
            config.paths.convergent_clusters_output_dir
            / gene_locus.name
            / combine_classification_option_names(target)
            / "train_smaller_model"
        )
        for target in config.classification_targets
    }

    # One compact line per target (same string form as the headings below)
    # rather than the full repr of the whole mapping.
    for target_obs_column, results_output_prefix in targets.items():
        print(f"{target_obs_column}: {results_output_prefix}")

    for target_obs_column, results_output_prefix in targets.items():
        display(
            Markdown(
                f"# {gene_locus}, {target_obs_column} trained on {fold_label_train} set"
            )
        )

        display(Markdown(f"## Specimen predictions on {fold_label_validation} set"))
        # The lambdas are invoked within this iteration, so they always see the
        # current results_output_prefix.
        _show_model_comparison(
            scores_path=f"{results_output_prefix}.compare_model_scores.tsv",
            report_path_for=lambda model_name: (
                f"{results_output_prefix}.classification_report.{model_name}.txt"
            ),
            confusion_matrix_path_for=lambda model_name: (
                f"{results_output_prefix}.confusion_matrix.{model_name}.png"
            ),
        )

        display(
            Markdown(
                "## Apply train-smaller model -- Test set performance - With and without tuning on validation set"
            )
        )
        # Test-set files put the model name before the artifact name.
        _show_model_comparison(
            scores_path=f"{results_output_prefix}.compare_model_scores.test_set_performance.tsv",
            report_path_for=lambda model_name: (
                f"{results_output_prefix}.test_set_performance.{model_name}.classification_report.txt"
            ),
            confusion_matrix_path_for=lambda model_name: (
                f"{results_output_prefix}.test_set_performance.{model_name}.confusion_matrix.png"
            ),
        )

        display(Markdown("---"))

{<TargetObsColumnEnum.disease: TargetObsColumn(obs_column_name='disease', is_target_binary_for_repertoire_composition_classifier=False, limited_to_disease=None, require_metadata_columns_present=None, confusion_matrix_expanded_column_name='disease.separate_past_exposures', blended_evaluation_column_name='disease.rollup')>: PosixPath('/users/maximz/code/boyd-immune-repertoire-classification/out/convergent_clusters/BCR/disease/train_smaller_model'), <TargetObsColumnEnum.disease_all_demographics_present: TargetObsColumn(obs_column_name='disease', is_target_binary_for_repertoire_composition_classifier=False, limited_to_disease=None, require_metadata_columns_present=['age', 'sex', 'ethnicity_condensed', 'age_group'], confusion_matrix_expanded_column_name='disease.separate_past_exposures', blended_evaluation_column_name='disease.rollup')>: PosixPath('/users/maximz/code/boyd-immune-repertoire-classification/out/convergent_clusters/BCR/disease_all_demographics_present/train_smaller_model'), <Ta

# GeneLocus.BCR, TargetObsColumnEnum.disease trained on train_smaller set

## Specimen predictions on validation set

Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,Accuracy per fold with abstention,MCC per fold with abstention,Unknown/abstention proportion per fold with abstention,ROC-AUC (weighted OvO) per fold with abstention,ROC-AUC (macro OvO) per fold with abstention,au-PRC (weighted OvO) per fold with abstention,au-PRC (macro OvO) per fold with abstention,Accuracy global with abstention,MCC global with abstention,Unknown/abstention proportion global with abstention,Abstention label global with abstention,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
lasso_multiclass,0.912 +/- 0.010 (in 3 folds),0.923 +/- 0.009 (in 3 folds),0.917 +/- 0.004 (in 3 folds),0.930 +/- 0.004 (in 3 folds),0.750 +/- 0.010 (in 3 folds),0.641 +/- 0.021 (in 3 folds),0.75,0.637,0.743 +/- 0.019 (in 3 folds),0.633 +/- 0.027 (in 3 folds),0.028 +/- 0.000 (in 1 folds),0.912 +/- 0.014 (in 2 folds),0.924 +/- 0.013 (in 2 folds),0.918 +/- 0.005 (in 2 folds),0.931 +/- 0.005 (in 2 folds),0.743,0.628,0.009,Unknown,320.0,3.0,323.0,0.009288,False
linearsvm_ovr,0.912 +/- 0.004 (in 3 folds),0.922 +/- 0.004 (in 3 folds),0.919 +/- 0.007 (in 3 folds),0.931 +/- 0.006 (in 3 folds),0.754 +/- 0.012 (in 3 folds),0.647 +/- 0.017 (in 3 folds),0.754,0.643,0.749 +/- 0.005 (in 3 folds),0.642 +/- 0.008 (in 3 folds),0.018 +/- 0.000 (in 1 folds),0.913 +/- 0.005 (in 2 folds),0.924 +/- 0.004 (in 2 folds),0.923 +/- 0.005 (in 2 folds),0.934 +/- 0.004 (in 2 folds),0.749,0.638,0.006,Unknown,321.0,2.0,323.0,0.006192,False
ridge_cv,0.903 +/- 0.002 (in 3 folds),0.915 +/- 0.003 (in 3 folds),0.905 +/- 0.006 (in 3 folds),0.920 +/- 0.002 (in 3 folds),0.563 +/- 0.077 (in 3 folds),0.337 +/- 0.138 (in 3 folds),0.562,0.344,0.561 +/- 0.078 (in 3 folds),0.335 +/- 0.138 (in 3 folds),0.009 +/- 0.000 (in 1 folds),0.902 +/- 0.001 (in 2 folds),0.916 +/- 0.004 (in 2 folds),0.903 +/- 0.007 (in 2 folds),0.920 +/- 0.003 (in 2 folds),0.56,0.342,0.003,Unknown,322.0,1.0,323.0,0.003096,False
lasso_cv,0.897 +/- 0.017 (in 3 folds),0.907 +/- 0.018 (in 3 folds),0.903 +/- 0.012 (in 3 folds),0.916 +/- 0.012 (in 3 folds),0.532 +/- 0.035 (in 3 folds),0.284 +/- 0.068 (in 3 folds),0.531,0.287,0.524 +/- 0.041 (in 3 folds),0.266 +/- 0.089 (in 3 folds),0.023 +/- 0.006 (in 2 folds),0.896 +/- 0.000 (in 1 folds),0.909 +/- 0.000 (in 1 folds),0.907 +/- 0.000 (in 1 folds),0.921 +/- 0.000 (in 1 folds),0.523,0.268,0.015,Unknown,318.0,5.0,323.0,0.01548,True
rf_multiclass,0.889 +/- 0.024 (in 3 folds),0.896 +/- 0.025 (in 3 folds),0.885 +/- 0.024 (in 3 folds),0.894 +/- 0.023 (in 3 folds),0.740 +/- 0.022 (in 3 folds),0.616 +/- 0.034 (in 3 folds),0.74,0.613,0.731 +/- 0.032 (in 3 folds),0.606 +/- 0.046 (in 3 folds),0.018 +/- 0.013 (in 2 folds),0.879 +/- 0.000 (in 1 folds),0.886 +/- 0.000 (in 1 folds),0.878 +/- 0.000 (in 1 folds),0.888 +/- 0.000 (in 1 folds),0.731,0.602,0.012,Unknown,319.0,4.0,323.0,0.012384,False
xgboost,0.882 +/- 0.009 (in 3 folds),0.887 +/- 0.009 (in 3 folds),0.883 +/- 0.009 (in 3 folds),0.892 +/- 0.008 (in 3 folds),0.721 +/- 0.007 (in 3 folds),0.587 +/- 0.004 (in 3 folds),0.721,0.583,0.712 +/- 0.010 (in 3 folds),0.577 +/- 0.010 (in 3 folds),0.018 +/- 0.013 (in 2 folds),0.891 +/- 0.000 (in 1 folds),0.897 +/- 0.000 (in 1 folds),0.893 +/- 0.000 (in 1 folds),0.901 +/- 0.000 (in 1 folds),0.712,0.573,0.012,Unknown,319.0,4.0,323.0,0.012384,False
elasticnet_cv,0.878 +/- 0.023 (in 3 folds),0.891 +/- 0.019 (in 3 folds),0.891 +/- 0.020 (in 3 folds),0.906 +/- 0.017 (in 3 folds),0.590 +/- 0.129 (in 3 folds),0.370 +/- 0.219 (in 3 folds),0.589,0.386,0.587 +/- 0.133 (in 3 folds),0.368 +/- 0.223 (in 3 folds),0.018 +/- 0.000 (in 1 folds),0.875 +/- 0.033 (in 2 folds),0.891 +/- 0.027 (in 2 folds),0.890 +/- 0.028 (in 2 folds),0.906 +/- 0.024 (in 2 folds),0.585,0.382,0.006,Unknown,321.0,2.0,323.0,0.006192,False
dummy_stratified,0.536 +/- 0.032 (in 3 folds),0.543 +/- 0.036 (in 3 folds),0.529 +/- 0.020 (in 3 folds),0.535 +/- 0.024 (in 3 folds),0.378 +/- 0.047 (in 3 folds),0.066 +/- 0.060 (in 3 folds),0.377,0.064,0.366 +/- 0.040 (in 3 folds),0.064 +/- 0.055 (in 3 folds),0.031 +/- 0.015 (in 3 folds),,,,,0.365,0.063,0.031,Unknown,313.0,10.0,323.0,0.03096,False
dummy_most_frequent,0.500 +/- 0.000 (in 3 folds),0.500 +/- 0.000 (in 3 folds),0.500 +/- 0.000 (in 3 folds),0.500 +/- 0.000 (in 3 folds),0.467 +/- 0.016 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.466,0.0,0.452 +/- 0.010 (in 3 folds),0.028 +/- 0.020 (in 3 folds),0.031 +/- 0.015 (in 3 folds),,,,,0.452,0.025,0.031,Unknown,313.0,10.0,323.0,0.03096,True
"All results, sorted",,,,,,,,,,,,,,,,,,,,,,,,

Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,Accuracy per fold with abstention,MCC per fold with abstention,Unknown/abstention proportion per fold with abstention,ROC-AUC (weighted OvO) per fold with abstention,ROC-AUC (macro OvO) per fold with abstention,au-PRC (weighted OvO) per fold with abstention,au-PRC (macro OvO) per fold with abstention,Accuracy global with abstention,MCC global with abstention,Unknown/abstention proportion global with abstention,Abstention label global with abstention,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
lasso_multiclass,0.912 +/- 0.010 (in 3 folds),0.923 +/- 0.009 (in 3 folds),0.917 +/- 0.004 (in 3 folds),0.930 +/- 0.004 (in 3 folds),0.750 +/- 0.010 (in 3 folds),0.641 +/- 0.021 (in 3 folds),0.75,0.637,0.743 +/- 0.019 (in 3 folds),0.633 +/- 0.027 (in 3 folds),0.028 +/- 0.000 (in 1 folds),0.912 +/- 0.014 (in 2 folds),0.924 +/- 0.013 (in 2 folds),0.918 +/- 0.005 (in 2 folds),0.931 +/- 0.005 (in 2 folds),0.743,0.628,0.009,Unknown,320,3,323,0.009288,False
linearsvm_ovr,0.912 +/- 0.004 (in 3 folds),0.922 +/- 0.004 (in 3 folds),0.919 +/- 0.007 (in 3 folds),0.931 +/- 0.006 (in 3 folds),0.754 +/- 0.012 (in 3 folds),0.647 +/- 0.017 (in 3 folds),0.754,0.643,0.749 +/- 0.005 (in 3 folds),0.642 +/- 0.008 (in 3 folds),0.018 +/- 0.000 (in 1 folds),0.913 +/- 0.005 (in 2 folds),0.924 +/- 0.004 (in 2 folds),0.923 +/- 0.005 (in 2 folds),0.934 +/- 0.004 (in 2 folds),0.749,0.638,0.006,Unknown,321,2,323,0.006192,False
ridge_cv,0.903 +/- 0.002 (in 3 folds),0.915 +/- 0.003 (in 3 folds),0.905 +/- 0.006 (in 3 folds),0.920 +/- 0.002 (in 3 folds),0.563 +/- 0.077 (in 3 folds),0.337 +/- 0.138 (in 3 folds),0.562,0.344,0.561 +/- 0.078 (in 3 folds),0.335 +/- 0.138 (in 3 folds),0.009 +/- 0.000 (in 1 folds),0.902 +/- 0.001 (in 2 folds),0.916 +/- 0.004 (in 2 folds),0.903 +/- 0.007 (in 2 folds),0.920 +/- 0.003 (in 2 folds),0.56,0.342,0.003,Unknown,322,1,323,0.003096,False
lasso_cv,0.897 +/- 0.017 (in 3 folds),0.907 +/- 0.018 (in 3 folds),0.903 +/- 0.012 (in 3 folds),0.916 +/- 0.012 (in 3 folds),0.532 +/- 0.035 (in 3 folds),0.284 +/- 0.068 (in 3 folds),0.531,0.287,0.524 +/- 0.041 (in 3 folds),0.266 +/- 0.089 (in 3 folds),0.023 +/- 0.006 (in 2 folds),0.896 +/- 0.000 (in 1 folds),0.909 +/- 0.000 (in 1 folds),0.907 +/- 0.000 (in 1 folds),0.921 +/- 0.000 (in 1 folds),0.523,0.268,0.015,Unknown,318,5,323,0.01548,True
rf_multiclass,0.889 +/- 0.024 (in 3 folds),0.896 +/- 0.025 (in 3 folds),0.885 +/- 0.024 (in 3 folds),0.894 +/- 0.023 (in 3 folds),0.740 +/- 0.022 (in 3 folds),0.616 +/- 0.034 (in 3 folds),0.74,0.613,0.731 +/- 0.032 (in 3 folds),0.606 +/- 0.046 (in 3 folds),0.018 +/- 0.013 (in 2 folds),0.879 +/- 0.000 (in 1 folds),0.886 +/- 0.000 (in 1 folds),0.878 +/- 0.000 (in 1 folds),0.888 +/- 0.000 (in 1 folds),0.731,0.602,0.012,Unknown,319,4,323,0.012384,False
xgboost,0.882 +/- 0.009 (in 3 folds),0.887 +/- 0.009 (in 3 folds),0.883 +/- 0.009 (in 3 folds),0.892 +/- 0.008 (in 3 folds),0.721 +/- 0.007 (in 3 folds),0.587 +/- 0.004 (in 3 folds),0.721,0.583,0.712 +/- 0.010 (in 3 folds),0.577 +/- 0.010 (in 3 folds),0.018 +/- 0.013 (in 2 folds),0.891 +/- 0.000 (in 1 folds),0.897 +/- 0.000 (in 1 folds),0.893 +/- 0.000 (in 1 folds),0.901 +/- 0.000 (in 1 folds),0.712,0.573,0.012,Unknown,319,4,323,0.012384,False
elasticnet_cv,0.878 +/- 0.023 (in 3 folds),0.891 +/- 0.019 (in 3 folds),0.891 +/- 0.020 (in 3 folds),0.906 +/- 0.017 (in 3 folds),0.590 +/- 0.129 (in 3 folds),0.370 +/- 0.219 (in 3 folds),0.589,0.386,0.587 +/- 0.133 (in 3 folds),0.368 +/- 0.223 (in 3 folds),0.018 +/- 0.000 (in 1 folds),0.875 +/- 0.033 (in 2 folds),0.891 +/- 0.027 (in 2 folds),0.890 +/- 0.028 (in 2 folds),0.906 +/- 0.024 (in 2 folds),0.585,0.382,0.006,Unknown,321,2,323,0.006192,False
dummy_stratified,0.536 +/- 0.032 (in 3 folds),0.543 +/- 0.036 (in 3 folds),0.529 +/- 0.020 (in 3 folds),0.535 +/- 0.024 (in 3 folds),0.378 +/- 0.047 (in 3 folds),0.066 +/- 0.060 (in 3 folds),0.377,0.064,0.366 +/- 0.040 (in 3 folds),0.064 +/- 0.055 (in 3 folds),0.031 +/- 0.015 (in 3 folds),,,,,0.365,0.063,0.031,Unknown,313,10,323,0.03096,False
dummy_most_frequent,0.500 +/- 0.000 (in 3 folds),0.500 +/- 0.000 (in 3 folds),0.500 +/- 0.000 (in 3 folds),0.500 +/- 0.000 (in 3 folds),0.467 +/- 0.016 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.466,0.0,0.452 +/- 0.010 (in 3 folds),0.028 +/- 0.020 (in 3 folds),0.031 +/- 0.015 (in 3 folds),,,,,0.452,0.025,0.031,Unknown,313,10,323,0.03096,True


lasso_multiclass,linearsvm_ovr,ridge_cv,lasso_cv
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.912 +/- 0.010 (in 3 folds) ROC-AUC (macro OvO): 0.923 +/- 0.009 (in 3 folds) au-PRC (weighted OvO): 0.917 +/- 0.004 (in 3 folds) au-PRC (macro OvO): 0.930 +/- 0.004 (in 3 folds) Accuracy: 0.750 +/- 0.010 (in 3 folds) MCC: 0.641 +/- 0.021 (in 3 folds) Global scores without abstention: Accuracy: 0.750 MCC: 0.637 Per-fold scores with abstention (note that abstentions not included in probability-based scores): ROC-AUC (weighted OvO): 0.912 +/- 0.014 (in 2 folds) ROC-AUC (macro OvO): 0.924 +/- 0.013 (in 2 folds) au-PRC (weighted OvO): 0.918 +/- 0.005 (in 2 folds) au-PRC (macro OvO): 0.931 +/- 0.005 (in 2 folds) Accuracy: 0.743 +/- 0.019 (in 3 folds) MCC: 0.633 +/- 0.027 (in 3 folds) Unknown/abstention proportion: 0.028 +/- 0.000 (in 1 folds) Global scores with abstention: Accuracy: 0.743 MCC: 0.628 Unknown/abstention proportion: 0.009 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  Covid19 0.79 0.88 0.83 42  HIV 0.85 0.86 0.85 64 Healthy/Background 0.77 0.77 0.77 149  Lupus 0.57 0.50 0.53 68  Unknown 0.00 0.00 0.00 0  accuracy 0.74 323  macro avg 0.59 0.60 0.60 323  weighted avg 0.74 0.74 0.74 323,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.912 +/- 0.004 (in 3 folds) ROC-AUC (macro OvO): 0.922 +/- 0.004 (in 3 folds) au-PRC (weighted OvO): 0.919 +/- 0.007 (in 3 folds) au-PRC (macro OvO): 0.931 +/- 0.006 (in 3 folds) Accuracy: 0.754 +/- 0.012 (in 3 folds) MCC: 0.647 +/- 0.017 (in 3 folds) Global scores without abstention: Accuracy: 0.754 MCC: 0.643 Per-fold scores with abstention (note that abstentions not included in probability-based scores): ROC-AUC (weighted OvO): 0.913 +/- 0.005 (in 2 folds) ROC-AUC (macro OvO): 0.924 +/- 0.004 (in 2 folds) au-PRC (weighted OvO): 0.923 +/- 0.005 (in 2 folds) au-PRC (macro OvO): 0.934 +/- 0.004 (in 2 folds) Accuracy: 0.749 +/- 0.005 (in 3 folds) MCC: 0.642 +/- 0.008 (in 3 folds) Unknown/abstention 
proportion: 0.018 +/- 0.000 (in 1 folds) Global scores with abstention: Accuracy: 0.749 MCC: 0.638 Unknown/abstention proportion: 0.006 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  Covid19 0.79 0.88 0.83 42  HIV 0.84 0.88 0.85 64 Healthy/Background 0.78 0.77 0.77 149  Lupus 0.57 0.51 0.54 68  Unknown 0.00 0.00 0.00 0  accuracy 0.75 323  macro avg 0.60 0.61 0.60 323  weighted avg 0.75 0.75 0.75 323,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.903 +/- 0.002 (in 3 folds) ROC-AUC (macro OvO): 0.915 +/- 0.003 (in 3 folds) au-PRC (weighted OvO): 0.905 +/- 0.006 (in 3 folds) au-PRC (macro OvO): 0.920 +/- 0.002 (in 3 folds) Accuracy: 0.563 +/- 0.077 (in 3 folds) MCC: 0.337 +/- 0.138 (in 3 folds) Global scores without abstention: Accuracy: 0.562 MCC: 0.344 Per-fold scores with abstention (note that abstentions not included in probability-based scores): ROC-AUC (weighted OvO): 0.902 +/- 0.001 (in 2 folds) ROC-AUC (macro OvO): 0.916 +/- 0.004 (in 2 folds) au-PRC (weighted OvO): 0.903 +/- 0.007 (in 2 folds) au-PRC (macro OvO): 0.920 +/- 0.003 (in 2 folds) Accuracy: 0.561 +/- 0.078 (in 3 folds) MCC: 0.335 +/- 0.138 (in 3 folds) Unknown/abstention proportion: 0.009 +/- 0.000 (in 1 folds) Global scores with abstention: Accuracy: 0.560 MCC: 0.342 Unknown/abstention proportion: 0.003 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  Covid19 1.00 0.17 0.29 42  HIV 0.95 0.31 0.47 64 Healthy/Background 0.52 0.99 0.68 149  Lupus 0.78 0.10 0.18 68  Unknown 0.00 0.00 0.00 0  accuracy 0.56 323  macro avg 0.65 0.31 0.32 323  weighted avg 0.72 0.56 0.48 323,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.897 +/- 0.017 (in 3 folds) ROC-AUC (macro OvO): 0.907 +/- 0.018 (in 3 folds) au-PRC (weighted OvO): 0.903 +/- 0.012 (in 3 folds) au-PRC (macro OvO): 0.916 +/- 0.012 (in 3 folds) Accuracy: 0.532 +/- 0.035 (in 3 folds) MCC: 0.284 +/- 0.068 (in 
3 folds) Global scores without abstention: Accuracy: 0.531 MCC: 0.287 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.524 +/- 0.041 (in 3 folds) MCC: 0.266 +/- 0.089 (in 3 folds) Unknown/abstention proportion: 0.023 +/- 0.006 (in 2 folds) ROC-AUC (weighted OvO): 0.896 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.909 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.907 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.921 +/- 0.000 (in 1 folds) Global scores with abstention: Accuracy: 0.523 MCC: 0.268 Unknown/abstention proportion: 0.015 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  Covid19 0.00 0.00 0.00 42  HIV 1.00 0.33 0.49 64 Healthy/Background 0.50 0.99 0.66 149  Lupus 0.00 0.00 0.00 68  Unknown 0.00 0.00 0.00 0  accuracy 0.52 323  macro avg 0.30 0.26 0.23 323  weighted avg 0.43 0.52 0.40 323
,,,


rf_multiclass,xgboost,elasticnet_cv,dummy_stratified
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.889 +/- 0.024 (in 3 folds) ROC-AUC (macro OvO): 0.896 +/- 0.025 (in 3 folds) au-PRC (weighted OvO): 0.885 +/- 0.024 (in 3 folds) au-PRC (macro OvO): 0.894 +/- 0.023 (in 3 folds) Accuracy: 0.740 +/- 0.022 (in 3 folds) MCC: 0.616 +/- 0.034 (in 3 folds) Global scores without abstention: Accuracy: 0.740 MCC: 0.613 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.731 +/- 0.032 (in 3 folds) MCC: 0.606 +/- 0.046 (in 3 folds) Unknown/abstention proportion: 0.018 +/- 0.013 (in 2 folds) ROC-AUC (weighted OvO): 0.879 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.886 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.878 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.888 +/- 0.000 (in 1 folds) Global scores with abstention: Accuracy: 0.731 MCC: 0.602 Unknown/abstention proportion: 0.012 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  Covid19 0.91 0.74 0.82 42  HIV 0.86 0.78 0.82 64 Healthy/Background 0.75 0.83 0.79 149  Lupus 0.51 0.46 0.48 68  Unknown 0.00 0.00 0.00 0  accuracy 0.73 323  macro avg 0.61 0.56 0.58 323  weighted avg 0.74 0.73 0.73 323,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.882 +/- 0.009 (in 3 folds) ROC-AUC (macro OvO): 0.887 +/- 0.009 (in 3 folds) au-PRC (weighted OvO): 0.883 +/- 0.009 (in 3 folds) au-PRC (macro OvO): 0.892 +/- 0.008 (in 3 folds) Accuracy: 0.721 +/- 0.007 (in 3 folds) MCC: 0.587 +/- 0.004 (in 3 folds) Global scores without abstention: Accuracy: 0.721 MCC: 0.583 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.712 +/- 0.010 (in 3 folds) MCC: 0.577 +/- 0.010 (in 3 folds) Unknown/abstention proportion: 0.018 +/- 0.013 (in 2 folds) ROC-AUC (weighted OvO): 0.891 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.897 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.893 +/- 0.000 (in 1 folds) au-PRC 
(macro OvO): 0.901 +/- 0.000 (in 1 folds) Global scores with abstention: Accuracy: 0.712 MCC: 0.573 Unknown/abstention proportion: 0.012 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  Covid19 0.88 0.69 0.77 42  HIV 0.87 0.72 0.79 64 Healthy/Background 0.72 0.84 0.78 149  Lupus 0.50 0.44 0.47 68  Unknown 0.00 0.00 0.00 0  accuracy 0.71 323  macro avg 0.59 0.54 0.56 323  weighted avg 0.72 0.71 0.71 323,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.878 +/- 0.023 (in 3 folds) ROC-AUC (macro OvO): 0.891 +/- 0.019 (in 3 folds) au-PRC (weighted OvO): 0.891 +/- 0.020 (in 3 folds) au-PRC (macro OvO): 0.906 +/- 0.017 (in 3 folds) Accuracy: 0.590 +/- 0.129 (in 3 folds) MCC: 0.370 +/- 0.219 (in 3 folds) Global scores without abstention: Accuracy: 0.589 MCC: 0.386 Per-fold scores with abstention (note that abstentions not included in probability-based scores): ROC-AUC (weighted OvO): 0.875 +/- 0.033 (in 2 folds) ROC-AUC (macro OvO): 0.891 +/- 0.027 (in 2 folds) au-PRC (weighted OvO): 0.890 +/- 0.028 (in 2 folds) au-PRC (macro OvO): 0.906 +/- 0.024 (in 2 folds) Accuracy: 0.587 +/- 0.133 (in 3 folds) MCC: 0.368 +/- 0.223 (in 3 folds) Unknown/abstention proportion: 0.018 +/- 0.000 (in 1 folds) Global scores with abstention: Accuracy: 0.585 MCC: 0.382 Unknown/abstention proportion: 0.006 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  Covid19 1.00 0.36 0.53 42  HIV 1.00 0.28 0.44 64 Healthy/Background 0.53 0.97 0.69 149  Lupus 0.71 0.18 0.28 68  Unknown 0.00 0.00 0.00 0  accuracy 0.59 323  macro avg 0.65 0.36 0.39 323  weighted avg 0.72 0.59 0.53 323,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.536 +/- 0.032 (in 3 folds) ROC-AUC (macro OvO): 0.543 +/- 0.036 (in 3 folds) au-PRC (weighted OvO): 0.529 +/- 0.020 (in 3 folds) au-PRC (macro OvO): 0.535 +/- 0.024 (in 3 folds) Accuracy: 0.378 +/- 0.047 (in 3 folds) MCC: 0.066 +/- 0.060 
(in 3 folds) Global scores without abstention: Accuracy: 0.377 MCC: 0.064 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.366 +/- 0.040 (in 3 folds) MCC: 0.064 +/- 0.055 (in 3 folds) Unknown/abstention proportion: 0.031 +/- 0.015 (in 3 folds) Global scores with abstention: Accuracy: 0.365 MCC: 0.063 Unknown/abstention proportion: 0.031 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  Covid19 0.30 0.24 0.27 42  HIV 0.22 0.25 0.23 64 Healthy/Background 0.47 0.53 0.50 149  Lupus 0.33 0.19 0.24 68  Unknown 0.00 0.00 0.00 0  accuracy 0.37 323  macro avg 0.27 0.24 0.25 323  weighted avg 0.37 0.37 0.36 323
,,,


dummy_most_frequent
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.500 +/- 0.000 (in 3 folds) ROC-AUC (macro OvO): 0.500 +/- 0.000 (in 3 folds) au-PRC (weighted OvO): 0.500 +/- 0.000 (in 3 folds) au-PRC (macro OvO): 0.500 +/- 0.000 (in 3 folds) Accuracy: 0.467 +/- 0.016 (in 3 folds) MCC: 0.000 +/- 0.000 (in 3 folds) Global scores without abstention: Accuracy: 0.466 MCC: 0.000 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.452 +/- 0.010 (in 3 folds) MCC: 0.028 +/- 0.020 (in 3 folds) Unknown/abstention proportion: 0.031 +/- 0.015 (in 3 folds) Global scores with abstention: Accuracy: 0.452 MCC: 0.025 Unknown/abstention proportion: 0.031 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  Covid19 0.00 0.00 0.00 42  HIV 0.00 0.00 0.00 64 Healthy/Background 0.47 0.98 0.63 149  Lupus 0.00 0.00 0.00 68  Unknown 0.00 0.00 0.00 0  accuracy 0.45 323  macro avg 0.09 0.20 0.13 323  weighted avg 0.22 0.45 0.29 323


## Apply train-smaller model -- Test set performance - With and without tuning on validation set

Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,Global evaluation column name global,Accuracy per fold with abstention,MCC per fold with abstention,Unknown/abstention proportion per fold with abstention,ROC-AUC (weighted OvO) per fold with abstention,ROC-AUC (macro OvO) per fold with abstention,au-PRC (weighted OvO) per fold with abstention,au-PRC (macro OvO) per fold with abstention,Accuracy global with abstention,MCC global with abstention,Unknown/abstention proportion global with abstention,Abstention label global with abstention,Global evaluation column name global with abstention,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
linearsvm_ovr,0.929 +/- 0.007 (in 3 folds),0.936 +/- 0.007 (in 3 folds),0.931 +/- 0.008 (in 3 folds),0.939 +/- 0.008 (in 3 folds),0.766 +/- 0.010 (in 3 folds),0.655 +/- 0.012 (in 3 folds),0.765,0.654,disease.separate_past_exposures,0.754 +/- 0.015 (in 3 folds),0.642 +/- 0.020 (in 3 folds),0.022 +/- 0.022 (in 2 folds),0.931 +/- 0.000 (in 1 folds),0.940 +/- 0.000 (in 1 folds),0.938 +/- 0.000 (in 1 folds),0.946 +/- 0.000 (in 1 folds),0.754,0.64,0.015,Unknown,disease.separate_past_exposures,473.0,7.0,480.0,0.014583,False
linearsvm_ovr.decision_thresholds_tuned,0.929 +/- 0.007 (in 3 folds),0.936 +/- 0.007 (in 3 folds),0.931 +/- 0.008 (in 3 folds),0.939 +/- 0.008 (in 3 folds),0.757 +/- 0.007 (in 3 folds),0.647 +/- 0.008 (in 3 folds),0.757,0.641,disease.separate_past_exposures,0.746 +/- 0.014 (in 3 folds),0.634 +/- 0.017 (in 3 folds),0.022 +/- 0.022 (in 2 folds),0.931 +/- 0.000 (in 1 folds),0.940 +/- 0.000 (in 1 folds),0.938 +/- 0.000 (in 1 folds),0.946 +/- 0.000 (in 1 folds),0.746,0.628,0.015,Unknown,disease.separate_past_exposures,473.0,7.0,480.0,0.014583,False
lasso_multiclass,0.926 +/- 0.009 (in 3 folds),0.933 +/- 0.010 (in 3 folds),0.927 +/- 0.014 (in 3 folds),0.935 +/- 0.014 (in 3 folds),0.761 +/- 0.010 (in 3 folds),0.650 +/- 0.022 (in 3 folds),0.761,0.649,disease.separate_past_exposures,0.744 +/- 0.031 (in 3 folds),0.630 +/- 0.046 (in 3 folds),0.034 +/- 0.030 (in 2 folds),0.931 +/- 0.000 (in 1 folds),0.940 +/- 0.000 (in 1 folds),0.935 +/- 0.000 (in 1 folds),0.945 +/- 0.000 (in 1 folds),0.744,0.628,0.023,Unknown,disease.separate_past_exposures,469.0,11.0,480.0,0.022917,False
lasso_multiclass.decision_thresholds_tuned,0.926 +/- 0.009 (in 3 folds),0.933 +/- 0.010 (in 3 folds),0.927 +/- 0.014 (in 3 folds),0.935 +/- 0.014 (in 3 folds),0.754 +/- 0.044 (in 3 folds),0.643 +/- 0.059 (in 3 folds),0.755,0.639,disease.separate_past_exposures,0.738 +/- 0.063 (in 3 folds),0.619 +/- 0.089 (in 3 folds),0.034 +/- 0.030 (in 2 folds),0.931 +/- 0.000 (in 1 folds),0.940 +/- 0.000 (in 1 folds),0.935 +/- 0.000 (in 1 folds),0.945 +/- 0.000 (in 1 folds),0.738,0.617,0.023,Unknown,disease.separate_past_exposures,469.0,11.0,480.0,0.022917,False
lasso_cv,0.909 +/- 0.014 (in 3 folds),0.918 +/- 0.015 (in 3 folds),0.914 +/- 0.008 (in 3 folds),0.923 +/- 0.008 (in 3 folds),0.544 +/- 0.017 (in 3 folds),0.317 +/- 0.047 (in 3 folds),0.543,0.318,disease.separate_past_exposures,0.523 +/- 0.016 (in 3 folds),0.267 +/- 0.052 (in 3 folds),0.057 +/- 0.028 (in 2 folds),0.902 +/- 0.000 (in 1 folds),0.914 +/- 0.000 (in 1 folds),0.912 +/- 0.000 (in 1 folds),0.924 +/- 0.000 (in 1 folds),0.523,0.261,0.037,Unknown,disease.separate_past_exposures,462.0,18.0,480.0,0.0375,False
lasso_cv.decision_thresholds_tuned,0.909 +/- 0.014 (in 3 folds),0.918 +/- 0.015 (in 3 folds),0.914 +/- 0.008 (in 3 folds),0.923 +/- 0.008 (in 3 folds),0.758 +/- 0.014 (in 3 folds),0.644 +/- 0.024 (in 3 folds),0.758,0.643,disease.separate_past_exposures,0.729 +/- 0.033 (in 3 folds),0.606 +/- 0.047 (in 3 folds),0.057 +/- 0.028 (in 2 folds),0.902 +/- 0.000 (in 1 folds),0.914 +/- 0.000 (in 1 folds),0.912 +/- 0.000 (in 1 folds),0.924 +/- 0.000 (in 1 folds),0.729,0.605,0.037,Unknown,disease.separate_past_exposures,462.0,18.0,480.0,0.0375,False
elasticnet_cv,0.909 +/- 0.011 (in 3 folds),0.916 +/- 0.011 (in 3 folds),0.914 +/- 0.009 (in 3 folds),0.923 +/- 0.009 (in 3 folds),0.610 +/- 0.132 (in 3 folds),0.390 +/- 0.278 (in 3 folds),0.612,0.44,disease.separate_past_exposures,0.604 +/- 0.141 (in 3 folds),0.379 +/- 0.297 (in 3 folds),0.037 +/- 0.000 (in 1 folds),0.914 +/- 0.010 (in 2 folds),0.921 +/- 0.010 (in 2 folds),0.918 +/- 0.008 (in 2 folds),0.928 +/- 0.007 (in 2 folds),0.604,0.424,0.013,Unknown,disease.separate_past_exposures,474.0,6.0,480.0,0.0125,False
elasticnet_cv.decision_thresholds_tuned,0.909 +/- 0.011 (in 3 folds),0.916 +/- 0.011 (in 3 folds),0.914 +/- 0.009 (in 3 folds),0.923 +/- 0.009 (in 3 folds),0.738 +/- 0.054 (in 3 folds),0.633 +/- 0.052 (in 3 folds),0.738,0.623,disease.separate_past_exposures,0.728 +/- 0.053 (in 3 folds),0.621 +/- 0.057 (in 3 folds),0.037 +/- 0.000 (in 1 folds),0.914 +/- 0.010 (in 2 folds),0.921 +/- 0.010 (in 2 folds),0.918 +/- 0.008 (in 2 folds),0.928 +/- 0.007 (in 2 folds),0.729,0.612,0.013,Unknown,disease.separate_past_exposures,474.0,6.0,480.0,0.0125,False
ridge_cv,0.907 +/- 0.010 (in 3 folds),0.917 +/- 0.011 (in 3 folds),0.914 +/- 0.006 (in 3 folds),0.924 +/- 0.006 (in 3 folds),0.576 +/- 0.065 (in 3 folds),0.371 +/- 0.124 (in 3 folds),0.577,0.383,disease.separate_past_exposures,0.572 +/- 0.068 (in 3 folds),0.362 +/- 0.131 (in 3 folds),0.009 +/- 0.004 (in 2 folds),0.913 +/- 0.000 (in 1 folds),0.923 +/- 0.000 (in 1 folds),0.920 +/- 0.000 (in 1 folds),0.930 +/- 0.000 (in 1 folds),0.573,0.374,0.006,Unknown,disease.separate_past_exposures,477.0,3.0,480.0,0.00625,False
ridge_cv.decision_thresholds_tuned,0.907 +/- 0.010 (in 3 folds),0.917 +/- 0.011 (in 3 folds),0.914 +/- 0.006 (in 3 folds),0.924 +/- 0.006 (in 3 folds),0.761 +/- 0.033 (in 3 folds),0.653 +/- 0.056 (in 3 folds),0.761,0.652,disease.separate_past_exposures,0.756 +/- 0.036 (in 3 folds),0.646 +/- 0.061 (in 3 folds),0.009 +/- 0.004 (in 2 folds),0.913 +/- 0.000 (in 1 folds),0.923 +/- 0.000 (in 1 folds),0.920 +/- 0.000 (in 1 folds),0.930 +/- 0.000 (in 1 folds),0.756,0.645,0.006,Unknown,disease.separate_past_exposures,477.0,3.0,480.0,0.00625,False

Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,Global evaluation column name global,Accuracy per fold with abstention,MCC per fold with abstention,Unknown/abstention proportion per fold with abstention,ROC-AUC (weighted OvO) per fold with abstention,ROC-AUC (macro OvO) per fold with abstention,au-PRC (weighted OvO) per fold with abstention,au-PRC (macro OvO) per fold with abstention,Accuracy global with abstention,MCC global with abstention,Unknown/abstention proportion global with abstention,Abstention label global with abstention,Global evaluation column name global with abstention,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
linearsvm_ovr,0.929 +/- 0.007 (in 3 folds),0.936 +/- 0.007 (in 3 folds),0.931 +/- 0.008 (in 3 folds),0.939 +/- 0.008 (in 3 folds),0.766 +/- 0.010 (in 3 folds),0.655 +/- 0.012 (in 3 folds),0.765,0.654,disease.separate_past_exposures,0.754 +/- 0.015 (in 3 folds),0.642 +/- 0.020 (in 3 folds),0.022 +/- 0.022 (in 2 folds),0.931 +/- 0.000 (in 1 folds),0.940 +/- 0.000 (in 1 folds),0.938 +/- 0.000 (in 1 folds),0.946 +/- 0.000 (in 1 folds),0.754,0.64,0.015,Unknown,disease.separate_past_exposures,473,7,480,0.014583,False
linearsvm_ovr.decision_thresholds_tuned,0.929 +/- 0.007 (in 3 folds),0.936 +/- 0.007 (in 3 folds),0.931 +/- 0.008 (in 3 folds),0.939 +/- 0.008 (in 3 folds),0.757 +/- 0.007 (in 3 folds),0.647 +/- 0.008 (in 3 folds),0.757,0.641,disease.separate_past_exposures,0.746 +/- 0.014 (in 3 folds),0.634 +/- 0.017 (in 3 folds),0.022 +/- 0.022 (in 2 folds),0.931 +/- 0.000 (in 1 folds),0.940 +/- 0.000 (in 1 folds),0.938 +/- 0.000 (in 1 folds),0.946 +/- 0.000 (in 1 folds),0.746,0.628,0.015,Unknown,disease.separate_past_exposures,473,7,480,0.014583,False
lasso_multiclass,0.926 +/- 0.009 (in 3 folds),0.933 +/- 0.010 (in 3 folds),0.927 +/- 0.014 (in 3 folds),0.935 +/- 0.014 (in 3 folds),0.761 +/- 0.010 (in 3 folds),0.650 +/- 0.022 (in 3 folds),0.761,0.649,disease.separate_past_exposures,0.744 +/- 0.031 (in 3 folds),0.630 +/- 0.046 (in 3 folds),0.034 +/- 0.030 (in 2 folds),0.931 +/- 0.000 (in 1 folds),0.940 +/- 0.000 (in 1 folds),0.935 +/- 0.000 (in 1 folds),0.945 +/- 0.000 (in 1 folds),0.744,0.628,0.023,Unknown,disease.separate_past_exposures,469,11,480,0.022917,False
lasso_multiclass.decision_thresholds_tuned,0.926 +/- 0.009 (in 3 folds),0.933 +/- 0.010 (in 3 folds),0.927 +/- 0.014 (in 3 folds),0.935 +/- 0.014 (in 3 folds),0.754 +/- 0.044 (in 3 folds),0.643 +/- 0.059 (in 3 folds),0.755,0.639,disease.separate_past_exposures,0.738 +/- 0.063 (in 3 folds),0.619 +/- 0.089 (in 3 folds),0.034 +/- 0.030 (in 2 folds),0.931 +/- 0.000 (in 1 folds),0.940 +/- 0.000 (in 1 folds),0.935 +/- 0.000 (in 1 folds),0.945 +/- 0.000 (in 1 folds),0.738,0.617,0.023,Unknown,disease.separate_past_exposures,469,11,480,0.022917,False
lasso_cv,0.909 +/- 0.014 (in 3 folds),0.918 +/- 0.015 (in 3 folds),0.914 +/- 0.008 (in 3 folds),0.923 +/- 0.008 (in 3 folds),0.544 +/- 0.017 (in 3 folds),0.317 +/- 0.047 (in 3 folds),0.543,0.318,disease.separate_past_exposures,0.523 +/- 0.016 (in 3 folds),0.267 +/- 0.052 (in 3 folds),0.057 +/- 0.028 (in 2 folds),0.902 +/- 0.000 (in 1 folds),0.914 +/- 0.000 (in 1 folds),0.912 +/- 0.000 (in 1 folds),0.924 +/- 0.000 (in 1 folds),0.523,0.261,0.037,Unknown,disease.separate_past_exposures,462,18,480,0.0375,False
lasso_cv.decision_thresholds_tuned,0.909 +/- 0.014 (in 3 folds),0.918 +/- 0.015 (in 3 folds),0.914 +/- 0.008 (in 3 folds),0.923 +/- 0.008 (in 3 folds),0.758 +/- 0.014 (in 3 folds),0.644 +/- 0.024 (in 3 folds),0.758,0.643,disease.separate_past_exposures,0.729 +/- 0.033 (in 3 folds),0.606 +/- 0.047 (in 3 folds),0.057 +/- 0.028 (in 2 folds),0.902 +/- 0.000 (in 1 folds),0.914 +/- 0.000 (in 1 folds),0.912 +/- 0.000 (in 1 folds),0.924 +/- 0.000 (in 1 folds),0.729,0.605,0.037,Unknown,disease.separate_past_exposures,462,18,480,0.0375,False
elasticnet_cv,0.909 +/- 0.011 (in 3 folds),0.916 +/- 0.011 (in 3 folds),0.914 +/- 0.009 (in 3 folds),0.923 +/- 0.009 (in 3 folds),0.610 +/- 0.132 (in 3 folds),0.390 +/- 0.278 (in 3 folds),0.612,0.44,disease.separate_past_exposures,0.604 +/- 0.141 (in 3 folds),0.379 +/- 0.297 (in 3 folds),0.037 +/- 0.000 (in 1 folds),0.914 +/- 0.010 (in 2 folds),0.921 +/- 0.010 (in 2 folds),0.918 +/- 0.008 (in 2 folds),0.928 +/- 0.007 (in 2 folds),0.604,0.424,0.013,Unknown,disease.separate_past_exposures,474,6,480,0.0125,False
elasticnet_cv.decision_thresholds_tuned,0.909 +/- 0.011 (in 3 folds),0.916 +/- 0.011 (in 3 folds),0.914 +/- 0.009 (in 3 folds),0.923 +/- 0.009 (in 3 folds),0.738 +/- 0.054 (in 3 folds),0.633 +/- 0.052 (in 3 folds),0.738,0.623,disease.separate_past_exposures,0.728 +/- 0.053 (in 3 folds),0.621 +/- 0.057 (in 3 folds),0.037 +/- 0.000 (in 1 folds),0.914 +/- 0.010 (in 2 folds),0.921 +/- 0.010 (in 2 folds),0.918 +/- 0.008 (in 2 folds),0.928 +/- 0.007 (in 2 folds),0.729,0.612,0.013,Unknown,disease.separate_past_exposures,474,6,480,0.0125,False
ridge_cv,0.907 +/- 0.010 (in 3 folds),0.917 +/- 0.011 (in 3 folds),0.914 +/- 0.006 (in 3 folds),0.924 +/- 0.006 (in 3 folds),0.576 +/- 0.065 (in 3 folds),0.371 +/- 0.124 (in 3 folds),0.577,0.383,disease.separate_past_exposures,0.572 +/- 0.068 (in 3 folds),0.362 +/- 0.131 (in 3 folds),0.009 +/- 0.004 (in 2 folds),0.913 +/- 0.000 (in 1 folds),0.923 +/- 0.000 (in 1 folds),0.920 +/- 0.000 (in 1 folds),0.930 +/- 0.000 (in 1 folds),0.573,0.374,0.006,Unknown,disease.separate_past_exposures,477,3,480,0.00625,False
ridge_cv.decision_thresholds_tuned,0.907 +/- 0.010 (in 3 folds),0.917 +/- 0.011 (in 3 folds),0.914 +/- 0.006 (in 3 folds),0.924 +/- 0.006 (in 3 folds),0.761 +/- 0.033 (in 3 folds),0.653 +/- 0.056 (in 3 folds),0.761,0.652,disease.separate_past_exposures,0.756 +/- 0.036 (in 3 folds),0.646 +/- 0.061 (in 3 folds),0.009 +/- 0.004 (in 2 folds),0.913 +/- 0.000 (in 1 folds),0.923 +/- 0.000 (in 1 folds),0.920 +/- 0.000 (in 1 folds),0.930 +/- 0.000 (in 1 folds),0.756,0.645,0.006,Unknown,disease.separate_past_exposures,477,3,480,0.00625,False


linearsvm_ovr,linearsvm_ovr.decision_thresholds_tuned,lasso_multiclass,lasso_multiclass.decision_thresholds_tuned
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.929 +/- 0.007 (in 3 folds) ROC-AUC (macro OvO): 0.936 +/- 0.007 (in 3 folds) au-PRC (weighted OvO): 0.931 +/- 0.008 (in 3 folds) au-PRC (macro OvO): 0.939 +/- 0.008 (in 3 folds) Accuracy: 0.766 +/- 0.010 (in 3 folds) MCC: 0.655 +/- 0.012 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.765 MCC: 0.654 Global evaluation column name: disease.separate_past_exposures Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.754 +/- 0.015 (in 3 folds) MCC: 0.642 +/- 0.020 (in 3 folds) Unknown/abstention proportion: 0.022 +/- 0.022 (in 2 folds) ROC-AUC (weighted OvO): 0.931 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.940 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.938 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.946 +/- 0.000 (in 1 folds) Global scores with abstention using column name disease.separate_past_exposures: Accuracy: 0.754 MCC: 0.640 Unknown/abstention proportion: 0.015 Abstention label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support  Covid19 0.77 0.78 0.77 63  HIV 0.88 0.82 0.85 98 Healthy/Background 0.76 0.84 0.80 221  Lupus 0.64 0.48 0.55 98  Unknown 0.00 0.00 0.00 0  accuracy 0.75 480  macro avg 0.61 0.58 0.59 480  weighted avg 0.76 0.75 0.75 480,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.929 +/- 0.007 (in 3 folds) ROC-AUC (macro OvO): 0.936 +/- 0.007 (in 3 folds) au-PRC (weighted OvO): 0.931 +/- 0.008 (in 3 folds) au-PRC (macro OvO): 0.939 +/- 0.008 (in 3 folds) Accuracy: 0.757 +/- 0.007 (in 3 folds) MCC: 0.647 +/- 0.008 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.757 MCC: 0.641 Global evaluation column name: disease.separate_past_exposures 
Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.746 +/- 0.014 (in 3 folds) MCC: 0.634 +/- 0.017 (in 3 folds) Unknown/abstention proportion: 0.022 +/- 0.022 (in 2 folds) ROC-AUC (weighted OvO): 0.931 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.940 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.938 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.946 +/- 0.000 (in 1 folds) Global scores with abstention using column name disease.separate_past_exposures: Accuracy: 0.746 MCC: 0.628 Unknown/abstention proportion: 0.015 Abstention label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support  Covid19 0.81 0.81 0.81 63  HIV 0.87 0.81 0.84 98 Healthy/Background 0.75 0.82 0.78 221  Lupus 0.60 0.48 0.53 98  Unknown 0.00 0.00 0.00 0  accuracy 0.75 480  macro avg 0.61 0.58 0.59 480  weighted avg 0.75 0.75 0.75 480,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.926 +/- 0.009 (in 3 folds) ROC-AUC (macro OvO): 0.933 +/- 0.010 (in 3 folds) au-PRC (weighted OvO): 0.927 +/- 0.014 (in 3 folds) au-PRC (macro OvO): 0.935 +/- 0.014 (in 3 folds) Accuracy: 0.761 +/- 0.010 (in 3 folds) MCC: 0.650 +/- 0.022 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.761 MCC: 0.649 Global evaluation column name: disease.separate_past_exposures Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.744 +/- 0.031 (in 3 folds) MCC: 0.630 +/- 0.046 (in 3 folds) Unknown/abstention proportion: 0.034 +/- 0.030 (in 2 folds) ROC-AUC (weighted OvO): 0.931 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.940 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.935 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.945 +/- 0.000 (in 1 folds) Global scores with abstention using column name 
disease.separate_past_exposures: Accuracy: 0.744 MCC: 0.628 Unknown/abstention proportion: 0.023 Abstention label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support  Covid19 0.79 0.76 0.77 63  HIV 0.85 0.83 0.84 98 Healthy/Background 0.78 0.80 0.79 221  Lupus 0.60 0.53 0.57 98  Unknown 0.00 0.00 0.00 0  accuracy 0.74 480  macro avg 0.60 0.58 0.59 480  weighted avg 0.76 0.74 0.75 480,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.926 +/- 0.009 (in 3 folds) ROC-AUC (macro OvO): 0.933 +/- 0.010 (in 3 folds) au-PRC (weighted OvO): 0.927 +/- 0.014 (in 3 folds) au-PRC (macro OvO): 0.935 +/- 0.014 (in 3 folds) Accuracy: 0.754 +/- 0.044 (in 3 folds) MCC: 0.643 +/- 0.059 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.755 MCC: 0.639 Global evaluation column name: disease.separate_past_exposures Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.738 +/- 0.063 (in 3 folds) MCC: 0.619 +/- 0.089 (in 3 folds) Unknown/abstention proportion: 0.034 +/- 0.030 (in 2 folds) ROC-AUC (weighted OvO): 0.931 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.940 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.935 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.945 +/- 0.000 (in 1 folds) Global scores with abstention using column name disease.separate_past_exposures: Accuracy: 0.738 MCC: 0.617 Unknown/abstention proportion: 0.023 Abstention label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support  Covid19 0.85 0.73 0.79 63  HIV 0.88 0.78 0.83 98 Healthy/Background 0.70 0.90 0.79 221  Lupus 0.73 0.33 0.45 98  Unknown 0.00 0.00 0.00 0  accuracy 0.74 480  macro avg 0.63 
0.55 0.57 480  weighted avg 0.76 0.74 0.73 480
,,,


lasso_cv,lasso_cv.decision_thresholds_tuned,elasticnet_cv,elasticnet_cv.decision_thresholds_tuned
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.909 +/- 0.014 (in 3 folds) ROC-AUC (macro OvO): 0.918 +/- 0.015 (in 3 folds) au-PRC (weighted OvO): 0.914 +/- 0.008 (in 3 folds) au-PRC (macro OvO): 0.923 +/- 0.008 (in 3 folds) Accuracy: 0.544 +/- 0.017 (in 3 folds) MCC: 0.317 +/- 0.047 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.543 MCC: 0.318 Global evaluation column name: disease.separate_past_exposures Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.523 +/- 0.016 (in 3 folds) MCC: 0.267 +/- 0.052 (in 3 folds) Unknown/abstention proportion: 0.057 +/- 0.028 (in 2 folds) ROC-AUC (weighted OvO): 0.902 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.914 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.912 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.924 +/- 0.000 (in 1 folds) Global scores with abstention using column name disease.separate_past_exposures: Accuracy: 0.523 MCC: 0.261 Unknown/abstention proportion: 0.037 Abstention label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support  Covid19 1.00 0.03 0.06 63  HIV 1.00 0.30 0.46 98 Healthy/Background 0.50 0.96 0.66 221  Lupus 1.00 0.07 0.13 98  Unknown 0.00 0.00 0.00 0  accuracy 0.52 480  macro avg 0.70 0.27 0.26 480  weighted avg 0.77 0.52 0.43 480,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.909 +/- 0.014 (in 3 folds) ROC-AUC (macro OvO): 0.918 +/- 0.015 (in 3 folds) au-PRC (weighted OvO): 0.914 +/- 0.008 (in 3 folds) au-PRC (macro OvO): 0.923 +/- 0.008 (in 3 folds) Accuracy: 0.758 +/- 0.014 (in 3 folds) MCC: 0.644 +/- 0.024 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.758 MCC: 0.643 Global evaluation column name: disease.separate_past_exposures 
Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.729 +/- 0.033 (in 3 folds) MCC: 0.606 +/- 0.047 (in 3 folds) Unknown/abstention proportion: 0.057 +/- 0.028 (in 2 folds) ROC-AUC (weighted OvO): 0.902 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.914 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.912 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.924 +/- 0.000 (in 1 folds) Global scores with abstention using column name disease.separate_past_exposures: Accuracy: 0.729 MCC: 0.605 Unknown/abstention proportion: 0.037 Abstention label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support  Covid19 0.85 0.75 0.80 63  HIV 0.88 0.76 0.81 98 Healthy/Background 0.70 0.87 0.78 221  Lupus 0.74 0.38 0.50 98  Unknown 0.00 0.00 0.00 0  accuracy 0.73 480  macro avg 0.64 0.55 0.58 480  weighted avg 0.77 0.73 0.73 480,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.909 +/- 0.011 (in 3 folds) ROC-AUC (macro OvO): 0.916 +/- 0.011 (in 3 folds) au-PRC (weighted OvO): 0.914 +/- 0.009 (in 3 folds) au-PRC (macro OvO): 0.923 +/- 0.009 (in 3 folds) Accuracy: 0.610 +/- 0.132 (in 3 folds) MCC: 0.390 +/- 0.278 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.612 MCC: 0.440 Global evaluation column name: disease.separate_past_exposures Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.604 +/- 0.141 (in 3 folds) MCC: 0.379 +/- 0.297 (in 3 folds) Unknown/abstention proportion: 0.037 +/- 0.000 (in 1 folds) ROC-AUC (weighted OvO): 0.914 +/- 0.010 (in 2 folds) ROC-AUC (macro OvO): 0.921 +/- 0.010 (in 2 folds) au-PRC (weighted OvO): 0.918 +/- 0.008 (in 2 folds) au-PRC (macro OvO): 0.928 +/- 0.007 (in 2 folds) Global scores with abstention using column name 
disease.separate_past_exposures: Accuracy: 0.604 MCC: 0.424 Unknown/abstention proportion: 0.013 Abstention label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support  Covid19 1.00 0.43 0.60 63  HIV 1.00 0.34 0.50 98 Healthy/Background 0.54 0.98 0.70 221  Lupus 0.82 0.14 0.24 98  Unknown 0.00 0.00 0.00 0  accuracy 0.60 480  macro avg 0.67 0.38 0.41 480  weighted avg 0.75 0.60 0.55 480,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.909 +/- 0.011 (in 3 folds) ROC-AUC (macro OvO): 0.916 +/- 0.011 (in 3 folds) au-PRC (weighted OvO): 0.914 +/- 0.009 (in 3 folds) au-PRC (macro OvO): 0.923 +/- 0.009 (in 3 folds) Accuracy: 0.738 +/- 0.054 (in 3 folds) MCC: 0.633 +/- 0.052 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.738 MCC: 0.623 Global evaluation column name: disease.separate_past_exposures Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.728 +/- 0.053 (in 3 folds) MCC: 0.621 +/- 0.057 (in 3 folds) Unknown/abstention proportion: 0.037 +/- 0.000 (in 1 folds) ROC-AUC (weighted OvO): 0.914 +/- 0.010 (in 2 folds) ROC-AUC (macro OvO): 0.921 +/- 0.010 (in 2 folds) au-PRC (weighted OvO): 0.918 +/- 0.008 (in 2 folds) au-PRC (macro OvO): 0.928 +/- 0.007 (in 2 folds) Global scores with abstention using column name disease.separate_past_exposures: Accuracy: 0.729 MCC: 0.612 Unknown/abstention proportion: 0.013 Abstention label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support  Covid19 0.60 0.87 0.71 63  HIV 0.86 0.76 0.80 98 Healthy/Background 0.76 0.78 0.77 221  Lupus 0.70 0.49 0.57 98  Unknown 0.00 0.00 0.00 0  accuracy 0.73 480  macro avg 0.58 
0.58 0.57 480  weighted avg 0.75 0.73 0.73 480
,,,


ridge_cv,ridge_cv.decision_thresholds_tuned,rf_multiclass,rf_multiclass.decision_thresholds_tuned
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.907 +/- 0.010 (in 3 folds) ROC-AUC (macro OvO): 0.917 +/- 0.011 (in 3 folds) au-PRC (weighted OvO): 0.914 +/- 0.006 (in 3 folds) au-PRC (macro OvO): 0.924 +/- 0.006 (in 3 folds) Accuracy: 0.576 +/- 0.065 (in 3 folds) MCC: 0.371 +/- 0.124 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.577 MCC: 0.383 Global evaluation column name: disease.separate_past_exposures Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.572 +/- 0.068 (in 3 folds) MCC: 0.362 +/- 0.131 (in 3 folds) Unknown/abstention proportion: 0.009 +/- 0.004 (in 2 folds) ROC-AUC (weighted OvO): 0.913 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.923 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.920 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.930 +/- 0.000 (in 1 folds) Global scores with abstention using column name disease.separate_past_exposures: Accuracy: 0.573 MCC: 0.374 Unknown/abstention proportion: 0.006 Abstention label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support  Covid19 1.00 0.16 0.27 63  HIV 0.97 0.37 0.53 98 Healthy/Background 0.52 1.00 0.69 221  Lupus 1.00 0.09 0.17 98  Unknown 0.00 0.00 0.00 0  accuracy 0.57 480  macro avg 0.70 0.32 0.33 480  weighted avg 0.77 0.57 0.49 480,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.907 +/- 0.010 (in 3 folds) ROC-AUC (macro OvO): 0.917 +/- 0.011 (in 3 folds) au-PRC (weighted OvO): 0.914 +/- 0.006 (in 3 folds) au-PRC (macro OvO): 0.924 +/- 0.006 (in 3 folds) Accuracy: 0.761 +/- 0.033 (in 3 folds) MCC: 0.653 +/- 0.056 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.761 MCC: 0.652 Global evaluation column name: disease.separate_past_exposures 
Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.756 +/- 0.036 (in 3 folds) MCC: 0.646 +/- 0.061 (in 3 folds) Unknown/abstention proportion: 0.009 +/- 0.004 (in 2 folds) ROC-AUC (weighted OvO): 0.913 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.923 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.920 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.930 +/- 0.000 (in 1 folds) Global scores with abstention using column name disease.separate_past_exposures: Accuracy: 0.756 MCC: 0.645 Unknown/abstention proportion: 0.006 Abstention label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support  Covid19 0.87 0.73 0.79 63  HIV 0.91 0.77 0.83 98 Healthy/Background 0.69 0.93 0.80 221  Lupus 0.80 0.37 0.50 98  Unknown 0.00 0.00 0.00 0  accuracy 0.76 480  macro avg 0.66 0.56 0.59 480  weighted avg 0.78 0.76 0.74 480,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.879 +/- 0.022 (in 3 folds) ROC-AUC (macro OvO): 0.886 +/- 0.023 (in 3 folds) au-PRC (weighted OvO): 0.872 +/- 0.028 (in 3 folds) au-PRC (macro OvO): 0.881 +/- 0.029 (in 3 folds) Accuracy: 0.723 +/- 0.038 (in 3 folds) MCC: 0.593 +/- 0.062 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.723 MCC: 0.589 Global evaluation column name: disease.separate_past_exposures Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.701 +/- 0.052 (in 3 folds) MCC: 0.568 +/- 0.071 (in 3 folds) Unknown/abstention proportion: 0.045 +/- 0.046 (in 2 folds) ROC-AUC (weighted OvO): 0.900 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.909 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.904 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.915 +/- 0.000 (in 1 folds) Global scores with abstention using column name 
disease.separate_past_exposures: Accuracy: 0.702 MCC: 0.563 Unknown/abstention proportion: 0.029 Abstention label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support  Covid19 0.90 0.73 0.81 63  HIV 0.86 0.77 0.81 98 Healthy/Background 0.70 0.78 0.74 221  Lupus 0.52 0.44 0.48 98  Unknown 0.00 0.00 0.00 0  accuracy 0.70 480  macro avg 0.60 0.54 0.57 480  weighted avg 0.73 0.70 0.71 480,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.879 +/- 0.022 (in 3 folds) ROC-AUC (macro OvO): 0.886 +/- 0.023 (in 3 folds) au-PRC (weighted OvO): 0.872 +/- 0.028 (in 3 folds) au-PRC (macro OvO): 0.881 +/- 0.029 (in 3 folds) Accuracy: 0.729 +/- 0.038 (in 3 folds) MCC: 0.609 +/- 0.061 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.730 MCC: 0.603 Global evaluation column name: disease.separate_past_exposures Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.708 +/- 0.051 (in 3 folds) MCC: 0.585 +/- 0.066 (in 3 folds) Unknown/abstention proportion: 0.045 +/- 0.046 (in 2 folds) ROC-AUC (weighted OvO): 0.900 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.909 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.904 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.915 +/- 0.000 (in 1 folds) Global scores with abstention using column name disease.separate_past_exposures: Accuracy: 0.708 MCC: 0.577 Unknown/abstention proportion: 0.029 Abstention label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support  Covid19 0.90 0.73 0.81 63  HIV 0.84 0.80 0.82 98 Healthy/Background 0.73 0.75 0.74 221  Lupus 0.53 0.51 0.52 98  Unknown 0.00 0.00 0.00 0  accuracy 0.71 480  macro avg 0.60 
0.56 0.58 480  weighted avg 0.73 0.71 0.72 480
,,,


xgboost,xgboost.decision_thresholds_tuned
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.870 +/- 0.026 (in 3 folds) ROC-AUC (macro OvO): 0.874 +/- 0.027 (in 3 folds) au-PRC (weighted OvO): 0.871 +/- 0.033 (in 3 folds) au-PRC (macro OvO): 0.880 +/- 0.034 (in 3 folds) Accuracy: 0.693 +/- 0.064 (in 3 folds) MCC: 0.547 +/- 0.103 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.693 MCC: 0.545 Global evaluation column name: disease.separate_past_exposures Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.672 +/- 0.069 (in 3 folds) MCC: 0.524 +/- 0.103 (in 3 folds) Unknown/abstention proportion: 0.045 +/- 0.046 (in 2 folds) ROC-AUC (weighted OvO): 0.892 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.897 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.905 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.915 +/- 0.000 (in 1 folds) Global scores with abstention using column name disease.separate_past_exposures: Accuracy: 0.673 MCC: 0.521 Unknown/abstention proportion: 0.029 Abstention label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support  Covid19 0.83 0.71 0.77 63  HIV 0.84 0.76 0.80 98 Healthy/Background 0.69 0.76 0.72 221  Lupus 0.45 0.38 0.41 98  Unknown 0.00 0.00 0.00 0  accuracy 0.67 480  macro avg 0.56 0.52 0.54 480  weighted avg 0.69 0.67 0.68 480,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.870 +/- 0.026 (in 3 folds) ROC-AUC (macro OvO): 0.874 +/- 0.027 (in 3 folds) au-PRC (weighted OvO): 0.871 +/- 0.033 (in 3 folds) au-PRC (macro OvO): 0.880 +/- 0.034 (in 3 folds) Accuracy: 0.718 +/- 0.039 (in 3 folds) MCC: 0.599 +/- 0.056 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.719 MCC: 0.591 Global evaluation column name: disease.separate_past_exposures 
Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.697 +/- 0.056 (in 3 folds) MCC: 0.576 +/- 0.066 (in 3 folds) Unknown/abstention proportion: 0.045 +/- 0.046 (in 2 folds) ROC-AUC (weighted OvO): 0.892 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.897 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.905 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.915 +/- 0.000 (in 1 folds) Global scores with abstention using column name disease.separate_past_exposures: Accuracy: 0.698 MCC: 0.567 Unknown/abstention proportion: 0.029 Abstention label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support  Covid19 0.82 0.78 0.80 63  HIV 0.80 0.83 0.81 98 Healthy/Background 0.75 0.73 0.74 221  Lupus 0.48 0.44 0.46 98  Unknown 0.00 0.00 0.00 0  accuracy 0.70 480  macro avg 0.57 0.56 0.56 480  weighted avg 0.72 0.70 0.71 480
,


---

# GeneLocus.BCR, TargetObsColumnEnum.disease_all_demographics_present trained on train_smaller set

## Specimen predictions on validation set

Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,Accuracy per fold with abstention,MCC per fold with abstention,Unknown/abstention proportion per fold with abstention,ROC-AUC (weighted OvO) per fold with abstention,ROC-AUC (macro OvO) per fold with abstention,au-PRC (weighted OvO) per fold with abstention,au-PRC (macro OvO) per fold with abstention,Accuracy global with abstention,MCC global with abstention,Unknown/abstention proportion global with abstention,Abstention label global with abstention,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
linearsvm_ovr,0.914 +/- 0.004 (in 3 folds),0.924 +/- 0.006 (in 3 folds),0.921 +/- 0.006 (in 3 folds),0.931 +/- 0.009 (in 3 folds),0.746 +/- 0.026 (in 3 folds),0.620 +/- 0.030 (in 3 folds),0.746,0.62,0.741 +/- 0.029 (in 3 folds),0.614 +/- 0.030 (in 3 folds),0.010 +/- 0.000 (in 2 folds),0.910 +/- 0.000 (in 1 folds),0.916 +/- 0.000 (in 1 folds),0.916 +/- 0.000 (in 1 folds),0.923 +/- 0.000 (in 1 folds),0.74,0.614,0.007,Unknown,283.0,2.0,285.0,0.007018,False
lasso_multiclass,0.911 +/- 0.014 (in 3 folds),0.921 +/- 0.013 (in 3 folds),0.920 +/- 0.014 (in 3 folds),0.930 +/- 0.014 (in 3 folds),0.738 +/- 0.028 (in 3 folds),0.622 +/- 0.043 (in 3 folds),0.738,0.618,0.730 +/- 0.028 (in 3 folds),0.613 +/- 0.042 (in 3 folds),0.011 +/- 0.000 (in 3 folds),,,,,0.73,0.609,0.011,Unknown,282.0,3.0,285.0,0.010526,False
ridge_cv,0.900 +/- 0.015 (in 3 folds),0.912 +/- 0.017 (in 3 folds),0.902 +/- 0.025 (in 3 folds),0.916 +/- 0.027 (in 3 folds),0.534 +/- 0.111 (in 3 folds),0.171 +/- 0.296 (in 3 folds),0.535,0.292,0.508 +/- 0.120 (in 3 folds),0.193 +/- 0.256 (in 3 folds),0.050 +/- 0.068 (in 3 folds),,,,,0.509,0.229,0.049,Unknown,271.0,14.0,285.0,0.049123,False
xgboost,0.890 +/- 0.015 (in 3 folds),0.894 +/- 0.021 (in 3 folds),0.899 +/- 0.017 (in 3 folds),0.907 +/- 0.024 (in 3 folds),0.728 +/- 0.016 (in 3 folds),0.593 +/- 0.040 (in 3 folds),0.728,0.592,0.712 +/- 0.006 (in 3 folds),0.574 +/- 0.022 (in 3 folds),0.031 +/- 0.015 (in 2 folds),0.874 +/- 0.000 (in 1 folds),0.870 +/- 0.000 (in 1 folds),0.880 +/- 0.000 (in 1 folds),0.880 +/- 0.000 (in 1 folds),0.712,0.573,0.021,Unknown,279.0,6.0,285.0,0.021053,False
lasso_cv,0.884 +/- 0.031 (in 3 folds),0.898 +/- 0.030 (in 3 folds),0.888 +/- 0.032 (in 3 folds),0.905 +/- 0.032 (in 3 folds),0.588 +/- 0.142 (in 3 folds),0.380 +/- 0.206 (in 3 folds),0.587,0.376,0.584 +/- 0.144 (in 3 folds),0.367 +/- 0.212 (in 3 folds),0.010 +/- 0.000 (in 2 folds),0.850 +/- 0.000 (in 1 folds),0.867 +/- 0.000 (in 1 folds),0.851 +/- 0.000 (in 1 folds),0.868 +/- 0.000 (in 1 folds),0.582,0.367,0.007,Unknown,283.0,2.0,285.0,0.007018,False
rf_multiclass,0.878 +/- 0.018 (in 3 folds),0.885 +/- 0.022 (in 3 folds),0.883 +/- 0.025 (in 3 folds),0.893 +/- 0.028 (in 3 folds),0.739 +/- 0.019 (in 3 folds),0.612 +/- 0.042 (in 3 folds),0.739,0.612,0.726 +/- 0.021 (in 3 folds),0.596 +/- 0.032 (in 3 folds),0.026 +/- 0.022 (in 2 folds),0.879 +/- 0.000 (in 1 folds),0.885 +/- 0.000 (in 1 folds),0.881 +/- 0.000 (in 1 folds),0.890 +/- 0.000 (in 1 folds),0.726,0.594,0.018,Unknown,280.0,5.0,285.0,0.017544,False
elasticnet_cv,0.878 +/- 0.013 (in 3 folds),0.891 +/- 0.009 (in 3 folds),0.896 +/- 0.015 (in 3 folds),0.911 +/- 0.012 (in 3 folds),0.610 +/- 0.143 (in 3 folds),0.422 +/- 0.212 (in 3 folds),0.611,0.431,0.601 +/- 0.150 (in 3 folds),0.391 +/- 0.247 (in 3 folds),0.026 +/- 0.022 (in 2 folds),0.865 +/- 0.000 (in 1 folds),0.883 +/- 0.000 (in 1 folds),0.879 +/- 0.000 (in 1 folds),0.897 +/- 0.000 (in 1 folds),0.6,0.405,0.018,Unknown,280.0,5.0,285.0,0.017544,False
dummy_stratified,0.549 +/- 0.026 (in 3 folds),0.547 +/- 0.016 (in 3 folds),0.533 +/- 0.013 (in 3 folds),0.534 +/- 0.009 (in 3 folds),0.414 +/- 0.059 (in 3 folds),0.110 +/- 0.066 (in 3 folds),0.41,0.105,0.393 +/- 0.023 (in 3 folds),0.104 +/- 0.055 (in 3 folds),0.129 +/- 0.000 (in 1 folds),0.535 +/- 0.012 (in 2 folds),0.540 +/- 0.013 (in 2 folds),0.526 +/- 0.006 (in 2 folds),0.529 +/- 0.007 (in 2 folds),0.393,0.102,0.042,Unknown,273.0,12.0,285.0,0.042105,False
dummy_most_frequent,0.500 +/- 0.000 (in 3 folds),0.500 +/- 0.000 (in 3 folds),0.500 +/- 0.000 (in 3 folds),0.500 +/- 0.000 (in 3 folds),0.474 +/- 0.043 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.472,0.0,0.442 +/- 0.013 (in 3 folds),0.035 +/- 0.020 (in 3 folds),0.064 +/- 0.060 (in 3 folds),,,,,0.442,0.029,0.063,Unknown,267.0,18.0,285.0,0.063158,True
"All results, sorted",,,,,,,,,,,,,,,,,,,,,,,,

Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,Accuracy per fold with abstention,MCC per fold with abstention,Unknown/abstention proportion per fold with abstention,ROC-AUC (weighted OvO) per fold with abstention,ROC-AUC (macro OvO) per fold with abstention,au-PRC (weighted OvO) per fold with abstention,au-PRC (macro OvO) per fold with abstention,Accuracy global with abstention,MCC global with abstention,Unknown/abstention proportion global with abstention,Abstention label global with abstention,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
linearsvm_ovr,0.914 +/- 0.004 (in 3 folds),0.924 +/- 0.006 (in 3 folds),0.921 +/- 0.006 (in 3 folds),0.931 +/- 0.009 (in 3 folds),0.746 +/- 0.026 (in 3 folds),0.620 +/- 0.030 (in 3 folds),0.746,0.62,0.741 +/- 0.029 (in 3 folds),0.614 +/- 0.030 (in 3 folds),0.010 +/- 0.000 (in 2 folds),0.910 +/- 0.000 (in 1 folds),0.916 +/- 0.000 (in 1 folds),0.916 +/- 0.000 (in 1 folds),0.923 +/- 0.000 (in 1 folds),0.74,0.614,0.007,Unknown,283,2,285,0.007018,False
lasso_multiclass,0.911 +/- 0.014 (in 3 folds),0.921 +/- 0.013 (in 3 folds),0.920 +/- 0.014 (in 3 folds),0.930 +/- 0.014 (in 3 folds),0.738 +/- 0.028 (in 3 folds),0.622 +/- 0.043 (in 3 folds),0.738,0.618,0.730 +/- 0.028 (in 3 folds),0.613 +/- 0.042 (in 3 folds),0.011 +/- 0.000 (in 3 folds),,,,,0.73,0.609,0.011,Unknown,282,3,285,0.010526,False
ridge_cv,0.900 +/- 0.015 (in 3 folds),0.912 +/- 0.017 (in 3 folds),0.902 +/- 0.025 (in 3 folds),0.916 +/- 0.027 (in 3 folds),0.534 +/- 0.111 (in 3 folds),0.171 +/- 0.296 (in 3 folds),0.535,0.292,0.508 +/- 0.120 (in 3 folds),0.193 +/- 0.256 (in 3 folds),0.050 +/- 0.068 (in 3 folds),,,,,0.509,0.229,0.049,Unknown,271,14,285,0.049123,False
xgboost,0.890 +/- 0.015 (in 3 folds),0.894 +/- 0.021 (in 3 folds),0.899 +/- 0.017 (in 3 folds),0.907 +/- 0.024 (in 3 folds),0.728 +/- 0.016 (in 3 folds),0.593 +/- 0.040 (in 3 folds),0.728,0.592,0.712 +/- 0.006 (in 3 folds),0.574 +/- 0.022 (in 3 folds),0.031 +/- 0.015 (in 2 folds),0.874 +/- 0.000 (in 1 folds),0.870 +/- 0.000 (in 1 folds),0.880 +/- 0.000 (in 1 folds),0.880 +/- 0.000 (in 1 folds),0.712,0.573,0.021,Unknown,279,6,285,0.021053,False
lasso_cv,0.884 +/- 0.031 (in 3 folds),0.898 +/- 0.030 (in 3 folds),0.888 +/- 0.032 (in 3 folds),0.905 +/- 0.032 (in 3 folds),0.588 +/- 0.142 (in 3 folds),0.380 +/- 0.206 (in 3 folds),0.587,0.376,0.584 +/- 0.144 (in 3 folds),0.367 +/- 0.212 (in 3 folds),0.010 +/- 0.000 (in 2 folds),0.850 +/- 0.000 (in 1 folds),0.867 +/- 0.000 (in 1 folds),0.851 +/- 0.000 (in 1 folds),0.868 +/- 0.000 (in 1 folds),0.582,0.367,0.007,Unknown,283,2,285,0.007018,False
rf_multiclass,0.878 +/- 0.018 (in 3 folds),0.885 +/- 0.022 (in 3 folds),0.883 +/- 0.025 (in 3 folds),0.893 +/- 0.028 (in 3 folds),0.739 +/- 0.019 (in 3 folds),0.612 +/- 0.042 (in 3 folds),0.739,0.612,0.726 +/- 0.021 (in 3 folds),0.596 +/- 0.032 (in 3 folds),0.026 +/- 0.022 (in 2 folds),0.879 +/- 0.000 (in 1 folds),0.885 +/- 0.000 (in 1 folds),0.881 +/- 0.000 (in 1 folds),0.890 +/- 0.000 (in 1 folds),0.726,0.594,0.018,Unknown,280,5,285,0.017544,False
elasticnet_cv,0.878 +/- 0.013 (in 3 folds),0.891 +/- 0.009 (in 3 folds),0.896 +/- 0.015 (in 3 folds),0.911 +/- 0.012 (in 3 folds),0.610 +/- 0.143 (in 3 folds),0.422 +/- 0.212 (in 3 folds),0.611,0.431,0.601 +/- 0.150 (in 3 folds),0.391 +/- 0.247 (in 3 folds),0.026 +/- 0.022 (in 2 folds),0.865 +/- 0.000 (in 1 folds),0.883 +/- 0.000 (in 1 folds),0.879 +/- 0.000 (in 1 folds),0.897 +/- 0.000 (in 1 folds),0.6,0.405,0.018,Unknown,280,5,285,0.017544,False
dummy_stratified,0.549 +/- 0.026 (in 3 folds),0.547 +/- 0.016 (in 3 folds),0.533 +/- 0.013 (in 3 folds),0.534 +/- 0.009 (in 3 folds),0.414 +/- 0.059 (in 3 folds),0.110 +/- 0.066 (in 3 folds),0.41,0.105,0.393 +/- 0.023 (in 3 folds),0.104 +/- 0.055 (in 3 folds),0.129 +/- 0.000 (in 1 folds),0.535 +/- 0.012 (in 2 folds),0.540 +/- 0.013 (in 2 folds),0.526 +/- 0.006 (in 2 folds),0.529 +/- 0.007 (in 2 folds),0.393,0.102,0.042,Unknown,273,12,285,0.042105,False
dummy_most_frequent,0.500 +/- 0.000 (in 3 folds),0.500 +/- 0.000 (in 3 folds),0.500 +/- 0.000 (in 3 folds),0.500 +/- 0.000 (in 3 folds),0.474 +/- 0.043 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.472,0.0,0.442 +/- 0.013 (in 3 folds),0.035 +/- 0.020 (in 3 folds),0.064 +/- 0.060 (in 3 folds),,,,,0.442,0.029,0.063,Unknown,267,18,285,0.063158,True


linearsvm_ovr,lasso_multiclass,ridge_cv,xgboost
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.914 +/- 0.004 (in 3 folds) ROC-AUC (macro OvO): 0.924 +/- 0.006 (in 3 folds) au-PRC (weighted OvO): 0.921 +/- 0.006 (in 3 folds) au-PRC (macro OvO): 0.931 +/- 0.009 (in 3 folds) Accuracy: 0.746 +/- 0.026 (in 3 folds) MCC: 0.620 +/- 0.030 (in 3 folds) Global scores without abstention: Accuracy: 0.746 MCC: 0.620 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.741 +/- 0.029 (in 3 folds) MCC: 0.614 +/- 0.030 (in 3 folds) Unknown/abstention proportion: 0.010 +/- 0.000 (in 2 folds) ROC-AUC (weighted OvO): 0.910 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.916 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.916 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.923 +/- 0.000 (in 1 folds) Global scores with abstention: Accuracy: 0.740 MCC: 0.614 Unknown/abstention proportion: 0.007 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  Covid19 0.95 0.64 0.76 33  HIV 0.81 0.85 0.83 55 Healthy/Background 0.74 0.83 0.78 132  Lupus 0.61 0.51 0.55 65  Unknown 0.00 0.00 0.00 0  accuracy 0.74 285  macro avg 0.62 0.57 0.59 285  weighted avg 0.75 0.74 0.74 285,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.911 +/- 0.014 (in 3 folds) ROC-AUC (macro OvO): 0.921 +/- 0.013 (in 3 folds) au-PRC (weighted OvO): 0.920 +/- 0.014 (in 3 folds) au-PRC (macro OvO): 0.930 +/- 0.014 (in 3 folds) Accuracy: 0.738 +/- 0.028 (in 3 folds) MCC: 0.622 +/- 0.043 (in 3 folds) Global scores without abstention: Accuracy: 0.738 MCC: 0.618 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.730 +/- 0.028 (in 3 folds) MCC: 0.613 +/- 0.042 (in 3 folds) Unknown/abstention proportion: 0.011 +/- 0.000 (in 3 folds) Global scores with abstention: Accuracy: 0.730 MCC: 0.609 Unknown/abstention proportion: 0.011 Abstention label: Unknown Global classification report with 
abstention:  precision recall f1-score support  Covid19 0.71 0.73 0.72 33  HIV 0.82 0.85 0.84 55 Healthy/Background 0.77 0.74 0.76 132  Lupus 0.61 0.60 0.60 65  Unknown 0.00 0.00 0.00 0  accuracy 0.73 285  macro avg 0.58 0.58 0.58 285  weighted avg 0.74 0.73 0.73 285,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.900 +/- 0.015 (in 3 folds) ROC-AUC (macro OvO): 0.912 +/- 0.017 (in 3 folds) au-PRC (weighted OvO): 0.902 +/- 0.025 (in 3 folds) au-PRC (macro OvO): 0.916 +/- 0.027 (in 3 folds) Accuracy: 0.534 +/- 0.111 (in 3 folds) MCC: 0.171 +/- 0.296 (in 3 folds) Global scores without abstention: Accuracy: 0.535 MCC: 0.292 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.508 +/- 0.120 (in 3 folds) MCC: 0.193 +/- 0.256 (in 3 folds) Unknown/abstention proportion: 0.050 +/- 0.068 (in 3 folds) Global scores with abstention: Accuracy: 0.509 MCC: 0.229 Unknown/abstention proportion: 0.049 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  Covid19 1.00 0.15 0.26 33  HIV 1.00 0.16 0.28 55 Healthy/Background 0.50 0.96 0.66 132  Lupus 1.00 0.06 0.12 65  Unknown 0.00 0.00 0.00 0  accuracy 0.51 285  macro avg 0.70 0.27 0.26 285  weighted avg 0.77 0.51 0.42 285,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.890 +/- 0.015 (in 3 folds) ROC-AUC (macro OvO): 0.894 +/- 0.021 (in 3 folds) au-PRC (weighted OvO): 0.899 +/- 0.017 (in 3 folds) au-PRC (macro OvO): 0.907 +/- 0.024 (in 3 folds) Accuracy: 0.728 +/- 0.016 (in 3 folds) MCC: 0.593 +/- 0.040 (in 3 folds) Global scores without abstention: Accuracy: 0.728 MCC: 0.592 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.712 +/- 0.006 (in 3 folds) MCC: 0.574 +/- 0.022 (in 3 folds) Unknown/abstention proportion: 0.031 +/- 0.015 (in 2 folds) ROC-AUC (weighted OvO): 0.874 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.870 +/- 0.000 (in 1 
folds) au-PRC (weighted OvO): 0.880 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.880 +/- 0.000 (in 1 folds) Global scores with abstention: Accuracy: 0.712 MCC: 0.573 Unknown/abstention proportion: 0.021 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  Covid19 0.92 0.70 0.79 33  HIV 0.80 0.75 0.77 55 Healthy/Background 0.72 0.82 0.76 132  Lupus 0.60 0.48 0.53 65  Unknown 0.00 0.00 0.00 0  accuracy 0.71 285  macro avg 0.61 0.55 0.57 285  weighted avg 0.73 0.71 0.72 285
,,,


lasso_cv,rf_multiclass,elasticnet_cv,dummy_stratified
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.884 +/- 0.031 (in 3 folds) ROC-AUC (macro OvO): 0.898 +/- 0.030 (in 3 folds) au-PRC (weighted OvO): 0.888 +/- 0.032 (in 3 folds) au-PRC (macro OvO): 0.905 +/- 0.032 (in 3 folds) Accuracy: 0.588 +/- 0.142 (in 3 folds) MCC: 0.380 +/- 0.206 (in 3 folds) Global scores without abstention: Accuracy: 0.587 MCC: 0.376 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.584 +/- 0.144 (in 3 folds) MCC: 0.367 +/- 0.212 (in 3 folds) Unknown/abstention proportion: 0.010 +/- 0.000 (in 2 folds) ROC-AUC (weighted OvO): 0.850 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.867 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.851 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.868 +/- 0.000 (in 1 folds) Global scores with abstention: Accuracy: 0.582 MCC: 0.367 Unknown/abstention proportion: 0.007 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  Covid19 1.00 0.24 0.39 33  HIV 0.96 0.40 0.56 55 Healthy/Background 0.53 0.95 0.68 132  Lupus 0.62 0.15 0.25 65  Unknown 0.00 0.00 0.00 0  accuracy 0.58 285  macro avg 0.62 0.35 0.38 285  weighted avg 0.69 0.58 0.53 285,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.878 +/- 0.018 (in 3 folds) ROC-AUC (macro OvO): 0.885 +/- 0.022 (in 3 folds) au-PRC (weighted OvO): 0.883 +/- 0.025 (in 3 folds) au-PRC (macro OvO): 0.893 +/- 0.028 (in 3 folds) Accuracy: 0.739 +/- 0.019 (in 3 folds) MCC: 0.612 +/- 0.042 (in 3 folds) Global scores without abstention: Accuracy: 0.739 MCC: 0.612 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.726 +/- 0.021 (in 3 folds) MCC: 0.596 +/- 0.032 (in 3 folds) Unknown/abstention proportion: 0.026 +/- 0.022 (in 2 folds) ROC-AUC (weighted OvO): 0.879 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.885 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.881 +/- 0.000 (in 1 folds) au-PRC 
(macro OvO): 0.890 +/- 0.000 (in 1 folds) Global scores with abstention: Accuracy: 0.726 MCC: 0.594 Unknown/abstention proportion: 0.018 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  Covid19 0.80 0.73 0.76 33  HIV 0.94 0.80 0.86 55 Healthy/Background 0.71 0.84 0.77 132  Lupus 0.61 0.43 0.50 65  Unknown 0.00 0.00 0.00 0  accuracy 0.73 285  macro avg 0.61 0.56 0.58 285  weighted avg 0.74 0.73 0.73 285,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.878 +/- 0.013 (in 3 folds) ROC-AUC (macro OvO): 0.891 +/- 0.009 (in 3 folds) au-PRC (weighted OvO): 0.896 +/- 0.015 (in 3 folds) au-PRC (macro OvO): 0.911 +/- 0.012 (in 3 folds) Accuracy: 0.610 +/- 0.143 (in 3 folds) MCC: 0.422 +/- 0.212 (in 3 folds) Global scores without abstention: Accuracy: 0.611 MCC: 0.431 Per-fold scores with abstention (note that abstentions not included in probability-based scores): ROC-AUC (weighted OvO): 0.865 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.883 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.879 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.897 +/- 0.000 (in 1 folds) Accuracy: 0.601 +/- 0.150 (in 3 folds) MCC: 0.391 +/- 0.247 (in 3 folds) Unknown/abstention proportion: 0.026 +/- 0.022 (in 2 folds) Global scores with abstention: Accuracy: 0.600 MCC: 0.405 Unknown/abstention proportion: 0.018 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  Covid19 0.92 0.33 0.49 33  HIV 0.92 0.44 0.59 55 Healthy/Background 0.54 0.95 0.69 132  Lupus 0.92 0.17 0.29 65  Unknown 0.00 0.00 0.00 0  accuracy 0.60 285  macro avg 0.66 0.38 0.41 285  weighted avg 0.75 0.60 0.56 285,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.549 +/- 0.026 (in 3 folds) ROC-AUC (macro OvO): 0.547 +/- 0.016 (in 3 folds) au-PRC (weighted OvO): 0.533 +/- 0.013 (in 3 folds) au-PRC (macro OvO): 0.534 +/- 0.009 (in 3 folds) Accuracy: 0.414 +/- 0.059 (in 3 folds) MCC: 0.110 +/- 0.066 
(in 3 folds) Global scores without abstention: Accuracy: 0.410 MCC: 0.105 Per-fold scores with abstention (note that abstentions not included in probability-based scores): ROC-AUC (weighted OvO): 0.535 +/- 0.012 (in 2 folds) ROC-AUC (macro OvO): 0.540 +/- 0.013 (in 2 folds) au-PRC (weighted OvO): 0.526 +/- 0.006 (in 2 folds) au-PRC (macro OvO): 0.529 +/- 0.007 (in 2 folds) Accuracy: 0.393 +/- 0.023 (in 3 folds) MCC: 0.104 +/- 0.055 (in 3 folds) Unknown/abstention proportion: 0.129 +/- 0.000 (in 1 folds) Global scores with abstention: Accuracy: 0.393 MCC: 0.102 Unknown/abstention proportion: 0.042 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  Covid19 0.23 0.15 0.18 33  HIV 0.30 0.35 0.32 55 Healthy/Background 0.52 0.59 0.56 132  Lupus 0.26 0.15 0.19 65  Unknown 0.00 0.00 0.00 0  accuracy 0.39 285  macro avg 0.26 0.25 0.25 285  weighted avg 0.39 0.39 0.38 285
,,,


dummy_most_frequent
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.500 +/- 0.000 (in 3 folds) ROC-AUC (macro OvO): 0.500 +/- 0.000 (in 3 folds) au-PRC (weighted OvO): 0.500 +/- 0.000 (in 3 folds) au-PRC (macro OvO): 0.500 +/- 0.000 (in 3 folds) Accuracy: 0.474 +/- 0.043 (in 3 folds) MCC: 0.000 +/- 0.000 (in 3 folds) Global scores without abstention: Accuracy: 0.472 MCC: 0.000 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.442 +/- 0.013 (in 3 folds) MCC: 0.035 +/- 0.020 (in 3 folds) Unknown/abstention proportion: 0.064 +/- 0.060 (in 3 folds) Global scores with abstention: Accuracy: 0.442 MCC: 0.029 Unknown/abstention proportion: 0.063 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  Covid19 0.00 0.00 0.00 33  HIV 0.00 0.00 0.00 55 Healthy/Background 0.47 0.95 0.63 132  Lupus 0.00 0.00 0.00 65  Unknown 0.00 0.00 0.00 0  accuracy 0.44 285  macro avg 0.09 0.19 0.13 285  weighted avg 0.22 0.44 0.29 285


## Apply train-smaller model -- Test set performance - With and without tuning on validation set

Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,Global evaluation column name global,Accuracy per fold with abstention,MCC per fold with abstention,Unknown/abstention proportion per fold with abstention,Accuracy global with abstention,MCC global with abstention,Unknown/abstention proportion global with abstention,Abstention label global with abstention,Global evaluation column name global with abstention,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes,ROC-AUC (weighted OvO) per fold with abstention,ROC-AUC (macro OvO) per fold with abstention,au-PRC (weighted OvO) per fold with abstention,au-PRC (macro OvO) per fold with abstention
lasso_multiclass,0.920 +/- 0.020 (in 3 folds),0.927 +/- 0.022 (in 3 folds),0.924 +/- 0.014 (in 3 folds),0.932 +/- 0.015 (in 3 folds),0.730 +/- 0.051 (in 3 folds),0.611 +/- 0.069 (in 3 folds),0.729,0.609,disease.separate_past_exposures,0.719 +/- 0.046 (in 3 folds),0.599 +/- 0.063 (in 3 folds),0.014 +/- 0.007 (in 3 folds),0.719,0.597,0.014,Unknown,disease.separate_past_exposures,414.0,6.0,420.0,0.014286,False,,,,
lasso_multiclass.decision_thresholds_tuned,0.920 +/- 0.020 (in 3 folds),0.927 +/- 0.022 (in 3 folds),0.924 +/- 0.014 (in 3 folds),0.932 +/- 0.015 (in 3 folds),0.698 +/- 0.066 (in 3 folds),0.596 +/- 0.069 (in 3 folds),0.698,0.573,disease.separate_past_exposures,0.688 +/- 0.066 (in 3 folds),0.583 +/- 0.072 (in 3 folds),0.014 +/- 0.007 (in 3 folds),0.688,0.56,0.014,Unknown,disease.separate_past_exposures,414.0,6.0,420.0,0.014286,False,,,,
linearsvm_ovr,0.915 +/- 0.017 (in 3 folds),0.923 +/- 0.019 (in 3 folds),0.921 +/- 0.013 (in 3 folds),0.930 +/- 0.014 (in 3 folds),0.733 +/- 0.029 (in 3 folds),0.605 +/- 0.038 (in 3 folds),0.733,0.602,disease.separate_past_exposures,0.724 +/- 0.023 (in 3 folds),0.595 +/- 0.033 (in 3 folds),0.018 +/- 0.005 (in 2 folds),0.724,0.592,0.012,Unknown,disease.separate_past_exposures,415.0,5.0,420.0,0.011905,False,0.915 +/- 0.000 (in 1 folds),0.924 +/- 0.000 (in 1 folds),0.926 +/- 0.000 (in 1 folds),0.935 +/- 0.000 (in 1 folds)
linearsvm_ovr.decision_thresholds_tuned,0.915 +/- 0.017 (in 3 folds),0.923 +/- 0.019 (in 3 folds),0.921 +/- 0.013 (in 3 folds),0.930 +/- 0.014 (in 3 folds),0.670 +/- 0.053 (in 3 folds),0.559 +/- 0.057 (in 3 folds),0.67,0.527,disease.separate_past_exposures,0.662 +/- 0.052 (in 3 folds),0.548 +/- 0.054 (in 3 folds),0.018 +/- 0.005 (in 2 folds),0.662,0.518,0.012,Unknown,disease.separate_past_exposures,415.0,5.0,420.0,0.011905,False,0.915 +/- 0.000 (in 1 folds),0.924 +/- 0.000 (in 1 folds),0.926 +/- 0.000 (in 1 folds),0.935 +/- 0.000 (in 1 folds)
ridge_cv,0.914 +/- 0.031 (in 3 folds),0.923 +/- 0.031 (in 3 folds),0.924 +/- 0.015 (in 3 folds),0.933 +/- 0.015 (in 3 folds),0.527 +/- 0.160 (in 3 folds),0.192 +/- 0.333 (in 3 folds),0.531,0.302,disease.separate_past_exposures,0.502 +/- 0.174 (in 3 folds),0.176 +/- 0.332 (in 3 folds),0.055 +/- 0.065 (in 3 folds),0.502,0.229,0.055,Unknown,disease.separate_past_exposures,397.0,23.0,420.0,0.054762,False,,,,
ridge_cv.decision_thresholds_tuned,0.914 +/- 0.031 (in 3 folds),0.923 +/- 0.031 (in 3 folds),0.924 +/- 0.015 (in 3 folds),0.933 +/- 0.015 (in 3 folds),0.424 +/- 0.341 (in 3 folds),0.218 +/- 0.378 (in 3 folds),0.423,0.197,disease.separate_past_exposures,0.401 +/- 0.335 (in 3 folds),0.207 +/- 0.373 (in 3 folds),0.055 +/- 0.065 (in 3 folds),0.4,0.182,0.055,Unknown,disease.separate_past_exposures,397.0,23.0,420.0,0.054762,False,,,,
elasticnet_cv,0.907 +/- 0.015 (in 3 folds),0.915 +/- 0.016 (in 3 folds),0.914 +/- 0.009 (in 3 folds),0.925 +/- 0.008 (in 3 folds),0.637 +/- 0.132 (in 3 folds),0.432 +/- 0.294 (in 3 folds),0.638,0.481,disease.separate_past_exposures,0.629 +/- 0.141 (in 3 folds),0.425 +/- 0.301 (in 3 folds),0.021 +/- 0.020 (in 2 folds),0.629,0.467,0.014,Unknown,disease.separate_past_exposures,414.0,6.0,420.0,0.014286,False,0.921 +/- 0.000 (in 1 folds),0.930 +/- 0.000 (in 1 folds),0.919 +/- 0.000 (in 1 folds),0.930 +/- 0.000 (in 1 folds)
elasticnet_cv.decision_thresholds_tuned,0.907 +/- 0.015 (in 3 folds),0.915 +/- 0.016 (in 3 folds),0.914 +/- 0.009 (in 3 folds),0.925 +/- 0.008 (in 3 folds),0.727 +/- 0.036 (in 3 folds),0.609 +/- 0.065 (in 3 folds),0.727,0.594,disease.separate_past_exposures,0.717 +/- 0.042 (in 3 folds),0.597 +/- 0.075 (in 3 folds),0.021 +/- 0.020 (in 2 folds),0.717,0.582,0.014,Unknown,disease.separate_past_exposures,414.0,6.0,420.0,0.014286,False,0.921 +/- 0.000 (in 1 folds),0.930 +/- 0.000 (in 1 folds),0.919 +/- 0.000 (in 1 folds),0.930 +/- 0.000 (in 1 folds)
xgboost,0.904 +/- 0.005 (in 3 folds),0.910 +/- 0.007 (in 3 folds),0.910 +/- 0.003 (in 3 folds),0.920 +/- 0.003 (in 3 folds),0.756 +/- 0.019 (in 3 folds),0.642 +/- 0.029 (in 3 folds),0.757,0.64,disease.separate_past_exposures,0.733 +/- 0.036 (in 3 folds),0.616 +/- 0.052 (in 3 folds),0.046 +/- 0.015 (in 2 folds),0.733,0.611,0.031,Unknown,disease.separate_past_exposures,407.0,13.0,420.0,0.030952,False,0.903 +/- 0.000 (in 1 folds),0.910 +/- 0.000 (in 1 folds),0.914 +/- 0.000 (in 1 folds),0.923 +/- 0.000 (in 1 folds)
xgboost.decision_thresholds_tuned,0.904 +/- 0.005 (in 3 folds),0.910 +/- 0.007 (in 3 folds),0.910 +/- 0.003 (in 3 folds),0.920 +/- 0.003 (in 3 folds),0.737 +/- 0.024 (in 3 folds),0.613 +/- 0.029 (in 3 folds),0.737,0.613,disease.separate_past_exposures,0.714 +/- 0.031 (in 3 folds),0.585 +/- 0.047 (in 3 folds),0.046 +/- 0.015 (in 2 folds),0.714,0.586,0.031,Unknown,disease.separate_past_exposures,407.0,13.0,420.0,0.030952,False,0.903 +/- 0.000 (in 1 folds),0.910 +/- 0.000 (in 1 folds),0.914 +/- 0.000 (in 1 folds),0.923 +/- 0.000 (in 1 folds)

Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,Global evaluation column name global,Accuracy per fold with abstention,MCC per fold with abstention,Unknown/abstention proportion per fold with abstention,Accuracy global with abstention,MCC global with abstention,Unknown/abstention proportion global with abstention,Abstention label global with abstention,Global evaluation column name global with abstention,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes,ROC-AUC (weighted OvO) per fold with abstention,ROC-AUC (macro OvO) per fold with abstention,au-PRC (weighted OvO) per fold with abstention,au-PRC (macro OvO) per fold with abstention
lasso_multiclass,0.920 +/- 0.020 (in 3 folds),0.927 +/- 0.022 (in 3 folds),0.924 +/- 0.014 (in 3 folds),0.932 +/- 0.015 (in 3 folds),0.730 +/- 0.051 (in 3 folds),0.611 +/- 0.069 (in 3 folds),0.729,0.609,disease.separate_past_exposures,0.719 +/- 0.046 (in 3 folds),0.599 +/- 0.063 (in 3 folds),0.014 +/- 0.007 (in 3 folds),0.719,0.597,0.014,Unknown,disease.separate_past_exposures,414,6,420,0.014286,False,,,,
lasso_multiclass.decision_thresholds_tuned,0.920 +/- 0.020 (in 3 folds),0.927 +/- 0.022 (in 3 folds),0.924 +/- 0.014 (in 3 folds),0.932 +/- 0.015 (in 3 folds),0.698 +/- 0.066 (in 3 folds),0.596 +/- 0.069 (in 3 folds),0.698,0.573,disease.separate_past_exposures,0.688 +/- 0.066 (in 3 folds),0.583 +/- 0.072 (in 3 folds),0.014 +/- 0.007 (in 3 folds),0.688,0.56,0.014,Unknown,disease.separate_past_exposures,414,6,420,0.014286,False,,,,
linearsvm_ovr,0.915 +/- 0.017 (in 3 folds),0.923 +/- 0.019 (in 3 folds),0.921 +/- 0.013 (in 3 folds),0.930 +/- 0.014 (in 3 folds),0.733 +/- 0.029 (in 3 folds),0.605 +/- 0.038 (in 3 folds),0.733,0.602,disease.separate_past_exposures,0.724 +/- 0.023 (in 3 folds),0.595 +/- 0.033 (in 3 folds),0.018 +/- 0.005 (in 2 folds),0.724,0.592,0.012,Unknown,disease.separate_past_exposures,415,5,420,0.011905,False,0.915 +/- 0.000 (in 1 folds),0.924 +/- 0.000 (in 1 folds),0.926 +/- 0.000 (in 1 folds),0.935 +/- 0.000 (in 1 folds)
linearsvm_ovr.decision_thresholds_tuned,0.915 +/- 0.017 (in 3 folds),0.923 +/- 0.019 (in 3 folds),0.921 +/- 0.013 (in 3 folds),0.930 +/- 0.014 (in 3 folds),0.670 +/- 0.053 (in 3 folds),0.559 +/- 0.057 (in 3 folds),0.67,0.527,disease.separate_past_exposures,0.662 +/- 0.052 (in 3 folds),0.548 +/- 0.054 (in 3 folds),0.018 +/- 0.005 (in 2 folds),0.662,0.518,0.012,Unknown,disease.separate_past_exposures,415,5,420,0.011905,False,0.915 +/- 0.000 (in 1 folds),0.924 +/- 0.000 (in 1 folds),0.926 +/- 0.000 (in 1 folds),0.935 +/- 0.000 (in 1 folds)
ridge_cv,0.914 +/- 0.031 (in 3 folds),0.923 +/- 0.031 (in 3 folds),0.924 +/- 0.015 (in 3 folds),0.933 +/- 0.015 (in 3 folds),0.527 +/- 0.160 (in 3 folds),0.192 +/- 0.333 (in 3 folds),0.531,0.302,disease.separate_past_exposures,0.502 +/- 0.174 (in 3 folds),0.176 +/- 0.332 (in 3 folds),0.055 +/- 0.065 (in 3 folds),0.502,0.229,0.055,Unknown,disease.separate_past_exposures,397,23,420,0.054762,False,,,,
ridge_cv.decision_thresholds_tuned,0.914 +/- 0.031 (in 3 folds),0.923 +/- 0.031 (in 3 folds),0.924 +/- 0.015 (in 3 folds),0.933 +/- 0.015 (in 3 folds),0.424 +/- 0.341 (in 3 folds),0.218 +/- 0.378 (in 3 folds),0.423,0.197,disease.separate_past_exposures,0.401 +/- 0.335 (in 3 folds),0.207 +/- 0.373 (in 3 folds),0.055 +/- 0.065 (in 3 folds),0.4,0.182,0.055,Unknown,disease.separate_past_exposures,397,23,420,0.054762,False,,,,
elasticnet_cv,0.907 +/- 0.015 (in 3 folds),0.915 +/- 0.016 (in 3 folds),0.914 +/- 0.009 (in 3 folds),0.925 +/- 0.008 (in 3 folds),0.637 +/- 0.132 (in 3 folds),0.432 +/- 0.294 (in 3 folds),0.638,0.481,disease.separate_past_exposures,0.629 +/- 0.141 (in 3 folds),0.425 +/- 0.301 (in 3 folds),0.021 +/- 0.020 (in 2 folds),0.629,0.467,0.014,Unknown,disease.separate_past_exposures,414,6,420,0.014286,False,0.921 +/- 0.000 (in 1 folds),0.930 +/- 0.000 (in 1 folds),0.919 +/- 0.000 (in 1 folds),0.930 +/- 0.000 (in 1 folds)
elasticnet_cv.decision_thresholds_tuned,0.907 +/- 0.015 (in 3 folds),0.915 +/- 0.016 (in 3 folds),0.914 +/- 0.009 (in 3 folds),0.925 +/- 0.008 (in 3 folds),0.727 +/- 0.036 (in 3 folds),0.609 +/- 0.065 (in 3 folds),0.727,0.594,disease.separate_past_exposures,0.717 +/- 0.042 (in 3 folds),0.597 +/- 0.075 (in 3 folds),0.021 +/- 0.020 (in 2 folds),0.717,0.582,0.014,Unknown,disease.separate_past_exposures,414,6,420,0.014286,False,0.921 +/- 0.000 (in 1 folds),0.930 +/- 0.000 (in 1 folds),0.919 +/- 0.000 (in 1 folds),0.930 +/- 0.000 (in 1 folds)
xgboost,0.904 +/- 0.005 (in 3 folds),0.910 +/- 0.007 (in 3 folds),0.910 +/- 0.003 (in 3 folds),0.920 +/- 0.003 (in 3 folds),0.756 +/- 0.019 (in 3 folds),0.642 +/- 0.029 (in 3 folds),0.757,0.64,disease.separate_past_exposures,0.733 +/- 0.036 (in 3 folds),0.616 +/- 0.052 (in 3 folds),0.046 +/- 0.015 (in 2 folds),0.733,0.611,0.031,Unknown,disease.separate_past_exposures,407,13,420,0.030952,False,0.903 +/- 0.000 (in 1 folds),0.910 +/- 0.000 (in 1 folds),0.914 +/- 0.000 (in 1 folds),0.923 +/- 0.000 (in 1 folds)
xgboost.decision_thresholds_tuned,0.904 +/- 0.005 (in 3 folds),0.910 +/- 0.007 (in 3 folds),0.910 +/- 0.003 (in 3 folds),0.920 +/- 0.003 (in 3 folds),0.737 +/- 0.024 (in 3 folds),0.613 +/- 0.029 (in 3 folds),0.737,0.613,disease.separate_past_exposures,0.714 +/- 0.031 (in 3 folds),0.585 +/- 0.047 (in 3 folds),0.046 +/- 0.015 (in 2 folds),0.714,0.586,0.031,Unknown,disease.separate_past_exposures,407,13,420,0.030952,False,0.903 +/- 0.000 (in 1 folds),0.910 +/- 0.000 (in 1 folds),0.914 +/- 0.000 (in 1 folds),0.923 +/- 0.000 (in 1 folds)


lasso_multiclass,lasso_multiclass.decision_thresholds_tuned,linearsvm_ovr,linearsvm_ovr.decision_thresholds_tuned
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.920 +/- 0.020 (in 3 folds) ROC-AUC (macro OvO): 0.927 +/- 0.022 (in 3 folds) au-PRC (weighted OvO): 0.924 +/- 0.014 (in 3 folds) au-PRC (macro OvO): 0.932 +/- 0.015 (in 3 folds) Accuracy: 0.730 +/- 0.051 (in 3 folds) MCC: 0.611 +/- 0.069 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.729 MCC: 0.609 Global evaluation column name: disease.separate_past_exposures Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.719 +/- 0.046 (in 3 folds) MCC: 0.599 +/- 0.063 (in 3 folds) Unknown/abstention proportion: 0.014 +/- 0.007 (in 3 folds) Global scores with abstention using column name disease.separate_past_exposures: Accuracy: 0.719 MCC: 0.597 Unknown/abstention proportion: 0.014 Abstention label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support  Covid19 0.62 0.79 0.69 47  HIV 0.91 0.83 0.87 87 Healthy/Background 0.78 0.76 0.77 191  Lupus 0.53 0.51 0.52 95  Unknown 0.00 0.00 0.00 0  accuracy 0.72 420  macro avg 0.57 0.58 0.57 420  weighted avg 0.73 0.72 0.73 420,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.920 +/- 0.020 (in 3 folds) ROC-AUC (macro OvO): 0.927 +/- 0.022 (in 3 folds) au-PRC (weighted OvO): 0.924 +/- 0.014 (in 3 folds) au-PRC (macro OvO): 0.932 +/- 0.015 (in 3 folds) Accuracy: 0.698 +/- 0.066 (in 3 folds) MCC: 0.596 +/- 0.069 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.698 MCC: 0.573 Global evaluation column name: disease.separate_past_exposures Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.688 +/- 0.066 (in 3 folds) MCC: 0.583 +/- 0.072 (in 3 folds) Unknown/abstention proportion: 0.014 
+/- 0.007 (in 3 folds) Global scores with abstention using column name disease.separate_past_exposures: Accuracy: 0.688 MCC: 0.560 Unknown/abstention proportion: 0.014 Abstention label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support  Covid19 0.81 0.74 0.78 47  HIV 0.92 0.76 0.83 87 Healthy/Background 0.77 0.68 0.72 191  Lupus 0.45 0.62 0.52 95  Unknown 0.00 0.00 0.00 0  accuracy 0.69 420  macro avg 0.59 0.56 0.57 420  weighted avg 0.73 0.69 0.70 420,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.915 +/- 0.017 (in 3 folds) ROC-AUC (macro OvO): 0.923 +/- 0.019 (in 3 folds) au-PRC (weighted OvO): 0.921 +/- 0.013 (in 3 folds) au-PRC (macro OvO): 0.930 +/- 0.014 (in 3 folds) Accuracy: 0.733 +/- 0.029 (in 3 folds) MCC: 0.605 +/- 0.038 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.733 MCC: 0.602 Global evaluation column name: disease.separate_past_exposures Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.724 +/- 0.023 (in 3 folds) MCC: 0.595 +/- 0.033 (in 3 folds) Unknown/abstention proportion: 0.018 +/- 0.005 (in 2 folds) ROC-AUC (weighted OvO): 0.915 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.924 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.926 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.935 +/- 0.000 (in 1 folds) Global scores with abstention using column name disease.separate_past_exposures: Accuracy: 0.724 MCC: 0.592 Unknown/abstention proportion: 0.012 Abstention label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support  Covid19 0.92 0.72 0.81 47  HIV 0.89 0.82 0.85 87 Healthy/Background 0.72 0.82 0.77 191  Lupus 0.53 
0.44 0.48 95  Unknown 0.00 0.00 0.00 0  accuracy 0.72 420  macro avg 0.61 0.56 0.58 420  weighted avg 0.73 0.72 0.72 420,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.915 +/- 0.017 (in 3 folds) ROC-AUC (macro OvO): 0.923 +/- 0.019 (in 3 folds) au-PRC (weighted OvO): 0.921 +/- 0.013 (in 3 folds) au-PRC (macro OvO): 0.930 +/- 0.014 (in 3 folds) Accuracy: 0.670 +/- 0.053 (in 3 folds) MCC: 0.559 +/- 0.057 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.670 MCC: 0.527 Global evaluation column name: disease.separate_past_exposures Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.662 +/- 0.052 (in 3 folds) MCC: 0.548 +/- 0.054 (in 3 folds) Unknown/abstention proportion: 0.018 +/- 0.005 (in 2 folds) ROC-AUC (weighted OvO): 0.915 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.924 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.926 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.935 +/- 0.000 (in 1 folds) Global scores with abstention using column name disease.separate_past_exposures: Accuracy: 0.662 MCC: 0.518 Unknown/abstention proportion: 0.012 Abstention label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support  Covid19 0.89 0.68 0.77 47  HIV 0.90 0.72 0.80 87 Healthy/Background 0.73 0.67 0.70 191  Lupus 0.41 0.58 0.48 95  Unknown 0.00 0.00 0.00 0  accuracy 0.66 420  macro avg 0.59 0.53 0.55 420  weighted avg 0.71 0.66 0.68 420
,,,


ridge_cv,ridge_cv.decision_thresholds_tuned,elasticnet_cv,elasticnet_cv.decision_thresholds_tuned
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.914 +/- 0.031 (in 3 folds) ROC-AUC (macro OvO): 0.923 +/- 0.031 (in 3 folds) au-PRC (weighted OvO): 0.924 +/- 0.015 (in 3 folds) au-PRC (macro OvO): 0.933 +/- 0.015 (in 3 folds) Accuracy: 0.527 +/- 0.160 (in 3 folds) MCC: 0.192 +/- 0.333 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.531 MCC: 0.302 Global evaluation column name: disease.separate_past_exposures Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.502 +/- 0.174 (in 3 folds) MCC: 0.176 +/- 0.332 (in 3 folds) Unknown/abstention proportion: 0.055 +/- 0.065 (in 3 folds) Global scores with abstention using column name disease.separate_past_exposures: Accuracy: 0.502 MCC: 0.229 Unknown/abstention proportion: 0.055 Abstention label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support  Covid19 1.00 0.13 0.23 47  HIV 1.00 0.24 0.39 87 Healthy/Background 0.49 0.95 0.65 191  Lupus 0.75 0.03 0.06 95  Unknown 0.00 0.00 0.00 0  accuracy 0.50 420  macro avg 0.65 0.27 0.27 420  weighted avg 0.71 0.50 0.42 420,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.914 +/- 0.031 (in 3 folds) ROC-AUC (macro OvO): 0.923 +/- 0.031 (in 3 folds) au-PRC (weighted OvO): 0.924 +/- 0.015 (in 3 folds) au-PRC (macro OvO): 0.933 +/- 0.015 (in 3 folds) Accuracy: 0.424 +/- 0.341 (in 3 folds) MCC: 0.218 +/- 0.378 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.423 MCC: 0.197 Global evaluation column name: disease.separate_past_exposures Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.401 +/- 0.335 (in 3 folds) MCC: 0.207 +/- 0.373 (in 3 folds) Unknown/abstention proportion: 0.055 
+/- 0.065 (in 3 folds) Global scores with abstention using column name disease.separate_past_exposures: Accuracy: 0.400 MCC: 0.182 Unknown/abstention proportion: 0.055 Abstention label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support  Covid19 0.15 0.49 0.23 47  HIV 0.89 0.29 0.43 87 Healthy/Background 0.54 0.57 0.55 191  Lupus 0.63 0.13 0.21 95  Unknown 0.00 0.00 0.00 0  accuracy 0.40 420  macro avg 0.44 0.29 0.29 420  weighted avg 0.59 0.40 0.42 420,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.907 +/- 0.015 (in 3 folds) ROC-AUC (macro OvO): 0.915 +/- 0.016 (in 3 folds) au-PRC (weighted OvO): 0.914 +/- 0.009 (in 3 folds) au-PRC (macro OvO): 0.925 +/- 0.008 (in 3 folds) Accuracy: 0.637 +/- 0.132 (in 3 folds) MCC: 0.432 +/- 0.294 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.638 MCC: 0.481 Global evaluation column name: disease.separate_past_exposures Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.629 +/- 0.141 (in 3 folds) MCC: 0.425 +/- 0.301 (in 3 folds) Unknown/abstention proportion: 0.021 +/- 0.020 (in 2 folds) ROC-AUC (weighted OvO): 0.921 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.930 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.919 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.930 +/- 0.000 (in 1 folds) Global scores with abstention using column name disease.separate_past_exposures: Accuracy: 0.629 MCC: 0.467 Unknown/abstention proportion: 0.014 Abstention label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support  Covid19 1.00 0.38 0.55 47  HIV 0.96 0.52 0.67 87 Healthy/Background 0.56 0.98 0.72 191  Lupus 0.82 
0.15 0.25 95  Unknown 0.00 0.00 0.00 0  accuracy 0.63 420  macro avg 0.67 0.41 0.44 420  weighted avg 0.75 0.63 0.58 420,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.907 +/- 0.015 (in 3 folds) ROC-AUC (macro OvO): 0.915 +/- 0.016 (in 3 folds) au-PRC (weighted OvO): 0.914 +/- 0.009 (in 3 folds) au-PRC (macro OvO): 0.925 +/- 0.008 (in 3 folds) Accuracy: 0.727 +/- 0.036 (in 3 folds) MCC: 0.609 +/- 0.065 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.727 MCC: 0.594 Global evaluation column name: disease.separate_past_exposures Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.717 +/- 0.042 (in 3 folds) MCC: 0.597 +/- 0.075 (in 3 folds) Unknown/abstention proportion: 0.021 +/- 0.020 (in 2 folds) ROC-AUC (weighted OvO): 0.921 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.930 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.919 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.930 +/- 0.000 (in 1 folds) Global scores with abstention using column name disease.separate_past_exposures: Accuracy: 0.717 MCC: 0.582 Unknown/abstention proportion: 0.014 Abstention label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support  Covid19 0.95 0.74 0.83 47  HIV 0.78 0.76 0.77 87 Healthy/Background 0.69 0.85 0.76 191  Lupus 0.66 0.39 0.49 95  Unknown 0.00 0.00 0.00 0  accuracy 0.72 420  macro avg 0.61 0.55 0.57 420  weighted avg 0.73 0.72 0.71 420
,,,


xgboost,xgboost.decision_thresholds_tuned,rf_multiclass,rf_multiclass.decision_thresholds_tuned
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.904 +/- 0.005 (in 3 folds) ROC-AUC (macro OvO): 0.910 +/- 0.007 (in 3 folds) au-PRC (weighted OvO): 0.910 +/- 0.003 (in 3 folds) au-PRC (macro OvO): 0.920 +/- 0.003 (in 3 folds) Accuracy: 0.756 +/- 0.019 (in 3 folds) MCC: 0.642 +/- 0.029 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.757 MCC: 0.640 Global evaluation column name: disease.separate_past_exposures Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.733 +/- 0.036 (in 3 folds) MCC: 0.616 +/- 0.052 (in 3 folds) Unknown/abstention proportion: 0.046 +/- 0.015 (in 2 folds) ROC-AUC (weighted OvO): 0.903 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.910 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.914 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.923 +/- 0.000 (in 1 folds) Global scores with abstention using column name disease.separate_past_exposures: Accuracy: 0.733 MCC: 0.611 Unknown/abstention proportion: 0.031 Abstention label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support  Covid19 0.86 0.77 0.81 47  HIV 0.89 0.80 0.84 87 Healthy/Background 0.73 0.81 0.77 191  Lupus 0.63 0.51 0.56 95  Unknown 0.00 0.00 0.00 0  accuracy 0.73 420  macro avg 0.62 0.58 0.60 420  weighted avg 0.76 0.73 0.74 420,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.904 +/- 0.005 (in 3 folds) ROC-AUC (macro OvO): 0.910 +/- 0.007 (in 3 folds) au-PRC (weighted OvO): 0.910 +/- 0.003 (in 3 folds) au-PRC (macro OvO): 0.920 +/- 0.003 (in 3 folds) Accuracy: 0.737 +/- 0.024 (in 3 folds) MCC: 0.613 +/- 0.029 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.737 MCC: 0.613 Global evaluation column name: disease.separate_past_exposures 
Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.714 +/- 0.031 (in 3 folds) MCC: 0.585 +/- 0.047 (in 3 folds) Unknown/abstention proportion: 0.046 +/- 0.015 (in 2 folds) ROC-AUC (weighted OvO): 0.903 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.910 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.914 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.923 +/- 0.000 (in 1 folds) Global scores with abstention using column name disease.separate_past_exposures: Accuracy: 0.714 MCC: 0.586 Unknown/abstention proportion: 0.031 Abstention label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support  Covid19 0.80 0.77 0.78 47  HIV 0.79 0.82 0.80 87 Healthy/Background 0.72 0.79 0.75 191  Lupus 0.68 0.44 0.54 95  Unknown 0.00 0.00 0.00 0  accuracy 0.71 420  macro avg 0.60 0.56 0.57 420  weighted avg 0.73 0.71 0.72 420,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.895 +/- 0.006 (in 3 folds) ROC-AUC (macro OvO): 0.903 +/- 0.006 (in 3 folds) au-PRC (weighted OvO): 0.891 +/- 0.006 (in 3 folds) au-PRC (macro OvO): 0.903 +/- 0.004 (in 3 folds) Accuracy: 0.740 +/- 0.017 (in 3 folds) MCC: 0.621 +/- 0.020 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.740 MCC: 0.616 Global evaluation column name: disease.separate_past_exposures Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.726 +/- 0.021 (in 3 folds) MCC: 0.606 +/- 0.031 (in 3 folds) Unknown/abstention proportion: 0.028 +/- 0.010 (in 2 folds) ROC-AUC (weighted OvO): 0.902 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.911 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.895 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.907 +/- 0.000 (in 1 folds) Global scores with abstention using column name 
disease.separate_past_exposures: Accuracy: 0.726 MCC: 0.600 Unknown/abstention proportion: 0.019 Abstention label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support  Covid19 0.74 0.79 0.76 47  HIV 0.89 0.83 0.86 87 Healthy/Background 0.73 0.83 0.77 191  Lupus 0.59 0.40 0.48 95  Unknown 0.00 0.00 0.00 0  accuracy 0.73 420  macro avg 0.59 0.57 0.57 420  weighted avg 0.73 0.73 0.72 420,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.895 +/- 0.006 (in 3 folds) ROC-AUC (macro OvO): 0.903 +/- 0.006 (in 3 folds) au-PRC (weighted OvO): 0.891 +/- 0.006 (in 3 folds) au-PRC (macro OvO): 0.903 +/- 0.004 (in 3 folds) Accuracy: 0.721 +/- 0.023 (in 3 folds) MCC: 0.600 +/- 0.024 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.721 MCC: 0.584 Global evaluation column name: disease.separate_past_exposures Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.707 +/- 0.019 (in 3 folds) MCC: 0.585 +/- 0.030 (in 3 folds) Unknown/abstention proportion: 0.028 +/- 0.010 (in 2 folds) ROC-AUC (weighted OvO): 0.902 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.911 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.895 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.907 +/- 0.000 (in 1 folds) Global scores with abstention using column name disease.separate_past_exposures: Accuracy: 0.707 MCC: 0.569 Unknown/abstention proportion: 0.019 Abstention label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support  Covid19 0.79 0.70 0.74 47  HIV 0.88 0.83 0.85 87 Healthy/Background 0.69 0.82 0.75 191  Lupus 0.56 0.37 0.45 95  Unknown 0.00 0.00 0.00 0  accuracy 0.71 420  macro avg 0.58 
0.54 0.56 420  weighted avg 0.71 0.71 0.70 420
,,,


lasso_cv,lasso_cv.decision_thresholds_tuned
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.894 +/- 0.025 (in 3 folds) ROC-AUC (macro OvO): 0.905 +/- 0.029 (in 3 folds) au-PRC (weighted OvO): 0.906 +/- 0.016 (in 3 folds) au-PRC (macro OvO): 0.919 +/- 0.017 (in 3 folds) Accuracy: 0.590 +/- 0.105 (in 3 folds) MCC: 0.364 +/- 0.219 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.590 MCC: 0.394 Global evaluation column name: disease.separate_past_exposures Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.586 +/- 0.108 (in 3 folds) MCC: 0.349 +/- 0.240 (in 3 folds) Unknown/abstention proportion: 0.011 +/- 0.005 (in 2 folds) ROC-AUC (weighted OvO): 0.896 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.909 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.898 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.912 +/- 0.000 (in 1 folds) Global scores with abstention using column name disease.separate_past_exposures: Accuracy: 0.586 MCC: 0.387 Unknown/abstention proportion: 0.007 Abstention label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support  Covid19 1.00 0.38 0.55 47  HIV 1.00 0.38 0.55 87 Healthy/Background 0.53 0.96 0.69 191  Lupus 0.52 0.12 0.19 95  Unknown 0.00 0.00 0.00 0  accuracy 0.59 420  macro avg 0.61 0.37 0.40 420  weighted avg 0.68 0.59 0.53 420,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.894 +/- 0.025 (in 3 folds) ROC-AUC (macro OvO): 0.905 +/- 0.029 (in 3 folds) au-PRC (weighted OvO): 0.906 +/- 0.016 (in 3 folds) au-PRC (macro OvO): 0.919 +/- 0.017 (in 3 folds) Accuracy: 0.712 +/- 0.045 (in 3 folds) MCC: 0.584 +/- 0.056 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.712 MCC: 0.581 Global evaluation column name: disease.separate_past_exposures 
Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.707 +/- 0.041 (in 3 folds) MCC: 0.578 +/- 0.053 (in 3 folds) Unknown/abstention proportion: 0.011 +/- 0.005 (in 2 folds) ROC-AUC (weighted OvO): 0.896 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.909 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.898 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.912 +/- 0.000 (in 1 folds) Global scores with abstention using column name disease.separate_past_exposures: Accuracy: 0.707 MCC: 0.574 Unknown/abstention proportion: 0.007 Abstention label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support  Covid19 0.89 0.66 0.76 47  HIV 0.79 0.80 0.80 87 Healthy/Background 0.66 0.91 0.77 191  Lupus 0.73 0.23 0.35 95  Unknown 0.00 0.00 0.00 0  accuracy 0.71 420  macro avg 0.61 0.52 0.53 420  weighted avg 0.73 0.71 0.68 420
,


---

# GeneLocus.BCR, TargetObsColumnEnum.ethnicity_condensed_healthy_only trained on train_smaller set

## Specimen predictions on validation set

Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,Accuracy per fold with abstention,MCC per fold with abstention,Unknown/abstention proportion per fold with abstention,Accuracy global with abstention,MCC global with abstention,Unknown/abstention proportion global with abstention,Abstention label global with abstention,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes,ROC-AUC (weighted OvO) per fold with abstention,ROC-AUC (macro OvO) per fold with abstention,au-PRC (weighted OvO) per fold with abstention,au-PRC (macro OvO) per fold with abstention
elasticnet_cv,0.654 +/- 0.053 (in 3 folds),0.654 +/- 0.033 (in 3 folds),0.671 +/- 0.069 (in 3 folds),0.683 +/- 0.041 (in 3 folds),0.568 +/- 0.108 (in 3 folds),0.148 +/- 0.257 (in 3 folds),0.565,0.261,0.463 +/- 0.074 (in 3 folds),0.194 +/- 0.115 (in 3 folds),0.180 +/- 0.051 (in 3 folds),0.462,0.188,0.182,Unknown,108.0,24.0,132.0,0.181818,True,,,,
lasso_cv,0.633 +/- 0.068 (in 3 folds),0.621 +/- 0.056 (in 3 folds),0.655 +/- 0.085 (in 3 folds),0.651 +/- 0.062 (in 3 folds),0.519 +/- 0.120 (in 3 folds),0.069 +/- 0.119 (in 3 folds),0.513,0.15,0.437 +/- 0.056 (in 3 folds),0.131 +/- 0.051 (in 3 folds),0.143 +/- 0.097 (in 3 folds),0.439,0.11,0.144,Unknown,113.0,19.0,132.0,0.143939,True,,,,
rf_multiclass,0.628 +/- 0.041 (in 3 folds),0.622 +/- 0.029 (in 3 folds),0.636 +/- 0.023 (in 3 folds),0.618 +/- 0.014 (in 3 folds),0.579 +/- 0.026 (in 3 folds),0.295 +/- 0.101 (in 3 folds),0.581,0.318,0.543 +/- 0.061 (in 3 folds),0.257 +/- 0.071 (in 3 folds),0.095 +/- 0.072 (in 2 folds),0.545,0.288,0.061,Unknown,124.0,8.0,132.0,0.060606,True,0.634 +/- 0.000 (in 1 folds),0.634 +/- 0.000 (in 1 folds),0.619 +/- 0.000 (in 1 folds),0.605 +/- 0.000 (in 1 folds)
ridge_cv,0.618 +/- 0.107 (in 3 folds),0.636 +/- 0.120 (in 3 folds),0.621 +/- 0.117 (in 3 folds),0.647 +/- 0.132 (in 3 folds),0.529 +/- 0.111 (in 3 folds),0.059 +/- 0.101 (in 3 folds),0.528,0.115,0.430 +/- 0.061 (in 3 folds),0.129 +/- 0.048 (in 3 folds),0.180 +/- 0.051 (in 3 folds),0.432,0.122,0.182,Unknown,108.0,24.0,132.0,0.181818,True,,,,
xgboost,0.595 +/- 0.039 (in 3 folds),0.578 +/- 0.037 (in 3 folds),0.641 +/- 0.055 (in 3 folds),0.626 +/- 0.046 (in 3 folds),0.573 +/- 0.008 (in 3 folds),0.285 +/- 0.143 (in 3 folds),0.573,0.307,0.536 +/- 0.042 (in 3 folds),0.248 +/- 0.116 (in 3 folds),0.095 +/- 0.072 (in 2 folds),0.538,0.281,0.061,Unknown,124.0,8.0,132.0,0.060606,False,0.576 +/- 0.000 (in 1 folds),0.578 +/- 0.000 (in 1 folds),0.588 +/- 0.000 (in 1 folds),0.589 +/- 0.000 (in 1 folds)
lasso_multiclass,0.555 +/- 0.048 (in 3 folds),0.529 +/- 0.033 (in 3 folds),0.656 +/- 0.034 (in 3 folds),0.635 +/- 0.029 (in 3 folds),0.591 +/- 0.068 (in 3 folds),0.331 +/- 0.024 (in 3 folds),0.59,0.346,0.521 +/- 0.040 (in 3 folds),0.263 +/- 0.030 (in 3 folds),0.114 +/- 0.061 (in 3 folds),0.523,0.278,0.114,Unknown,117.0,15.0,132.0,0.113636,True,,,,
dummy_stratified,0.554 +/- 0.056 (in 3 folds),0.532 +/- 0.048 (in 3 folds),0.531 +/- 0.036 (in 3 folds),0.521 +/- 0.024 (in 3 folds),0.518 +/- 0.136 (in 3 folds),0.169 +/- 0.226 (in 3 folds),0.505,0.138,0.385 +/- 0.038 (in 3 folds),0.136 +/- 0.142 (in 3 folds),0.233 +/- 0.145 (in 3 folds),0.386,0.138,0.235,Unknown,101.0,31.0,132.0,0.234848,True,,,,
linearsvm_ovr,0.550 +/- 0.067 (in 3 folds),0.523 +/- 0.061 (in 3 folds),0.655 +/- 0.036 (in 3 folds),0.634 +/- 0.032 (in 3 folds),0.609 +/- 0.045 (in 3 folds),0.369 +/- 0.121 (in 3 folds),0.607,0.374,0.538 +/- 0.005 (in 3 folds),0.294 +/- 0.087 (in 3 folds),0.114 +/- 0.061 (in 3 folds),0.538,0.301,0.114,Unknown,117.0,15.0,132.0,0.113636,True,,,,
dummy_most_frequent,0.500 +/- 0.000 (in 3 folds),0.500 +/- 0.000 (in 3 folds),0.500 +/- 0.000 (in 3 folds),0.500 +/- 0.000 (in 3 folds),0.521 +/- 0.118 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.519,0.0,0.423 +/- 0.067 (in 3 folds),0.114 +/- 0.025 (in 3 folds),0.180 +/- 0.051 (in 3 folds),0.424,0.104,0.182,Unknown,108.0,24.0,132.0,0.181818,True,,,,
"All results, sorted",,,,,,,,,,,,,,,,,,,,,,,,

Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,Accuracy per fold with abstention,MCC per fold with abstention,Unknown/abstention proportion per fold with abstention,Accuracy global with abstention,MCC global with abstention,Unknown/abstention proportion global with abstention,Abstention label global with abstention,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes,ROC-AUC (weighted OvO) per fold with abstention,ROC-AUC (macro OvO) per fold with abstention,au-PRC (weighted OvO) per fold with abstention,au-PRC (macro OvO) per fold with abstention
elasticnet_cv,0.654 +/- 0.053 (in 3 folds),0.654 +/- 0.033 (in 3 folds),0.671 +/- 0.069 (in 3 folds),0.683 +/- 0.041 (in 3 folds),0.568 +/- 0.108 (in 3 folds),0.148 +/- 0.257 (in 3 folds),0.565,0.261,0.463 +/- 0.074 (in 3 folds),0.194 +/- 0.115 (in 3 folds),0.180 +/- 0.051 (in 3 folds),0.462,0.188,0.182,Unknown,108,24,132,0.181818,True,,,,
lasso_cv,0.633 +/- 0.068 (in 3 folds),0.621 +/- 0.056 (in 3 folds),0.655 +/- 0.085 (in 3 folds),0.651 +/- 0.062 (in 3 folds),0.519 +/- 0.120 (in 3 folds),0.069 +/- 0.119 (in 3 folds),0.513,0.15,0.437 +/- 0.056 (in 3 folds),0.131 +/- 0.051 (in 3 folds),0.143 +/- 0.097 (in 3 folds),0.439,0.11,0.144,Unknown,113,19,132,0.143939,True,,,,
rf_multiclass,0.628 +/- 0.041 (in 3 folds),0.622 +/- 0.029 (in 3 folds),0.636 +/- 0.023 (in 3 folds),0.618 +/- 0.014 (in 3 folds),0.579 +/- 0.026 (in 3 folds),0.295 +/- 0.101 (in 3 folds),0.581,0.318,0.543 +/- 0.061 (in 3 folds),0.257 +/- 0.071 (in 3 folds),0.095 +/- 0.072 (in 2 folds),0.545,0.288,0.061,Unknown,124,8,132,0.060606,True,0.634 +/- 0.000 (in 1 folds),0.634 +/- 0.000 (in 1 folds),0.619 +/- 0.000 (in 1 folds),0.605 +/- 0.000 (in 1 folds)
ridge_cv,0.618 +/- 0.107 (in 3 folds),0.636 +/- 0.120 (in 3 folds),0.621 +/- 0.117 (in 3 folds),0.647 +/- 0.132 (in 3 folds),0.529 +/- 0.111 (in 3 folds),0.059 +/- 0.101 (in 3 folds),0.528,0.115,0.430 +/- 0.061 (in 3 folds),0.129 +/- 0.048 (in 3 folds),0.180 +/- 0.051 (in 3 folds),0.432,0.122,0.182,Unknown,108,24,132,0.181818,True,,,,
xgboost,0.595 +/- 0.039 (in 3 folds),0.578 +/- 0.037 (in 3 folds),0.641 +/- 0.055 (in 3 folds),0.626 +/- 0.046 (in 3 folds),0.573 +/- 0.008 (in 3 folds),0.285 +/- 0.143 (in 3 folds),0.573,0.307,0.536 +/- 0.042 (in 3 folds),0.248 +/- 0.116 (in 3 folds),0.095 +/- 0.072 (in 2 folds),0.538,0.281,0.061,Unknown,124,8,132,0.060606,False,0.576 +/- 0.000 (in 1 folds),0.578 +/- 0.000 (in 1 folds),0.588 +/- 0.000 (in 1 folds),0.589 +/- 0.000 (in 1 folds)
lasso_multiclass,0.555 +/- 0.048 (in 3 folds),0.529 +/- 0.033 (in 3 folds),0.656 +/- 0.034 (in 3 folds),0.635 +/- 0.029 (in 3 folds),0.591 +/- 0.068 (in 3 folds),0.331 +/- 0.024 (in 3 folds),0.59,0.346,0.521 +/- 0.040 (in 3 folds),0.263 +/- 0.030 (in 3 folds),0.114 +/- 0.061 (in 3 folds),0.523,0.278,0.114,Unknown,117,15,132,0.113636,True,,,,
dummy_stratified,0.554 +/- 0.056 (in 3 folds),0.532 +/- 0.048 (in 3 folds),0.531 +/- 0.036 (in 3 folds),0.521 +/- 0.024 (in 3 folds),0.518 +/- 0.136 (in 3 folds),0.169 +/- 0.226 (in 3 folds),0.505,0.138,0.385 +/- 0.038 (in 3 folds),0.136 +/- 0.142 (in 3 folds),0.233 +/- 0.145 (in 3 folds),0.386,0.138,0.235,Unknown,101,31,132,0.234848,True,,,,
linearsvm_ovr,0.550 +/- 0.067 (in 3 folds),0.523 +/- 0.061 (in 3 folds),0.655 +/- 0.036 (in 3 folds),0.634 +/- 0.032 (in 3 folds),0.609 +/- 0.045 (in 3 folds),0.369 +/- 0.121 (in 3 folds),0.607,0.374,0.538 +/- 0.005 (in 3 folds),0.294 +/- 0.087 (in 3 folds),0.114 +/- 0.061 (in 3 folds),0.538,0.301,0.114,Unknown,117,15,132,0.113636,True,,,,
dummy_most_frequent,0.500 +/- 0.000 (in 3 folds),0.500 +/- 0.000 (in 3 folds),0.500 +/- 0.000 (in 3 folds),0.500 +/- 0.000 (in 3 folds),0.521 +/- 0.118 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.519,0.0,0.423 +/- 0.067 (in 3 folds),0.114 +/- 0.025 (in 3 folds),0.180 +/- 0.051 (in 3 folds),0.424,0.104,0.182,Unknown,108,24,132,0.181818,True,,,,


elasticnet_cv,lasso_cv,rf_multiclass,ridge_cv
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.654 +/- 0.053 (in 3 folds) ROC-AUC (macro OvO): 0.654 +/- 0.033 (in 3 folds) au-PRC (weighted OvO): 0.671 +/- 0.069 (in 3 folds) au-PRC (macro OvO): 0.683 +/- 0.041 (in 3 folds) Accuracy: 0.568 +/- 0.108 (in 3 folds) MCC: 0.148 +/- 0.257 (in 3 folds) Global scores without abstention: Accuracy: 0.565 MCC: 0.261 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.463 +/- 0.074 (in 3 folds) MCC: 0.194 +/- 0.115 (in 3 folds) Unknown/abstention proportion: 0.180 +/- 0.051 (in 3 folds) Global scores with abstention: Accuracy: 0.462 MCC: 0.188 Unknown/abstention proportion: 0.182 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  African 1.00 0.14 0.24 36  Asian 0.00 0.00 0.00 30  Caucasian 0.54 0.92 0.68 61 Hispanic/Latino 0.00 0.00 0.00 5  Unknown 0.00 0.00 0.00 0  accuracy 0.46 132  macro avg 0.31 0.21 0.19 132  weighted avg 0.52 0.46 0.38 132,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.633 +/- 0.068 (in 3 folds) ROC-AUC (macro OvO): 0.621 +/- 0.056 (in 3 folds) au-PRC (weighted OvO): 0.655 +/- 0.085 (in 3 folds) au-PRC (macro OvO): 0.651 +/- 0.062 (in 3 folds) Accuracy: 0.519 +/- 0.120 (in 3 folds) MCC: 0.069 +/- 0.119 (in 3 folds) Global scores without abstention: Accuracy: 0.513 MCC: 0.150 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.437 +/- 0.056 (in 3 folds) MCC: 0.131 +/- 0.051 (in 3 folds) Unknown/abstention proportion: 0.143 +/- 0.097 (in 3 folds) Global scores with abstention: Accuracy: 0.439 MCC: 0.110 Unknown/abstention proportion: 0.144 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  African 1.00 0.06 0.11 36  Asian 0.00 0.00 0.00 30  Caucasian 0.50 0.92 0.65 61 Hispanic/Latino 0.00 0.00 0.00 5  Unknown 0.00 0.00 0.00 0  accuracy 0.44 132  
macro avg 0.30 0.19 0.15 132  weighted avg 0.51 0.44 0.33 132,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.628 +/- 0.041 (in 3 folds) ROC-AUC (macro OvO): 0.622 +/- 0.029 (in 3 folds) au-PRC (weighted OvO): 0.636 +/- 0.023 (in 3 folds) au-PRC (macro OvO): 0.618 +/- 0.014 (in 3 folds) Accuracy: 0.579 +/- 0.026 (in 3 folds) MCC: 0.295 +/- 0.101 (in 3 folds) Global scores without abstention: Accuracy: 0.581 MCC: 0.318 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.543 +/- 0.061 (in 3 folds) MCC: 0.257 +/- 0.071 (in 3 folds) Unknown/abstention proportion: 0.095 +/- 0.072 (in 2 folds) ROC-AUC (weighted OvO): 0.634 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.634 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.619 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.605 +/- 0.000 (in 1 folds) Global scores with abstention: Accuracy: 0.545 MCC: 0.288 Unknown/abstention proportion: 0.061 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  African 0.63 0.53 0.58 36  Asian 0.00 0.00 0.00 30  Caucasian 0.56 0.87 0.68 61 Hispanic/Latino 0.00 0.00 0.00 5  Unknown 0.00 0.00 0.00 0  accuracy 0.55 132  macro avg 0.24 0.28 0.25 132  weighted avg 0.43 0.55 0.47 132,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.618 +/- 0.107 (in 3 folds) ROC-AUC (macro OvO): 0.636 +/- 0.120 (in 3 folds) au-PRC (weighted OvO): 0.621 +/- 0.117 (in 3 folds) au-PRC (macro OvO): 0.647 +/- 0.132 (in 3 folds) Accuracy: 0.529 +/- 0.111 (in 3 folds) MCC: 0.059 +/- 0.101 (in 3 folds) Global scores without abstention: Accuracy: 0.528 MCC: 0.115 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.430 +/- 0.061 (in 3 folds) MCC: 0.129 +/- 0.048 (in 3 folds) Unknown/abstention proportion: 0.180 +/- 0.051 (in 3 folds) Global scores with abstention: Accuracy: 0.432 MCC: 0.122 Unknown/abstention proportion: 0.182 
Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  African 1.00 0.03 0.05 36  Asian 0.00 0.00 0.00 30  Caucasian 0.52 0.92 0.67 61 Hispanic/Latino 0.00 0.00 0.00 5  Unknown 0.00 0.00 0.00 0  accuracy 0.43 132  macro avg 0.30 0.19 0.14 132  weighted avg 0.51 0.43 0.32 132
,,,


xgboost,lasso_multiclass,dummy_stratified,linearsvm_ovr
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.595 +/- 0.039 (in 3 folds) ROC-AUC (macro OvO): 0.578 +/- 0.037 (in 3 folds) au-PRC (weighted OvO): 0.641 +/- 0.055 (in 3 folds) au-PRC (macro OvO): 0.626 +/- 0.046 (in 3 folds) Accuracy: 0.573 +/- 0.008 (in 3 folds) MCC: 0.285 +/- 0.143 (in 3 folds) Global scores without abstention: Accuracy: 0.573 MCC: 0.307 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.536 +/- 0.042 (in 3 folds) MCC: 0.248 +/- 0.116 (in 3 folds) Unknown/abstention proportion: 0.095 +/- 0.072 (in 2 folds) ROC-AUC (weighted OvO): 0.576 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.578 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.588 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.589 +/- 0.000 (in 1 folds) Global scores with abstention: Accuracy: 0.538 MCC: 0.281 Unknown/abstention proportion: 0.061 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  African 0.66 0.53 0.58 36  Asian 0.67 0.07 0.12 30  Caucasian 0.56 0.82 0.67 61 Hispanic/Latino 0.00 0.00 0.00 5  Unknown 0.00 0.00 0.00 0  accuracy 0.54 132  macro avg 0.38 0.28 0.27 132  weighted avg 0.59 0.54 0.50 132,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.555 +/- 0.048 (in 3 folds) ROC-AUC (macro OvO): 0.529 +/- 0.033 (in 3 folds) au-PRC (weighted OvO): 0.656 +/- 0.034 (in 3 folds) au-PRC (macro OvO): 0.635 +/- 0.029 (in 3 folds) Accuracy: 0.591 +/- 0.068 (in 3 folds) MCC: 0.331 +/- 0.024 (in 3 folds) Global scores without abstention: Accuracy: 0.590 MCC: 0.346 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.521 +/- 0.040 (in 3 folds) MCC: 0.263 +/- 0.030 (in 3 folds) Unknown/abstention proportion: 0.114 +/- 0.061 (in 3 folds) Global scores with abstention: Accuracy: 0.523 MCC: 0.278 Unknown/abstention proportion: 0.114 Abstention label: Unknown Global classification report with 
abstention:  precision recall f1-score support  African 0.62 0.64 0.63 36  Asian 0.00 0.00 0.00 30  Caucasian 0.57 0.75 0.65 61 Hispanic/Latino 0.00 0.00 0.00 5  Unknown 0.00 0.00 0.00 0  accuracy 0.52 132  macro avg 0.24 0.28 0.26 132  weighted avg 0.44 0.52 0.47 132,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.554 +/- 0.056 (in 3 folds) ROC-AUC (macro OvO): 0.532 +/- 0.048 (in 3 folds) au-PRC (weighted OvO): 0.531 +/- 0.036 (in 3 folds) au-PRC (macro OvO): 0.521 +/- 0.024 (in 3 folds) Accuracy: 0.518 +/- 0.136 (in 3 folds) MCC: 0.169 +/- 0.226 (in 3 folds) Global scores without abstention: Accuracy: 0.505 MCC: 0.138 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.385 +/- 0.038 (in 3 folds) MCC: 0.136 +/- 0.142 (in 3 folds) Unknown/abstention proportion: 0.233 +/- 0.145 (in 3 folds) Global scores with abstention: Accuracy: 0.386 MCC: 0.138 Unknown/abstention proportion: 0.235 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  African 0.11 0.03 0.04 36  Asian 0.44 0.37 0.40 30  Caucasian 0.58 0.64 0.61 61 Hispanic/Latino 0.00 0.00 0.00 5  Unknown 0.00 0.00 0.00 0  accuracy 0.39 132  macro avg 0.23 0.21 0.21 132  weighted avg 0.40 0.39 0.38 132,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.550 +/- 0.067 (in 3 folds) ROC-AUC (macro OvO): 0.523 +/- 0.061 (in 3 folds) au-PRC (weighted OvO): 0.655 +/- 0.036 (in 3 folds) au-PRC (macro OvO): 0.634 +/- 0.032 (in 3 folds) Accuracy: 0.609 +/- 0.045 (in 3 folds) MCC: 0.369 +/- 0.121 (in 3 folds) Global scores without abstention: Accuracy: 0.607 MCC: 0.374 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.538 +/- 0.005 (in 3 folds) MCC: 0.294 +/- 0.087 (in 3 folds) Unknown/abstention proportion: 0.114 +/- 0.061 (in 3 folds) Global scores with abstention: Accuracy: 0.538 MCC: 0.301 Unknown/abstention proportion: 0.114 
Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  African 0.68 0.64 0.66 36  Asian 0.00 0.00 0.00 30  Caucasian 0.59 0.79 0.67 61 Hispanic/Latino 0.00 0.00 0.00 5  Unknown 0.00 0.00 0.00 0  accuracy 0.54 132  macro avg 0.25 0.29 0.27 132  weighted avg 0.46 0.54 0.49 132
,,,


dummy_most_frequent
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.500 +/- 0.000 (in 3 folds) ROC-AUC (macro OvO): 0.500 +/- 0.000 (in 3 folds) au-PRC (weighted OvO): 0.500 +/- 0.000 (in 3 folds) au-PRC (macro OvO): 0.500 +/- 0.000 (in 3 folds) Accuracy: 0.521 +/- 0.118 (in 3 folds) MCC: 0.000 +/- 0.000 (in 3 folds) Global scores without abstention: Accuracy: 0.519 MCC: 0.000 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.423 +/- 0.067 (in 3 folds) MCC: 0.114 +/- 0.025 (in 3 folds) Unknown/abstention proportion: 0.180 +/- 0.051 (in 3 folds) Global scores with abstention: Accuracy: 0.424 MCC: 0.104 Unknown/abstention proportion: 0.182 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  African 0.00 0.00 0.00 36  Asian 0.00 0.00 0.00 30  Caucasian 0.52 0.92 0.66 61 Hispanic/Latino 0.00 0.00 0.00 5  Unknown 0.00 0.00 0.00 0  accuracy 0.42 132  macro avg 0.10 0.18 0.13 132  weighted avg 0.24 0.42 0.31 132


## Apply train-smaller model -- Test set performance - With and without tuning on validation set

Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,Accuracy per fold with abstention,MCC per fold with abstention,Unknown/abstention proportion per fold with abstention,Accuracy global with abstention,MCC global with abstention,Unknown/abstention proportion global with abstention,Abstention label global with abstention,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes,ROC-AUC (weighted OvO) per fold with abstention,ROC-AUC (macro OvO) per fold with abstention,au-PRC (weighted OvO) per fold with abstention,au-PRC (macro OvO) per fold with abstention
elasticnet_cv,0.639 +/- 0.040 (in 3 folds),0.664 +/- 0.060 (in 3 folds),0.660 +/- 0.035 (in 3 folds),0.682 +/- 0.056 (in 3 folds),0.597 +/- 0.074 (in 3 folds),0.132 +/- 0.122 (in 3 folds),0.601,0.174,0.540 +/- 0.080 (in 3 folds),0.099 +/- 0.103 (in 3 folds),0.096 +/- 0.047 (in 3 folds),0.545,0.11,0.094,Unknown,173.0,18.0,191.0,0.094241,True,,,,
elasticnet_cv.decision_thresholds_tuned,0.639 +/- 0.040 (in 3 folds),0.664 +/- 0.060 (in 3 folds),0.660 +/- 0.035 (in 3 folds),0.682 +/- 0.056 (in 3 folds),0.519 +/- 0.101 (in 3 folds),0.261 +/- 0.044 (in 3 folds),0.52,0.216,0.471 +/- 0.111 (in 3 folds),0.220 +/- 0.047 (in 3 folds),0.096 +/- 0.047 (in 3 folds),0.471,0.189,0.094,Unknown,173.0,18.0,191.0,0.094241,False,,,,
lasso_cv,0.618 +/- 0.052 (in 3 folds),0.636 +/- 0.091 (in 3 folds),0.635 +/- 0.038 (in 3 folds),0.649 +/- 0.073 (in 3 folds),0.597 +/- 0.103 (in 3 folds),0.163 +/- 0.166 (in 3 folds),0.602,0.191,0.550 +/- 0.113 (in 3 folds),0.111 +/- 0.113 (in 3 folds),0.081 +/- 0.050 (in 3 folds),0.555,0.11,0.079,Unknown,176.0,15.0,191.0,0.078534,True,,,,
lasso_cv.decision_thresholds_tuned,0.618 +/- 0.052 (in 3 folds),0.636 +/- 0.091 (in 3 folds),0.635 +/- 0.038 (in 3 folds),0.649 +/- 0.073 (in 3 folds),0.499 +/- 0.145 (in 3 folds),0.219 +/- 0.115 (in 3 folds),0.494,0.204,0.456 +/- 0.127 (in 3 folds),0.181 +/- 0.082 (in 3 folds),0.081 +/- 0.050 (in 3 folds),0.455,0.184,0.079,Unknown,176.0,15.0,191.0,0.078534,False,,,,
rf_multiclass,0.612 +/- 0.066 (in 3 folds),0.620 +/- 0.073 (in 3 folds),0.634 +/- 0.077 (in 3 folds),0.641 +/- 0.108 (in 3 folds),0.568 +/- 0.078 (in 3 folds),0.165 +/- 0.172 (in 3 folds),0.571,0.143,0.547 +/- 0.062 (in 3 folds),0.153 +/- 0.158 (in 3 folds),0.053 +/- 0.010 (in 2 folds),0.55,0.138,0.037,Unknown,184.0,7.0,191.0,0.036649,True,0.688 +/- 0.000 (in 1 folds),0.702 +/- 0.000 (in 1 folds),0.722 +/- 0.000 (in 1 folds),0.764 +/- 0.000 (in 1 folds)
rf_multiclass.decision_thresholds_tuned,0.612 +/- 0.066 (in 3 folds),0.620 +/- 0.073 (in 3 folds),0.634 +/- 0.077 (in 3 folds),0.641 +/- 0.108 (in 3 folds),0.619 +/- 0.027 (in 3 folds),0.282 +/- 0.043 (in 3 folds),0.62,0.253,0.597 +/- 0.019 (in 3 folds),0.265 +/- 0.059 (in 3 folds),0.053 +/- 0.010 (in 2 folds),0.597,0.235,0.037,Unknown,184.0,7.0,191.0,0.036649,True,0.688 +/- 0.000 (in 1 folds),0.702 +/- 0.000 (in 1 folds),0.722 +/- 0.000 (in 1 folds),0.764 +/- 0.000 (in 1 folds)
ridge_cv,0.586 +/- 0.076 (in 3 folds),0.603 +/- 0.092 (in 3 folds),0.605 +/- 0.094 (in 3 folds),0.621 +/- 0.105 (in 3 folds),0.569 +/- 0.076 (in 3 folds),-0.022 +/- 0.037 (in 3 folds),0.572,-0.045,0.514 +/- 0.077 (in 3 folds),0.015 +/- 0.023 (in 3 folds),0.096 +/- 0.047 (in 3 folds),0.518,0.01,0.094,Unknown,173.0,18.0,191.0,0.094241,True,,,,
ridge_cv.decision_thresholds_tuned,0.586 +/- 0.076 (in 3 folds),0.603 +/- 0.092 (in 3 folds),0.605 +/- 0.094 (in 3 folds),0.621 +/- 0.105 (in 3 folds),0.356 +/- 0.244 (in 3 folds),0.044 +/- 0.077 (in 3 folds),0.358,0.084,0.319 +/- 0.217 (in 3 folds),0.004 +/- 0.098 (in 3 folds),0.096 +/- 0.047 (in 3 folds),0.325,0.074,0.094,Unknown,173.0,18.0,191.0,0.094241,True,,,,
xgboost,0.571 +/- 0.025 (in 3 folds),0.556 +/- 0.031 (in 3 folds),0.623 +/- 0.023 (in 3 folds),0.624 +/- 0.046 (in 3 folds),0.563 +/- 0.084 (in 3 folds),0.182 +/- 0.139 (in 3 folds),0.565,0.169,0.541 +/- 0.066 (in 3 folds),0.172 +/- 0.130 (in 3 folds),0.053 +/- 0.010 (in 2 folds),0.545,0.162,0.037,Unknown,184.0,7.0,191.0,0.036649,False,0.596 +/- 0.000 (in 1 folds),0.592 +/- 0.000 (in 1 folds),0.649 +/- 0.000 (in 1 folds),0.677 +/- 0.000 (in 1 folds)
xgboost.decision_thresholds_tuned,0.571 +/- 0.025 (in 3 folds),0.556 +/- 0.031 (in 3 folds),0.623 +/- 0.023 (in 3 folds),0.624 +/- 0.046 (in 3 folds),0.481 +/- 0.124 (in 3 folds),0.279 +/- 0.033 (in 3 folds),0.484,0.231,0.463 +/- 0.113 (in 3 folds),0.266 +/- 0.038 (in 3 folds),0.053 +/- 0.010 (in 2 folds),0.466,0.221,0.037,Unknown,184.0,7.0,191.0,0.036649,False,0.596 +/- 0.000 (in 1 folds),0.592 +/- 0.000 (in 1 folds),0.649 +/- 0.000 (in 1 folds),0.677 +/- 0.000 (in 1 folds)

Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,Accuracy per fold with abstention,MCC per fold with abstention,Unknown/abstention proportion per fold with abstention,Accuracy global with abstention,MCC global with abstention,Unknown/abstention proportion global with abstention,Abstention label global with abstention,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes,ROC-AUC (weighted OvO) per fold with abstention,ROC-AUC (macro OvO) per fold with abstention,au-PRC (weighted OvO) per fold with abstention,au-PRC (macro OvO) per fold with abstention
elasticnet_cv,0.639 +/- 0.040 (in 3 folds),0.664 +/- 0.060 (in 3 folds),0.660 +/- 0.035 (in 3 folds),0.682 +/- 0.056 (in 3 folds),0.597 +/- 0.074 (in 3 folds),0.132 +/- 0.122 (in 3 folds),0.601,0.174,0.540 +/- 0.080 (in 3 folds),0.099 +/- 0.103 (in 3 folds),0.096 +/- 0.047 (in 3 folds),0.545,0.11,0.094,Unknown,173,18,191,0.094241,True,,,,
elasticnet_cv.decision_thresholds_tuned,0.639 +/- 0.040 (in 3 folds),0.664 +/- 0.060 (in 3 folds),0.660 +/- 0.035 (in 3 folds),0.682 +/- 0.056 (in 3 folds),0.519 +/- 0.101 (in 3 folds),0.261 +/- 0.044 (in 3 folds),0.52,0.216,0.471 +/- 0.111 (in 3 folds),0.220 +/- 0.047 (in 3 folds),0.096 +/- 0.047 (in 3 folds),0.471,0.189,0.094,Unknown,173,18,191,0.094241,False,,,,
lasso_cv,0.618 +/- 0.052 (in 3 folds),0.636 +/- 0.091 (in 3 folds),0.635 +/- 0.038 (in 3 folds),0.649 +/- 0.073 (in 3 folds),0.597 +/- 0.103 (in 3 folds),0.163 +/- 0.166 (in 3 folds),0.602,0.191,0.550 +/- 0.113 (in 3 folds),0.111 +/- 0.113 (in 3 folds),0.081 +/- 0.050 (in 3 folds),0.555,0.11,0.079,Unknown,176,15,191,0.078534,True,,,,
lasso_cv.decision_thresholds_tuned,0.618 +/- 0.052 (in 3 folds),0.636 +/- 0.091 (in 3 folds),0.635 +/- 0.038 (in 3 folds),0.649 +/- 0.073 (in 3 folds),0.499 +/- 0.145 (in 3 folds),0.219 +/- 0.115 (in 3 folds),0.494,0.204,0.456 +/- 0.127 (in 3 folds),0.181 +/- 0.082 (in 3 folds),0.081 +/- 0.050 (in 3 folds),0.455,0.184,0.079,Unknown,176,15,191,0.078534,False,,,,
rf_multiclass,0.612 +/- 0.066 (in 3 folds),0.620 +/- 0.073 (in 3 folds),0.634 +/- 0.077 (in 3 folds),0.641 +/- 0.108 (in 3 folds),0.568 +/- 0.078 (in 3 folds),0.165 +/- 0.172 (in 3 folds),0.571,0.143,0.547 +/- 0.062 (in 3 folds),0.153 +/- 0.158 (in 3 folds),0.053 +/- 0.010 (in 2 folds),0.55,0.138,0.037,Unknown,184,7,191,0.036649,True,0.688 +/- 0.000 (in 1 folds),0.702 +/- 0.000 (in 1 folds),0.722 +/- 0.000 (in 1 folds),0.764 +/- 0.000 (in 1 folds)
rf_multiclass.decision_thresholds_tuned,0.612 +/- 0.066 (in 3 folds),0.620 +/- 0.073 (in 3 folds),0.634 +/- 0.077 (in 3 folds),0.641 +/- 0.108 (in 3 folds),0.619 +/- 0.027 (in 3 folds),0.282 +/- 0.043 (in 3 folds),0.62,0.253,0.597 +/- 0.019 (in 3 folds),0.265 +/- 0.059 (in 3 folds),0.053 +/- 0.010 (in 2 folds),0.597,0.235,0.037,Unknown,184,7,191,0.036649,True,0.688 +/- 0.000 (in 1 folds),0.702 +/- 0.000 (in 1 folds),0.722 +/- 0.000 (in 1 folds),0.764 +/- 0.000 (in 1 folds)
ridge_cv,0.586 +/- 0.076 (in 3 folds),0.603 +/- 0.092 (in 3 folds),0.605 +/- 0.094 (in 3 folds),0.621 +/- 0.105 (in 3 folds),0.569 +/- 0.076 (in 3 folds),-0.022 +/- 0.037 (in 3 folds),0.572,-0.045,0.514 +/- 0.077 (in 3 folds),0.015 +/- 0.023 (in 3 folds),0.096 +/- 0.047 (in 3 folds),0.518,0.01,0.094,Unknown,173,18,191,0.094241,True,,,,
ridge_cv.decision_thresholds_tuned,0.586 +/- 0.076 (in 3 folds),0.603 +/- 0.092 (in 3 folds),0.605 +/- 0.094 (in 3 folds),0.621 +/- 0.105 (in 3 folds),0.356 +/- 0.244 (in 3 folds),0.044 +/- 0.077 (in 3 folds),0.358,0.084,0.319 +/- 0.217 (in 3 folds),0.004 +/- 0.098 (in 3 folds),0.096 +/- 0.047 (in 3 folds),0.325,0.074,0.094,Unknown,173,18,191,0.094241,True,,,,
xgboost,0.571 +/- 0.025 (in 3 folds),0.556 +/- 0.031 (in 3 folds),0.623 +/- 0.023 (in 3 folds),0.624 +/- 0.046 (in 3 folds),0.563 +/- 0.084 (in 3 folds),0.182 +/- 0.139 (in 3 folds),0.565,0.169,0.541 +/- 0.066 (in 3 folds),0.172 +/- 0.130 (in 3 folds),0.053 +/- 0.010 (in 2 folds),0.545,0.162,0.037,Unknown,184,7,191,0.036649,False,0.596 +/- 0.000 (in 1 folds),0.592 +/- 0.000 (in 1 folds),0.649 +/- 0.000 (in 1 folds),0.677 +/- 0.000 (in 1 folds)
xgboost.decision_thresholds_tuned,0.571 +/- 0.025 (in 3 folds),0.556 +/- 0.031 (in 3 folds),0.623 +/- 0.023 (in 3 folds),0.624 +/- 0.046 (in 3 folds),0.481 +/- 0.124 (in 3 folds),0.279 +/- 0.033 (in 3 folds),0.484,0.231,0.463 +/- 0.113 (in 3 folds),0.266 +/- 0.038 (in 3 folds),0.053 +/- 0.010 (in 2 folds),0.466,0.221,0.037,Unknown,184,7,191,0.036649,False,0.596 +/- 0.000 (in 1 folds),0.592 +/- 0.000 (in 1 folds),0.649 +/- 0.000 (in 1 folds),0.677 +/- 0.000 (in 1 folds)


elasticnet_cv,elasticnet_cv.decision_thresholds_tuned,lasso_cv,lasso_cv.decision_thresholds_tuned
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.639 +/- 0.040 (in 3 folds) ROC-AUC (macro OvO): 0.664 +/- 0.060 (in 3 folds) au-PRC (weighted OvO): 0.660 +/- 0.035 (in 3 folds) au-PRC (macro OvO): 0.682 +/- 0.056 (in 3 folds) Accuracy: 0.597 +/- 0.074 (in 3 folds) MCC: 0.132 +/- 0.122 (in 3 folds) Global scores without abstention: Accuracy: 0.601 MCC: 0.174 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.540 +/- 0.080 (in 3 folds) MCC: 0.099 +/- 0.103 (in 3 folds) Unknown/abstention proportion: 0.096 +/- 0.047 (in 3 folds) Global scores with abstention: Accuracy: 0.545 MCC: 0.110 Unknown/abstention proportion: 0.094 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  African 0.75 0.14 0.23 44  Asian 0.00 0.00 0.00 32  Caucasian 0.59 0.90 0.72 109 Hispanic/Latino 0.00 0.00 0.00 6  Unknown 0.00 0.00 0.00 0  accuracy 0.54 191  macro avg 0.27 0.21 0.19 191  weighted avg 0.51 0.54 0.46 191,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.639 +/- 0.040 (in 3 folds) ROC-AUC (macro OvO): 0.664 +/- 0.060 (in 3 folds) au-PRC (weighted OvO): 0.660 +/- 0.035 (in 3 folds) au-PRC (macro OvO): 0.682 +/- 0.056 (in 3 folds) Accuracy: 0.519 +/- 0.101 (in 3 folds) MCC: 0.261 +/- 0.044 (in 3 folds) Global scores without abstention: Accuracy: 0.520 MCC: 0.216 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.471 +/- 0.111 (in 3 folds) MCC: 0.220 +/- 0.047 (in 3 folds) Unknown/abstention proportion: 0.096 +/- 0.047 (in 3 folds) Global scores with abstention: Accuracy: 0.471 MCC: 0.189 Unknown/abstention proportion: 0.094 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  African 0.50 0.55 0.52 44  Asian 0.21 0.22 0.21 32  Caucasian 0.67 0.54 0.60 109 Hispanic/Latino 0.00 0.00 0.00 6  Unknown 0.00 0.00 0.00 0  accuracy 0.47 191  
macro avg 0.28 0.26 0.27 191  weighted avg 0.53 0.47 0.50 191,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.618 +/- 0.052 (in 3 folds) ROC-AUC (macro OvO): 0.636 +/- 0.091 (in 3 folds) au-PRC (weighted OvO): 0.635 +/- 0.038 (in 3 folds) au-PRC (macro OvO): 0.649 +/- 0.073 (in 3 folds) Accuracy: 0.597 +/- 0.103 (in 3 folds) MCC: 0.163 +/- 0.166 (in 3 folds) Global scores without abstention: Accuracy: 0.602 MCC: 0.191 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.550 +/- 0.113 (in 3 folds) MCC: 0.111 +/- 0.113 (in 3 folds) Unknown/abstention proportion: 0.081 +/- 0.050 (in 3 folds) Global scores with abstention: Accuracy: 0.555 MCC: 0.110 Unknown/abstention proportion: 0.079 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  African 1.00 0.09 0.17 44  Asian 0.00 0.00 0.00 32  Caucasian 0.59 0.94 0.73 109 Hispanic/Latino 0.00 0.00 0.00 6  Unknown 0.00 0.00 0.00 0  accuracy 0.55 191  macro avg 0.32 0.21 0.18 191  weighted avg 0.57 0.55 0.45 191,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.618 +/- 0.052 (in 3 folds) ROC-AUC (macro OvO): 0.636 +/- 0.091 (in 3 folds) au-PRC (weighted OvO): 0.635 +/- 0.038 (in 3 folds) au-PRC (macro OvO): 0.649 +/- 0.073 (in 3 folds) Accuracy: 0.499 +/- 0.145 (in 3 folds) MCC: 0.219 +/- 0.115 (in 3 folds) Global scores without abstention: Accuracy: 0.494 MCC: 0.204 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.456 +/- 0.127 (in 3 folds) MCC: 0.181 +/- 0.082 (in 3 folds) Unknown/abstention proportion: 0.081 +/- 0.050 (in 3 folds) Global scores with abstention: Accuracy: 0.455 MCC: 0.184 Unknown/abstention proportion: 0.079 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  African 0.52 0.50 0.51 44  Asian 0.20 0.31 0.24 32  Caucasian 0.68 0.50 0.58 109 Hispanic/Latino 
0.00 0.00 0.00 6  Unknown 0.00 0.00 0.00 0  accuracy 0.46 191  macro avg 0.28 0.26 0.27 191  weighted avg 0.54 0.46 0.49 191
,,,


rf_multiclass,rf_multiclass.decision_thresholds_tuned,ridge_cv,ridge_cv.decision_thresholds_tuned
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.612 +/- 0.066 (in 3 folds) ROC-AUC (macro OvO): 0.620 +/- 0.073 (in 3 folds) au-PRC (weighted OvO): 0.634 +/- 0.077 (in 3 folds) au-PRC (macro OvO): 0.641 +/- 0.108 (in 3 folds) Accuracy: 0.568 +/- 0.078 (in 3 folds) MCC: 0.165 +/- 0.172 (in 3 folds) Global scores without abstention: Accuracy: 0.571 MCC: 0.143 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.547 +/- 0.062 (in 3 folds) MCC: 0.153 +/- 0.158 (in 3 folds) Unknown/abstention proportion: 0.053 +/- 0.010 (in 2 folds) ROC-AUC (weighted OvO): 0.688 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.702 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.722 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.764 +/- 0.000 (in 1 folds) Global scores with abstention: Accuracy: 0.550 MCC: 0.138 Unknown/abstention proportion: 0.037 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  African 0.50 0.34 0.41 44  Asian 0.20 0.03 0.05 32  Caucasian 0.60 0.82 0.69 109 Hispanic/Latino 0.00 0.00 0.00 6  Unknown 0.00 0.00 0.00 0  accuracy 0.55 191  macro avg 0.26 0.24 0.23 191  weighted avg 0.49 0.55 0.50 191,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.612 +/- 0.066 (in 3 folds) ROC-AUC (macro OvO): 0.620 +/- 0.073 (in 3 folds) au-PRC (weighted OvO): 0.634 +/- 0.077 (in 3 folds) au-PRC (macro OvO): 0.641 +/- 0.108 (in 3 folds) Accuracy: 0.619 +/- 0.027 (in 3 folds) MCC: 0.282 +/- 0.043 (in 3 folds) Global scores without abstention: Accuracy: 0.620 MCC: 0.253 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.597 +/- 0.019 (in 3 folds) MCC: 0.265 +/- 0.059 (in 3 folds) Unknown/abstention proportion: 0.053 +/- 0.010 (in 2 folds) ROC-AUC (weighted OvO): 0.688 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.702 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.722 +/- 0.000 (in 1 folds) 
au-PRC (macro OvO): 0.764 +/- 0.000 (in 1 folds) Global scores with abstention: Accuracy: 0.597 MCC: 0.235 Unknown/abstention proportion: 0.037 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  African 0.66 0.43 0.52 44  Asian 0.25 0.03 0.06 32  Caucasian 0.62 0.86 0.72 109 Hispanic/Latino 0.00 0.00 0.00 6  Unknown 0.00 0.00 0.00 0  accuracy 0.60 191  macro avg 0.31 0.27 0.26 191  weighted avg 0.55 0.60 0.54 191,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.586 +/- 0.076 (in 3 folds) ROC-AUC (macro OvO): 0.603 +/- 0.092 (in 3 folds) au-PRC (weighted OvO): 0.605 +/- 0.094 (in 3 folds) au-PRC (macro OvO): 0.621 +/- 0.105 (in 3 folds) Accuracy: 0.569 +/- 0.076 (in 3 folds) MCC: -0.022 +/- 0.037 (in 3 folds) Global scores without abstention: Accuracy: 0.572 MCC: -0.045 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.514 +/- 0.077 (in 3 folds) MCC: 0.015 +/- 0.023 (in 3 folds) Unknown/abstention proportion: 0.096 +/- 0.047 (in 3 folds) Global scores with abstention: Accuracy: 0.518 MCC: 0.010 Unknown/abstention proportion: 0.094 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  African 0.00 0.00 0.00 44  Asian 0.00 0.00 0.00 32  Caucasian 0.58 0.91 0.70 109 Hispanic/Latino 0.00 0.00 0.00 6  Unknown 0.00 0.00 0.00 0  accuracy 0.52 191  macro avg 0.12 0.18 0.14 191  weighted avg 0.33 0.52 0.40 191,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.586 +/- 0.076 (in 3 folds) ROC-AUC (macro OvO): 0.603 +/- 0.092 (in 3 folds) au-PRC (weighted OvO): 0.605 +/- 0.094 (in 3 folds) au-PRC (macro OvO): 0.621 +/- 0.105 (in 3 folds) Accuracy: 0.356 +/- 0.244 (in 3 folds) MCC: 0.044 +/- 0.077 (in 3 folds) Global scores without abstention: Accuracy: 0.358 MCC: 0.084 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.319 +/- 
0.217 (in 3 folds) MCC: 0.004 +/- 0.098 (in 3 folds) Unknown/abstention proportion: 0.096 +/- 0.047 (in 3 folds) Global scores with abstention: Accuracy: 0.325 MCC: 0.074 Unknown/abstention proportion: 0.094 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  African 0.28 0.36 0.31 44  Asian 0.18 0.38 0.25 32  Caucasian 0.68 0.31 0.43 109 Hispanic/Latino 0.00 0.00 0.00 6  Unknown 0.00 0.00 0.00 0  accuracy 0.32 191  macro avg 0.23 0.21 0.20 191  weighted avg 0.48 0.32 0.36 191
,,,


xgboost,xgboost.decision_thresholds_tuned,linearsvm_ovr,linearsvm_ovr.decision_thresholds_tuned
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.571 +/- 0.025 (in 3 folds) ROC-AUC (macro OvO): 0.556 +/- 0.031 (in 3 folds) au-PRC (weighted OvO): 0.623 +/- 0.023 (in 3 folds) au-PRC (macro OvO): 0.624 +/- 0.046 (in 3 folds) Accuracy: 0.563 +/- 0.084 (in 3 folds) MCC: 0.182 +/- 0.139 (in 3 folds) Global scores without abstention: Accuracy: 0.565 MCC: 0.169 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.541 +/- 0.066 (in 3 folds) MCC: 0.172 +/- 0.130 (in 3 folds) Unknown/abstention proportion: 0.053 +/- 0.010 (in 2 folds) ROC-AUC (weighted OvO): 0.596 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.592 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.649 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.677 +/- 0.000 (in 1 folds) Global scores with abstention: Accuracy: 0.545 MCC: 0.162 Unknown/abstention proportion: 0.037 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  African 0.45 0.34 0.39 44  Asian 0.43 0.09 0.15 32  Caucasian 0.62 0.79 0.69 109 Hispanic/Latino 0.00 0.00 0.00 6  Unknown 0.00 0.00 0.00 0  accuracy 0.54 191  macro avg 0.30 0.24 0.25 191  weighted avg 0.53 0.54 0.51 191,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.571 +/- 0.025 (in 3 folds) ROC-AUC (macro OvO): 0.556 +/- 0.031 (in 3 folds) au-PRC (weighted OvO): 0.623 +/- 0.023 (in 3 folds) au-PRC (macro OvO): 0.624 +/- 0.046 (in 3 folds) Accuracy: 0.481 +/- 0.124 (in 3 folds) MCC: 0.279 +/- 0.033 (in 3 folds) Global scores without abstention: Accuracy: 0.484 MCC: 0.231 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.463 +/- 0.113 (in 3 folds) MCC: 0.266 +/- 0.038 (in 3 folds) Unknown/abstention proportion: 0.053 +/- 0.010 (in 2 folds) ROC-AUC (weighted OvO): 0.596 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.592 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.649 +/- 0.000 (in 1 folds) 
au-PRC (macro OvO): 0.677 +/- 0.000 (in 1 folds) Global scores with abstention: Accuracy: 0.466 MCC: 0.221 Unknown/abstention proportion: 0.037 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  African 0.50 0.68 0.58 44  Asian 0.33 0.19 0.24 32  Caucasian 0.66 0.47 0.55 109 Hispanic/Latino 0.07 0.33 0.11 6  Unknown 0.00 0.00 0.00 0  accuracy 0.47 191  macro avg 0.31 0.33 0.30 191  weighted avg 0.55 0.47 0.49 191,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.540 +/- 0.023 (in 3 folds) ROC-AUC (macro OvO): 0.514 +/- 0.015 (in 3 folds) au-PRC (weighted OvO): 0.613 +/- 0.032 (in 3 folds) au-PRC (macro OvO): 0.591 +/- 0.024 (in 3 folds) Accuracy: 0.604 +/- 0.015 (in 3 folds) MCC: 0.271 +/- 0.022 (in 3 folds) Global scores without abstention: Accuracy: 0.604 MCC: 0.244 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.576 +/- 0.007 (in 3 folds) MCC: 0.250 +/- 0.016 (in 3 folds) Unknown/abstention proportion: 0.047 +/- 0.013 (in 3 folds) Global scores with abstention: Accuracy: 0.576 MCC: 0.225 Unknown/abstention proportion: 0.047 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  African 0.49 0.48 0.48 44  Asian 0.67 0.06 0.11 32  Caucasian 0.64 0.80 0.71 109 Hispanic/Latino 0.00 0.00 0.00 6  Unknown 0.00 0.00 0.00 0  accuracy 0.58 191  macro avg 0.36 0.27 0.26 191  weighted avg 0.59 0.58 0.54 191,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.540 +/- 0.023 (in 3 folds) ROC-AUC (macro OvO): 0.514 +/- 0.015 (in 3 folds) au-PRC (weighted OvO): 0.613 +/- 0.032 (in 3 folds) au-PRC (macro OvO): 0.591 +/- 0.024 (in 3 folds) Accuracy: 0.620 +/- 0.041 (in 3 folds) MCC: 0.274 +/- 0.064 (in 3 folds) Global scores without abstention: Accuracy: 0.621 MCC: 0.261 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.591 +/- 
0.033 (in 3 folds) MCC: 0.250 +/- 0.053 (in 3 folds) Unknown/abstention proportion: 0.047 +/- 0.013 (in 3 folds) Global scores with abstention: Accuracy: 0.592 MCC: 0.237 Unknown/abstention proportion: 0.047 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  African 0.54 0.43 0.48 44  Asian 1.00 0.03 0.06 32  Caucasian 0.64 0.85 0.73 109 Hispanic/Latino 0.00 0.00 0.00 6  Unknown 0.00 0.00 0.00 0  accuracy 0.59 191  macro avg 0.44 0.26 0.25 191  weighted avg 0.66 0.59 0.54 191
,,,


lasso_multiclass,lasso_multiclass.decision_thresholds_tuned
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.540 +/- 0.011 (in 3 folds) ROC-AUC (macro OvO): 0.512 +/- 0.029 (in 3 folds) au-PRC (weighted OvO): 0.620 +/- 0.019 (in 3 folds) au-PRC (macro OvO): 0.598 +/- 0.011 (in 3 folds) Accuracy: 0.599 +/- 0.010 (in 3 folds) MCC: 0.280 +/- 0.046 (in 3 folds) Global scores without abstention: Accuracy: 0.599 MCC: 0.242 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.571 +/- 0.017 (in 3 folds) MCC: 0.258 +/- 0.037 (in 3 folds) Unknown/abstention proportion: 0.047 +/- 0.013 (in 3 folds) Global scores with abstention: Accuracy: 0.571 MCC: 0.224 Unknown/abstention proportion: 0.047 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  African 0.49 0.52 0.51 44  Asian 0.67 0.06 0.11 32  Caucasian 0.64 0.77 0.70 109 Hispanic/Latino 0.00 0.00 0.00 6  Unknown 0.00 0.00 0.00 0  accuracy 0.57 191  macro avg 0.36 0.27 0.26 191  weighted avg 0.59 0.57 0.53 191,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.540 +/- 0.011 (in 3 folds) ROC-AUC (macro OvO): 0.512 +/- 0.029 (in 3 folds) au-PRC (weighted OvO): 0.620 +/- 0.019 (in 3 folds) au-PRC (macro OvO): 0.598 +/- 0.011 (in 3 folds) Accuracy: 0.611 +/- 0.029 (in 3 folds) MCC: 0.248 +/- 0.136 (in 3 folds) Global scores without abstention: Accuracy: 0.610 MCC: 0.241 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.583 +/- 0.033 (in 3 folds) MCC: 0.229 +/- 0.120 (in 3 folds) Unknown/abstention proportion: 0.047 +/- 0.013 (in 3 folds) Global scores with abstention: Accuracy: 0.581 MCC: 0.221 Unknown/abstention proportion: 0.047 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  African 0.62 0.41 0.49 44  Asian 0.11 0.03 0.05 32  Caucasian 0.64 0.84 0.73 109 Hispanic/Latino 0.00 0.00 0.00 6  Unknown 0.00 0.00 0.00 0  accuracy 0.58 191  
macro avg 0.27 0.26 0.25 191  weighted avg 0.53 0.58 0.54 191
,


---

# GeneLocus.BCR, TargetObsColumnEnum.age_group_healthy_only trained on train_smaller set

## Specimen predictions on validation set

Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,Accuracy per fold with abstention,MCC per fold with abstention,Unknown/abstention proportion per fold with abstention,Accuracy global with abstention,MCC global with abstention,Unknown/abstention proportion global with abstention,Abstention label global with abstention,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes,ROC-AUC (weighted OvO) per fold with abstention,ROC-AUC (macro OvO) per fold with abstention,au-PRC (weighted OvO) per fold with abstention,au-PRC (macro OvO) per fold with abstention
linearsvm_ovr,0.537 +/- 0.058 (in 3 folds),0.534 +/- 0.056 (in 3 folds),0.626 +/- 0.063 (in 3 folds),0.626 +/- 0.062 (in 3 folds),0.215 +/- 0.030 (in 3 folds),0.066 +/- 0.016 (in 3 folds),0.215,0.053,0.212 +/- 0.028 (in 3 folds),0.066 +/- 0.017 (in 3 folds),0.022 +/- 0.000 (in 2 folds),0.212,0.051,0.015,Unknown,130.0,2.0,132.0,0.015152,True,0.603 +/- 0.000 (in 1 folds),0.594 +/- 0.000 (in 1 folds),0.699 +/- 0.000 (in 1 folds),0.695 +/- 0.000 (in 1 folds)
dummy_stratified,0.536 +/- 0.026 (in 3 folds),0.535 +/- 0.030 (in 3 folds),0.549 +/- 0.018 (in 3 folds),0.549 +/- 0.018 (in 3 folds),0.222 +/- 0.043 (in 3 folds),0.080 +/- 0.049 (in 3 folds),0.22,0.065,0.206 +/- 0.034 (in 3 folds),0.068 +/- 0.040 (in 3 folds),0.102 +/- 0.040 (in 2 folds),0.205,0.057,0.068,Unknown,123.0,9.0,132.0,0.068182,True,0.507 +/- 0.000 (in 1 folds),0.501 +/- 0.000 (in 1 folds),0.529 +/- 0.000 (in 1 folds),0.529 +/- 0.000 (in 1 folds)
lasso_cv,0.533 +/- 0.041 (in 3 folds),0.530 +/- 0.040 (in 3 folds),0.614 +/- 0.045 (in 3 folds),0.614 +/- 0.043 (in 3 folds),0.214 +/- 0.020 (in 3 folds),0.108 +/- 0.038 (in 3 folds),0.213,0.06,0.205 +/- 0.013 (in 3 folds),0.095 +/- 0.031 (in 3 folds),0.039 +/- 0.030 (in 3 folds),0.205,0.057,0.038,Unknown,127.0,5.0,132.0,0.037879,True,,,,
lasso_multiclass,0.529 +/- 0.030 (in 3 folds),0.523 +/- 0.036 (in 3 folds),0.628 +/- 0.036 (in 3 folds),0.624 +/- 0.041 (in 3 folds),0.241 +/- 0.053 (in 3 folds),0.110 +/- 0.051 (in 3 folds),0.227,0.088,0.188 +/- 0.039 (in 3 folds),0.084 +/- 0.016 (in 3 folds),0.267 +/- 0.347 (in 2 folds),0.189,0.077,0.167,Unknown,110.0,22.0,132.0,0.166667,False,0.562 +/- 0.000 (in 1 folds),0.565 +/- 0.000 (in 1 folds),0.650 +/- 0.000 (in 1 folds),0.651 +/- 0.000 (in 1 folds)
xgboost,0.525 +/- 0.053 (in 3 folds),0.523 +/- 0.049 (in 3 folds),0.584 +/- 0.074 (in 3 folds),0.582 +/- 0.068 (in 3 folds),0.235 +/- 0.011 (in 3 folds),0.007 +/- 0.132 (in 3 folds),0.239,0.092,0.168 +/- 0.107 (in 3 folds),0.052 +/- 0.048 (in 3 folds),0.298 +/- 0.435 (in 3 folds),0.167,0.059,0.303,Unknown,92.0,40.0,132.0,0.30303,True,,,,
rf_multiclass,0.517 +/- 0.039 (in 3 folds),0.517 +/- 0.045 (in 3 folds),0.584 +/- 0.019 (in 3 folds),0.585 +/- 0.023 (in 3 folds),0.228 +/- 0.036 (in 3 folds),0.076 +/- 0.018 (in 3 folds),0.229,0.069,0.226 +/- 0.037 (in 3 folds),0.076 +/- 0.018 (in 3 folds),0.022 +/- 0.000 (in 1 folds),0.227,0.065,0.008,Unknown,131.0,1.0,132.0,0.007576,True,0.535 +/- 0.031 (in 2 folds),0.539 +/- 0.033 (in 2 folds),0.587 +/- 0.026 (in 2 folds),0.591 +/- 0.028 (in 2 folds)
dummy_most_frequent,0.500 +/- 0.000 (in 3 folds),0.500 +/- 0.000 (in 3 folds),0.500 +/- 0.000 (in 3 folds),0.500 +/- 0.000 (in 3 folds),0.372 +/- 0.176 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.241,0.131,0.101 +/- 0.064 (in 3 folds),0.048 +/- 0.043 (in 3 folds),0.857 +/- 0.080 (in 2 folds),0.098,0.027,0.591,Unknown,54.0,78.0,132.0,0.590909,True,0.500 +/- 0.000 (in 1 folds),0.500 +/- 0.000 (in 1 folds),0.500 +/- 0.000 (in 1 folds),0.500 +/- 0.000 (in 1 folds)
elasticnet_cv,0.366 +/- 0.319 (in 3 folds),0.365 +/- 0.318 (in 3 folds),0.560 +/- 0.131 (in 3 folds),0.562 +/- 0.130 (in 3 folds),0.305 +/- 0.169 (in 3 folds),0.088 +/- 0.076 (in 3 folds),0.221,0.06,0.146 +/- 0.089 (in 3 folds),0.096 +/- 0.030 (in 3 folds),0.336 +/- 0.500 (in 3 folds),0.144,0.043,0.348,Unknown,86.0,46.0,132.0,0.348485,True,,,,
ridge_cv,0.355 +/- 0.310 (in 3 folds),0.354 +/- 0.309 (in 3 folds),0.530 +/- 0.128 (in 3 folds),0.530 +/- 0.124 (in 3 folds),0.372 +/- 0.176 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.241,0.131,0.101 +/- 0.064 (in 3 folds),0.048 +/- 0.043 (in 3 folds),0.857 +/- 0.080 (in 2 folds),0.098,0.027,0.591,Unknown,54.0,78.0,132.0,0.590909,True,0.576 +/- 0.000 (in 1 folds),0.563 +/- 0.000 (in 1 folds),0.670 +/- 0.000 (in 1 folds),0.663 +/- 0.000 (in 1 folds)
"All results, sorted",,,,,,,,,,,,,,,,,,,,,,,,

Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,Accuracy per fold with abstention,MCC per fold with abstention,Unknown/abstention proportion per fold with abstention,Accuracy global with abstention,MCC global with abstention,Unknown/abstention proportion global with abstention,Abstention label global with abstention,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes,ROC-AUC (weighted OvO) per fold with abstention,ROC-AUC (macro OvO) per fold with abstention,au-PRC (weighted OvO) per fold with abstention,au-PRC (macro OvO) per fold with abstention
linearsvm_ovr,0.537 +/- 0.058 (in 3 folds),0.534 +/- 0.056 (in 3 folds),0.626 +/- 0.063 (in 3 folds),0.626 +/- 0.062 (in 3 folds),0.215 +/- 0.030 (in 3 folds),0.066 +/- 0.016 (in 3 folds),0.215,0.053,0.212 +/- 0.028 (in 3 folds),0.066 +/- 0.017 (in 3 folds),0.022 +/- 0.000 (in 2 folds),0.212,0.051,0.015,Unknown,130,2,132,0.015152,True,0.603 +/- 0.000 (in 1 folds),0.594 +/- 0.000 (in 1 folds),0.699 +/- 0.000 (in 1 folds),0.695 +/- 0.000 (in 1 folds)
dummy_stratified,0.536 +/- 0.026 (in 3 folds),0.535 +/- 0.030 (in 3 folds),0.549 +/- 0.018 (in 3 folds),0.549 +/- 0.018 (in 3 folds),0.222 +/- 0.043 (in 3 folds),0.080 +/- 0.049 (in 3 folds),0.22,0.065,0.206 +/- 0.034 (in 3 folds),0.068 +/- 0.040 (in 3 folds),0.102 +/- 0.040 (in 2 folds),0.205,0.057,0.068,Unknown,123,9,132,0.068182,True,0.507 +/- 0.000 (in 1 folds),0.501 +/- 0.000 (in 1 folds),0.529 +/- 0.000 (in 1 folds),0.529 +/- 0.000 (in 1 folds)
lasso_cv,0.533 +/- 0.041 (in 3 folds),0.530 +/- 0.040 (in 3 folds),0.614 +/- 0.045 (in 3 folds),0.614 +/- 0.043 (in 3 folds),0.214 +/- 0.020 (in 3 folds),0.108 +/- 0.038 (in 3 folds),0.213,0.06,0.205 +/- 0.013 (in 3 folds),0.095 +/- 0.031 (in 3 folds),0.039 +/- 0.030 (in 3 folds),0.205,0.057,0.038,Unknown,127,5,132,0.037879,True,,,,
lasso_multiclass,0.529 +/- 0.030 (in 3 folds),0.523 +/- 0.036 (in 3 folds),0.628 +/- 0.036 (in 3 folds),0.624 +/- 0.041 (in 3 folds),0.241 +/- 0.053 (in 3 folds),0.110 +/- 0.051 (in 3 folds),0.227,0.088,0.188 +/- 0.039 (in 3 folds),0.084 +/- 0.016 (in 3 folds),0.267 +/- 0.347 (in 2 folds),0.189,0.077,0.167,Unknown,110,22,132,0.166667,False,0.562 +/- 0.000 (in 1 folds),0.565 +/- 0.000 (in 1 folds),0.650 +/- 0.000 (in 1 folds),0.651 +/- 0.000 (in 1 folds)
xgboost,0.525 +/- 0.053 (in 3 folds),0.523 +/- 0.049 (in 3 folds),0.584 +/- 0.074 (in 3 folds),0.582 +/- 0.068 (in 3 folds),0.235 +/- 0.011 (in 3 folds),0.007 +/- 0.132 (in 3 folds),0.239,0.092,0.168 +/- 0.107 (in 3 folds),0.052 +/- 0.048 (in 3 folds),0.298 +/- 0.435 (in 3 folds),0.167,0.059,0.303,Unknown,92,40,132,0.30303,True,,,,
rf_multiclass,0.517 +/- 0.039 (in 3 folds),0.517 +/- 0.045 (in 3 folds),0.584 +/- 0.019 (in 3 folds),0.585 +/- 0.023 (in 3 folds),0.228 +/- 0.036 (in 3 folds),0.076 +/- 0.018 (in 3 folds),0.229,0.069,0.226 +/- 0.037 (in 3 folds),0.076 +/- 0.018 (in 3 folds),0.022 +/- 0.000 (in 1 folds),0.227,0.065,0.008,Unknown,131,1,132,0.007576,True,0.535 +/- 0.031 (in 2 folds),0.539 +/- 0.033 (in 2 folds),0.587 +/- 0.026 (in 2 folds),0.591 +/- 0.028 (in 2 folds)
dummy_most_frequent,0.500 +/- 0.000 (in 3 folds),0.500 +/- 0.000 (in 3 folds),0.500 +/- 0.000 (in 3 folds),0.500 +/- 0.000 (in 3 folds),0.372 +/- 0.176 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.241,0.131,0.101 +/- 0.064 (in 3 folds),0.048 +/- 0.043 (in 3 folds),0.857 +/- 0.080 (in 2 folds),0.098,0.027,0.591,Unknown,54,78,132,0.590909,True,0.500 +/- 0.000 (in 1 folds),0.500 +/- 0.000 (in 1 folds),0.500 +/- 0.000 (in 1 folds),0.500 +/- 0.000 (in 1 folds)
elasticnet_cv,0.366 +/- 0.319 (in 3 folds),0.365 +/- 0.318 (in 3 folds),0.560 +/- 0.131 (in 3 folds),0.562 +/- 0.130 (in 3 folds),0.305 +/- 0.169 (in 3 folds),0.088 +/- 0.076 (in 3 folds),0.221,0.06,0.146 +/- 0.089 (in 3 folds),0.096 +/- 0.030 (in 3 folds),0.336 +/- 0.500 (in 3 folds),0.144,0.043,0.348,Unknown,86,46,132,0.348485,True,,,,
ridge_cv,0.355 +/- 0.310 (in 3 folds),0.354 +/- 0.309 (in 3 folds),0.530 +/- 0.128 (in 3 folds),0.530 +/- 0.124 (in 3 folds),0.372 +/- 0.176 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.241,0.131,0.101 +/- 0.064 (in 3 folds),0.048 +/- 0.043 (in 3 folds),0.857 +/- 0.080 (in 2 folds),0.098,0.027,0.591,Unknown,54,78,132,0.590909,True,0.576 +/- 0.000 (in 1 folds),0.563 +/- 0.000 (in 1 folds),0.670 +/- 0.000 (in 1 folds),0.663 +/- 0.000 (in 1 folds)


linearsvm_ovr,dummy_stratified,lasso_cv,lasso_multiclass
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.537 +/- 0.058 (in 3 folds) ROC-AUC (macro OvO): 0.534 +/- 0.056 (in 3 folds) au-PRC (weighted OvO): 0.626 +/- 0.063 (in 3 folds) au-PRC (macro OvO): 0.626 +/- 0.062 (in 3 folds) Accuracy: 0.215 +/- 0.030 (in 3 folds) MCC: 0.066 +/- 0.016 (in 3 folds) Global scores without abstention: Accuracy: 0.215 MCC: 0.053 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.212 +/- 0.028 (in 3 folds) MCC: 0.066 +/- 0.017 (in 3 folds) Unknown/abstention proportion: 0.022 +/- 0.000 (in 2 folds) ROC-AUC (weighted OvO): 0.603 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.594 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.699 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.695 +/- 0.000 (in 1 folds) Global scores with abstention: Accuracy: 0.212 MCC: 0.051 Unknown/abstention proportion: 0.015 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  20-30 0.25 0.16 0.20 25  30-40 0.12 0.05 0.07 20  40-50 0.14 0.17 0.15 18  50-60 0.19 0.37 0.25 27  60-70 0.29 0.33 0.31 15  70-80 0.00 0.00 0.00 3  <20 0.36 0.21 0.26 24  Unknown 0.00 0.00 0.00 0  accuracy 0.21 132  macro avg 0.17 0.16 0.16 132 weighted avg 0.22 0.21 0.20 132,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.536 +/- 0.026 (in 3 folds) ROC-AUC (macro OvO): 0.535 +/- 0.030 (in 3 folds) au-PRC (weighted OvO): 0.549 +/- 0.018 (in 3 folds) au-PRC (macro OvO): 0.549 +/- 0.018 (in 3 folds) Accuracy: 0.222 +/- 0.043 (in 3 folds) MCC: 0.080 +/- 0.049 (in 3 folds) Global scores without abstention: Accuracy: 0.220 MCC: 0.065 Per-fold scores with abstention (note that abstentions not included in probability-based scores): ROC-AUC (weighted OvO): 0.507 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.501 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.529 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.529 +/- 0.000 (in 1 folds) Accuracy: 0.206 +/- 0.034 (in 3 
folds) MCC: 0.068 +/- 0.040 (in 3 folds) Unknown/abstention proportion: 0.102 +/- 0.040 (in 2 folds) Global scores with abstention: Accuracy: 0.205 MCC: 0.057 Unknown/abstention proportion: 0.068 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  20-30 0.26 0.20 0.23 25  30-40 0.12 0.10 0.11 20  40-50 0.50 0.33 0.40 18  50-60 0.26 0.30 0.28 27  60-70 0.05 0.07 0.05 15  70-80 0.00 0.00 0.00 3  <20 0.23 0.21 0.22 24  Unknown 0.00 0.00 0.00 0  accuracy 0.20 132  macro avg 0.18 0.15 0.16 132 weighted avg 0.24 0.20 0.22 132,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.533 +/- 0.041 (in 3 folds) ROC-AUC (macro OvO): 0.530 +/- 0.040 (in 3 folds) au-PRC (weighted OvO): 0.614 +/- 0.045 (in 3 folds) au-PRC (macro OvO): 0.614 +/- 0.043 (in 3 folds) Accuracy: 0.214 +/- 0.020 (in 3 folds) MCC: 0.108 +/- 0.038 (in 3 folds) Global scores without abstention: Accuracy: 0.213 MCC: 0.060 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.205 +/- 0.013 (in 3 folds) MCC: 0.095 +/- 0.031 (in 3 folds) Unknown/abstention proportion: 0.039 +/- 0.030 (in 3 folds) Global scores with abstention: Accuracy: 0.205 MCC: 0.057 Unknown/abstention proportion: 0.038 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  20-30 0.29 0.20 0.24 25  30-40 0.20 0.05 0.08 20  40-50 0.06 0.06 0.06 18  50-60 0.20 0.22 0.21 27  60-70 0.19 0.40 0.26 15  70-80 0.00 0.00 0.00 3  <20 0.32 0.33 0.33 24  Unknown 0.00 0.00 0.00 0  accuracy 0.20 132  macro avg 0.16 0.16 0.15 132 weighted avg 0.21 0.20 0.20 132,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.529 +/- 0.030 (in 3 folds) ROC-AUC (macro OvO): 0.523 +/- 0.036 (in 3 folds) au-PRC (weighted OvO): 0.628 +/- 0.036 (in 3 folds) au-PRC (macro OvO): 0.624 +/- 0.041 (in 3 folds) Accuracy: 0.241 +/- 0.053 (in 3 folds) MCC: 0.110 +/- 0.051 (in 3 folds) Global scores 
without abstention: Accuracy: 0.227 MCC: 0.088 Per-fold scores with abstention (note that abstentions not included in probability-based scores): ROC-AUC (weighted OvO): 0.562 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.565 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.650 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.651 +/- 0.000 (in 1 folds) Accuracy: 0.188 +/- 0.039 (in 3 folds) MCC: 0.084 +/- 0.016 (in 3 folds) Unknown/abstention proportion: 0.267 +/- 0.347 (in 2 folds) Global scores with abstention: Accuracy: 0.189 MCC: 0.077 Unknown/abstention proportion: 0.167 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  20-30 0.60 0.24 0.34 25  30-40 0.14 0.05 0.07 20  40-50 0.09 0.11 0.10 18  50-60 0.35 0.26 0.30 27  60-70 0.17 0.40 0.24 15  70-80 0.00 0.00 0.00 3  <20 0.23 0.12 0.16 24  Unknown 0.00 0.00 0.00 0  accuracy 0.19 132  macro avg 0.20 0.15 0.15 132 weighted avg 0.28 0.19 0.21 132
,,,


xgboost,rf_multiclass,dummy_most_frequent,elasticnet_cv
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.525 +/- 0.053 (in 3 folds) ROC-AUC (macro OvO): 0.523 +/- 0.049 (in 3 folds) au-PRC (weighted OvO): 0.584 +/- 0.074 (in 3 folds) au-PRC (macro OvO): 0.582 +/- 0.068 (in 3 folds) Accuracy: 0.235 +/- 0.011 (in 3 folds) MCC: 0.007 +/- 0.132 (in 3 folds) Global scores without abstention: Accuracy: 0.239 MCC: 0.092 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.168 +/- 0.107 (in 3 folds) MCC: 0.052 +/- 0.048 (in 3 folds) Unknown/abstention proportion: 0.298 +/- 0.435 (in 3 folds) Global scores with abstention: Accuracy: 0.167 MCC: 0.059 Unknown/abstention proportion: 0.303 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  20-30 0.23 0.12 0.16 25  30-40 0.10 0.05 0.07 20  40-50 0.11 0.11 0.11 18  50-60 0.32 0.22 0.26 27  60-70 0.33 0.20 0.25 15  70-80 0.00 0.00 0.00 3  <20 0.30 0.29 0.30 24  Unknown 0.00 0.00 0.00 0  accuracy 0.17 132  macro avg 0.17 0.12 0.14 132 weighted avg 0.23 0.17 0.19 132,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.517 +/- 0.039 (in 3 folds) ROC-AUC (macro OvO): 0.517 +/- 0.045 (in 3 folds) au-PRC (weighted OvO): 0.584 +/- 0.019 (in 3 folds) au-PRC (macro OvO): 0.585 +/- 0.023 (in 3 folds) Accuracy: 0.228 +/- 0.036 (in 3 folds) MCC: 0.076 +/- 0.018 (in 3 folds) Global scores without abstention: Accuracy: 0.229 MCC: 0.069 Per-fold scores with abstention (note that abstentions not included in probability-based scores): ROC-AUC (weighted OvO): 0.535 +/- 0.031 (in 2 folds) ROC-AUC (macro OvO): 0.539 +/- 0.033 (in 2 folds) au-PRC (weighted OvO): 0.587 +/- 0.026 (in 2 folds) au-PRC (macro OvO): 0.591 +/- 0.028 (in 2 folds) Accuracy: 0.226 +/- 0.037 (in 3 folds) MCC: 0.076 +/- 0.018 (in 3 folds) Unknown/abstention proportion: 0.022 +/- 0.000 (in 1 folds) Global scores with abstention: Accuracy: 0.227 MCC: 0.065 Unknown/abstention proportion: 0.008 
Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  20-30 0.38 0.12 0.18 25  30-40 0.10 0.05 0.07 20  40-50 0.06 0.06 0.06 18  50-60 0.23 0.59 0.33 27  60-70 0.33 0.27 0.30 15  70-80 0.00 0.00 0.00 3  <20 0.36 0.21 0.26 24  Unknown 0.00 0.00 0.00 0  accuracy 0.23 132  macro avg 0.18 0.16 0.15 132 weighted avg 0.24 0.23 0.20 132,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.500 +/- 0.000 (in 3 folds) ROC-AUC (macro OvO): 0.500 +/- 0.000 (in 3 folds) au-PRC (weighted OvO): 0.500 +/- 0.000 (in 3 folds) au-PRC (macro OvO): 0.500 +/- 0.000 (in 3 folds) Accuracy: 0.372 +/- 0.176 (in 3 folds) MCC: 0.000 +/- 0.000 (in 3 folds) Global scores without abstention: Accuracy: 0.241 MCC: 0.131 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.101 +/- 0.064 (in 3 folds) MCC: 0.048 +/- 0.043 (in 3 folds) Unknown/abstention proportion: 0.857 +/- 0.080 (in 2 folds) ROC-AUC (weighted OvO): 0.500 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.500 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.500 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.500 +/- 0.000 (in 1 folds) Global scores with abstention: Accuracy: 0.098 MCC: 0.027 Unknown/abstention proportion: 0.591 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  20-30 0.00 0.00 0.00 25  30-40 0.00 0.00 0.00 20  40-50 0.00 0.00 0.00 18  50-60 0.22 0.41 0.29 27  60-70 0.50 0.13 0.21 15  70-80 0.00 0.00 0.00 3  <20 0.00 0.00 0.00 24  Unknown 0.00 0.00 0.00 0  accuracy 0.10 132  macro avg 0.09 0.07 0.06 132 weighted avg 0.10 0.10 0.08 132,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.366 +/- 0.319 (in 3 folds) ROC-AUC (macro OvO): 0.365 +/- 0.318 (in 3 folds) au-PRC (weighted OvO): 0.560 +/- 0.131 (in 3 folds) au-PRC (macro OvO): 0.562 +/- 0.130 (in 3 folds) Accuracy: 0.305 +/- 0.169 (in 3 folds) MCC: 0.088 +/- 0.076 (in 3 folds) Global 
scores without abstention: Accuracy: 0.221 MCC: 0.060 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.146 +/- 0.089 (in 3 folds) MCC: 0.096 +/- 0.030 (in 3 folds) Unknown/abstention proportion: 0.336 +/- 0.500 (in 3 folds) Global scores with abstention: Accuracy: 0.144 MCC: 0.043 Unknown/abstention proportion: 0.348 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  20-30 0.28 0.20 0.23 25  30-40 0.00 0.00 0.00 20  40-50 0.00 0.00 0.00 18  50-60 0.18 0.22 0.20 27  60-70 0.17 0.33 0.23 15  70-80 0.00 0.00 0.00 3  <20 0.60 0.12 0.21 24  Unknown 0.00 0.00 0.00 0  accuracy 0.14 132  macro avg 0.15 0.11 0.11 132 weighted avg 0.22 0.14 0.15 132
,,,


ridge_cv
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.355 +/- 0.310 (in 3 folds) ROC-AUC (macro OvO): 0.354 +/- 0.309 (in 3 folds) au-PRC (weighted OvO): 0.530 +/- 0.128 (in 3 folds) au-PRC (macro OvO): 0.530 +/- 0.124 (in 3 folds) Accuracy: 0.372 +/- 0.176 (in 3 folds) MCC: 0.000 +/- 0.000 (in 3 folds) Global scores without abstention: Accuracy: 0.241 MCC: 0.131 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.101 +/- 0.064 (in 3 folds) MCC: 0.048 +/- 0.043 (in 3 folds) Unknown/abstention proportion: 0.857 +/- 0.080 (in 2 folds) ROC-AUC (weighted OvO): 0.576 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.563 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.670 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.663 +/- 0.000 (in 1 folds) Global scores with abstention: Accuracy: 0.098 MCC: 0.027 Unknown/abstention proportion: 0.591 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  20-30 0.00 0.00 0.00 25  30-40 0.00 0.00 0.00 20  40-50 0.00 0.00 0.00 18  50-60 0.22 0.41 0.29 27  60-70 0.50 0.13 0.21 15  70-80 0.00 0.00 0.00 3  <20 0.00 0.00 0.00 24  Unknown 0.00 0.00 0.00 0  accuracy 0.10 132  macro avg 0.09 0.07 0.06 132 weighted avg 0.10 0.10 0.08 132


## Apply train-smaller model -- Test set performance - With and without tuning on validation set

Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,Accuracy per fold with abstention,MCC per fold with abstention,Unknown/abstention proportion per fold with abstention,ROC-AUC (weighted OvO) per fold with abstention,ROC-AUC (macro OvO) per fold with abstention,au-PRC (weighted OvO) per fold with abstention,au-PRC (macro OvO) per fold with abstention,Accuracy global with abstention,MCC global with abstention,Unknown/abstention proportion global with abstention,Abstention label global with abstention,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
lasso_cv,0.558 +/- 0.074 (in 3 folds),0.552 +/- 0.078 (in 3 folds),0.601 +/- 0.066 (in 3 folds),0.595 +/- 0.063 (in 3 folds),0.180 +/- 0.032 (in 3 folds),0.069 +/- 0.050 (in 3 folds),0.18,0.007,0.173 +/- 0.036 (in 3 folds),0.062 +/- 0.054 (in 3 folds),0.065 +/- 0.006 (in 2 folds),0.643 +/- 0.000 (in 1 folds),0.642 +/- 0.000 (in 1 folds),0.677 +/- 0.000 (in 1 folds),0.666 +/- 0.000 (in 1 folds),0.173,0.005,0.042,Unknown,183.0,8.0,191.0,0.041885,True
lasso_cv.decision_thresholds_tuned,0.558 +/- 0.074 (in 3 folds),0.552 +/- 0.078 (in 3 folds),0.601 +/- 0.066 (in 3 folds),0.595 +/- 0.063 (in 3 folds),0.199 +/- 0.060 (in 3 folds),0.092 +/- 0.084 (in 3 folds),0.202,0.042,0.192 +/- 0.067 (in 3 folds),0.091 +/- 0.085 (in 3 folds),0.065 +/- 0.006 (in 2 folds),0.643 +/- 0.000 (in 1 folds),0.642 +/- 0.000 (in 1 folds),0.677 +/- 0.000 (in 1 folds),0.666 +/- 0.000 (in 1 folds),0.194,0.039,0.042,Unknown,183.0,8.0,191.0,0.041885,True
linearsvm_ovr,0.555 +/- 0.073 (in 3 folds),0.552 +/- 0.077 (in 3 folds),0.613 +/- 0.060 (in 3 folds),0.607 +/- 0.060 (in 3 folds),0.213 +/- 0.096 (in 3 folds),0.074 +/- 0.105 (in 3 folds),0.214,0.046,0.208 +/- 0.097 (in 3 folds),0.072 +/- 0.106 (in 3 folds),0.069 +/- 0.000 (in 1 folds),0.589 +/- 0.061 (in 2 folds),0.590 +/- 0.058 (in 2 folds),0.643 +/- 0.044 (in 2 folds),0.638 +/- 0.038 (in 2 folds),0.209,0.043,0.021,Unknown,187.0,4.0,191.0,0.020942,True
linearsvm_ovr.decision_thresholds_tuned,0.555 +/- 0.073 (in 3 folds),0.552 +/- 0.077 (in 3 folds),0.613 +/- 0.060 (in 3 folds),0.607 +/- 0.060 (in 3 folds),0.218 +/- 0.021 (in 3 folds),0.124 +/- 0.023 (in 3 folds),0.219,0.074,0.214 +/- 0.027 (in 3 folds),0.125 +/- 0.022 (in 3 folds),0.069 +/- 0.000 (in 1 folds),0.589 +/- 0.061 (in 2 folds),0.590 +/- 0.058 (in 2 folds),0.643 +/- 0.044 (in 2 folds),0.638 +/- 0.038 (in 2 folds),0.215,0.072,0.021,Unknown,187.0,4.0,191.0,0.020942,True
elasticnet_cv,0.544 +/- 0.092 (in 3 folds),0.539 +/- 0.095 (in 3 folds),0.607 +/- 0.062 (in 3 folds),0.604 +/- 0.056 (in 3 folds),0.108 +/- 0.099 (in 3 folds),0.056 +/- 0.051 (in 3 folds),0.157,-0.008,0.105 +/- 0.098 (in 3 folds),0.036 +/- 0.064 (in 3 folds),0.487 +/- 0.603 (in 2 folds),0.645 +/- 0.000 (in 1 folds),0.644 +/- 0.000 (in 1 folds),0.678 +/- 0.000 (in 1 folds),0.668 +/- 0.000 (in 1 folds),0.11,-0.021,0.298,Unknown,134.0,57.0,191.0,0.298429,True
elasticnet_cv.decision_thresholds_tuned,0.544 +/- 0.092 (in 3 folds),0.539 +/- 0.095 (in 3 folds),0.607 +/- 0.062 (in 3 folds),0.604 +/- 0.056 (in 3 folds),0.210 +/- 0.054 (in 3 folds),0.081 +/- 0.100 (in 3 folds),0.216,0.065,0.146 +/- 0.126 (in 3 folds),0.068 +/- 0.112 (in 3 folds),0.487 +/- 0.603 (in 2 folds),0.645 +/- 0.000 (in 1 folds),0.644 +/- 0.000 (in 1 folds),0.678 +/- 0.000 (in 1 folds),0.668 +/- 0.000 (in 1 folds),0.152,0.035,0.298,Unknown,134.0,57.0,191.0,0.298429,True
lasso_multiclass,0.544 +/- 0.066 (in 3 folds),0.541 +/- 0.070 (in 3 folds),0.600 +/- 0.053 (in 3 folds),0.601 +/- 0.056 (in 3 folds),0.201 +/- 0.010 (in 3 folds),0.065 +/- 0.032 (in 3 folds),0.203,0.052,0.168 +/- 0.055 (in 3 folds),0.056 +/- 0.036 (in 3 folds),0.254 +/- 0.262 (in 2 folds),0.619 +/- 0.000 (in 1 folds),0.621 +/- 0.000 (in 1 folds),0.648 +/- 0.000 (in 1 folds),0.649 +/- 0.000 (in 1 folds),0.168,0.042,0.173,Unknown,158.0,33.0,191.0,0.172775,False
lasso_multiclass.decision_thresholds_tuned,0.544 +/- 0.066 (in 3 folds),0.541 +/- 0.070 (in 3 folds),0.600 +/- 0.053 (in 3 folds),0.601 +/- 0.056 (in 3 folds),0.200 +/- 0.048 (in 3 folds),0.081 +/- 0.065 (in 3 folds),0.209,0.05,0.172 +/- 0.081 (in 3 folds),0.073 +/- 0.073 (in 3 folds),0.254 +/- 0.262 (in 2 folds),0.619 +/- 0.000 (in 1 folds),0.621 +/- 0.000 (in 1 folds),0.648 +/- 0.000 (in 1 folds),0.649 +/- 0.000 (in 1 folds),0.173,0.038,0.173,Unknown,158.0,33.0,191.0,0.172775,True
ridge_cv,0.537 +/- 0.015 (in 3 folds),0.536 +/- 0.018 (in 3 folds),0.608 +/- 0.021 (in 3 folds),0.614 +/- 0.025 (in 3 folds),0.091 +/- 0.084 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.108,-0.051,0.045 +/- 0.055 (in 3 folds),-0.015 +/- 0.015 (in 3 folds),0.867 +/- 0.066 (in 2 folds),0.531 +/- 0.000 (in 1 folds),0.533 +/- 0.000 (in 1 folds),0.585 +/- 0.000 (in 1 folds),0.585 +/- 0.000 (in 1 folds),0.047,-0.061,0.565,Unknown,83.0,108.0,191.0,0.565445,True
ridge_cv.decision_thresholds_tuned,0.537 +/- 0.015 (in 3 folds),0.536 +/- 0.018 (in 3 folds),0.608 +/- 0.021 (in 3 folds),0.614 +/- 0.025 (in 3 folds),0.131 +/- 0.118 (in 3 folds),0.039 +/- 0.068 (in 3 folds),0.205,0.081,0.086 +/- 0.124 (in 3 folds),0.025 +/- 0.081 (in 3 folds),0.867 +/- 0.066 (in 2 folds),0.531 +/- 0.000 (in 1 folds),0.533 +/- 0.000 (in 1 folds),0.585 +/- 0.000 (in 1 folds),0.585 +/- 0.000 (in 1 folds),0.089,0.008,0.565,Unknown,83.0,108.0,191.0,0.565445,True

Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,Accuracy per fold with abstention,MCC per fold with abstention,Unknown/abstention proportion per fold with abstention,ROC-AUC (weighted OvO) per fold with abstention,ROC-AUC (macro OvO) per fold with abstention,au-PRC (weighted OvO) per fold with abstention,au-PRC (macro OvO) per fold with abstention,Accuracy global with abstention,MCC global with abstention,Unknown/abstention proportion global with abstention,Abstention label global with abstention,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
lasso_cv,0.558 +/- 0.074 (in 3 folds),0.552 +/- 0.078 (in 3 folds),0.601 +/- 0.066 (in 3 folds),0.595 +/- 0.063 (in 3 folds),0.180 +/- 0.032 (in 3 folds),0.069 +/- 0.050 (in 3 folds),0.18,0.007,0.173 +/- 0.036 (in 3 folds),0.062 +/- 0.054 (in 3 folds),0.065 +/- 0.006 (in 2 folds),0.643 +/- 0.000 (in 1 folds),0.642 +/- 0.000 (in 1 folds),0.677 +/- 0.000 (in 1 folds),0.666 +/- 0.000 (in 1 folds),0.173,0.005,0.042,Unknown,183,8,191,0.041885,True
lasso_cv.decision_thresholds_tuned,0.558 +/- 0.074 (in 3 folds),0.552 +/- 0.078 (in 3 folds),0.601 +/- 0.066 (in 3 folds),0.595 +/- 0.063 (in 3 folds),0.199 +/- 0.060 (in 3 folds),0.092 +/- 0.084 (in 3 folds),0.202,0.042,0.192 +/- 0.067 (in 3 folds),0.091 +/- 0.085 (in 3 folds),0.065 +/- 0.006 (in 2 folds),0.643 +/- 0.000 (in 1 folds),0.642 +/- 0.000 (in 1 folds),0.677 +/- 0.000 (in 1 folds),0.666 +/- 0.000 (in 1 folds),0.194,0.039,0.042,Unknown,183,8,191,0.041885,True
linearsvm_ovr,0.555 +/- 0.073 (in 3 folds),0.552 +/- 0.077 (in 3 folds),0.613 +/- 0.060 (in 3 folds),0.607 +/- 0.060 (in 3 folds),0.213 +/- 0.096 (in 3 folds),0.074 +/- 0.105 (in 3 folds),0.214,0.046,0.208 +/- 0.097 (in 3 folds),0.072 +/- 0.106 (in 3 folds),0.069 +/- 0.000 (in 1 folds),0.589 +/- 0.061 (in 2 folds),0.590 +/- 0.058 (in 2 folds),0.643 +/- 0.044 (in 2 folds),0.638 +/- 0.038 (in 2 folds),0.209,0.043,0.021,Unknown,187,4,191,0.020942,True
linearsvm_ovr.decision_thresholds_tuned,0.555 +/- 0.073 (in 3 folds),0.552 +/- 0.077 (in 3 folds),0.613 +/- 0.060 (in 3 folds),0.607 +/- 0.060 (in 3 folds),0.218 +/- 0.021 (in 3 folds),0.124 +/- 0.023 (in 3 folds),0.219,0.074,0.214 +/- 0.027 (in 3 folds),0.125 +/- 0.022 (in 3 folds),0.069 +/- 0.000 (in 1 folds),0.589 +/- 0.061 (in 2 folds),0.590 +/- 0.058 (in 2 folds),0.643 +/- 0.044 (in 2 folds),0.638 +/- 0.038 (in 2 folds),0.215,0.072,0.021,Unknown,187,4,191,0.020942,True
elasticnet_cv,0.544 +/- 0.092 (in 3 folds),0.539 +/- 0.095 (in 3 folds),0.607 +/- 0.062 (in 3 folds),0.604 +/- 0.056 (in 3 folds),0.108 +/- 0.099 (in 3 folds),0.056 +/- 0.051 (in 3 folds),0.157,-0.008,0.105 +/- 0.098 (in 3 folds),0.036 +/- 0.064 (in 3 folds),0.487 +/- 0.603 (in 2 folds),0.645 +/- 0.000 (in 1 folds),0.644 +/- 0.000 (in 1 folds),0.678 +/- 0.000 (in 1 folds),0.668 +/- 0.000 (in 1 folds),0.11,-0.021,0.298,Unknown,134,57,191,0.298429,True
elasticnet_cv.decision_thresholds_tuned,0.544 +/- 0.092 (in 3 folds),0.539 +/- 0.095 (in 3 folds),0.607 +/- 0.062 (in 3 folds),0.604 +/- 0.056 (in 3 folds),0.210 +/- 0.054 (in 3 folds),0.081 +/- 0.100 (in 3 folds),0.216,0.065,0.146 +/- 0.126 (in 3 folds),0.068 +/- 0.112 (in 3 folds),0.487 +/- 0.603 (in 2 folds),0.645 +/- 0.000 (in 1 folds),0.644 +/- 0.000 (in 1 folds),0.678 +/- 0.000 (in 1 folds),0.668 +/- 0.000 (in 1 folds),0.152,0.035,0.298,Unknown,134,57,191,0.298429,True
lasso_multiclass,0.544 +/- 0.066 (in 3 folds),0.541 +/- 0.070 (in 3 folds),0.600 +/- 0.053 (in 3 folds),0.601 +/- 0.056 (in 3 folds),0.201 +/- 0.010 (in 3 folds),0.065 +/- 0.032 (in 3 folds),0.203,0.052,0.168 +/- 0.055 (in 3 folds),0.056 +/- 0.036 (in 3 folds),0.254 +/- 0.262 (in 2 folds),0.619 +/- 0.000 (in 1 folds),0.621 +/- 0.000 (in 1 folds),0.648 +/- 0.000 (in 1 folds),0.649 +/- 0.000 (in 1 folds),0.168,0.042,0.173,Unknown,158,33,191,0.172775,False
lasso_multiclass.decision_thresholds_tuned,0.544 +/- 0.066 (in 3 folds),0.541 +/- 0.070 (in 3 folds),0.600 +/- 0.053 (in 3 folds),0.601 +/- 0.056 (in 3 folds),0.200 +/- 0.048 (in 3 folds),0.081 +/- 0.065 (in 3 folds),0.209,0.05,0.172 +/- 0.081 (in 3 folds),0.073 +/- 0.073 (in 3 folds),0.254 +/- 0.262 (in 2 folds),0.619 +/- 0.000 (in 1 folds),0.621 +/- 0.000 (in 1 folds),0.648 +/- 0.000 (in 1 folds),0.649 +/- 0.000 (in 1 folds),0.173,0.038,0.173,Unknown,158,33,191,0.172775,True
ridge_cv,0.537 +/- 0.015 (in 3 folds),0.536 +/- 0.018 (in 3 folds),0.608 +/- 0.021 (in 3 folds),0.614 +/- 0.025 (in 3 folds),0.091 +/- 0.084 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.108,-0.051,0.045 +/- 0.055 (in 3 folds),-0.015 +/- 0.015 (in 3 folds),0.867 +/- 0.066 (in 2 folds),0.531 +/- 0.000 (in 1 folds),0.533 +/- 0.000 (in 1 folds),0.585 +/- 0.000 (in 1 folds),0.585 +/- 0.000 (in 1 folds),0.047,-0.061,0.565,Unknown,83,108,191,0.565445,True
ridge_cv.decision_thresholds_tuned,0.537 +/- 0.015 (in 3 folds),0.536 +/- 0.018 (in 3 folds),0.608 +/- 0.021 (in 3 folds),0.614 +/- 0.025 (in 3 folds),0.131 +/- 0.118 (in 3 folds),0.039 +/- 0.068 (in 3 folds),0.205,0.081,0.086 +/- 0.124 (in 3 folds),0.025 +/- 0.081 (in 3 folds),0.867 +/- 0.066 (in 2 folds),0.531 +/- 0.000 (in 1 folds),0.533 +/- 0.000 (in 1 folds),0.585 +/- 0.000 (in 1 folds),0.585 +/- 0.000 (in 1 folds),0.089,0.008,0.565,Unknown,83,108,191,0.565445,True


lasso_cv,lasso_cv.decision_thresholds_tuned,linearsvm_ovr,linearsvm_ovr.decision_thresholds_tuned
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.558 +/- 0.074 (in 3 folds) ROC-AUC (macro OvO): 0.552 +/- 0.078 (in 3 folds) au-PRC (weighted OvO): 0.601 +/- 0.066 (in 3 folds) au-PRC (macro OvO): 0.595 +/- 0.063 (in 3 folds) Accuracy: 0.180 +/- 0.032 (in 3 folds) MCC: 0.069 +/- 0.050 (in 3 folds) Global scores without abstention: Accuracy: 0.180 MCC: 0.007 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.173 +/- 0.036 (in 3 folds) MCC: 0.062 +/- 0.054 (in 3 folds) Unknown/abstention proportion: 0.065 +/- 0.006 (in 2 folds) ROC-AUC (weighted OvO): 0.643 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.642 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.677 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.666 +/- 0.000 (in 1 folds) Global scores with abstention: Accuracy: 0.173 MCC: 0.005 Unknown/abstention proportion: 0.042 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  20-30 0.20 0.23 0.21 35  30-40 0.00 0.00 0.00 23  40-50 0.20 0.14 0.17 28  50-60 0.15 0.21 0.17 39  60-70 0.16 0.22 0.19 27  70-80 0.00 0.00 0.00 4  <20 0.26 0.20 0.23 35  Unknown 0.00 0.00 0.00 0  accuracy 0.17 191  macro avg 0.12 0.12 0.12 191 weighted avg 0.17 0.17 0.17 191,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.558 +/- 0.074 (in 3 folds) ROC-AUC (macro OvO): 0.552 +/- 0.078 (in 3 folds) au-PRC (weighted OvO): 0.601 +/- 0.066 (in 3 folds) au-PRC (macro OvO): 0.595 +/- 0.063 (in 3 folds) Accuracy: 0.199 +/- 0.060 (in 3 folds) MCC: 0.092 +/- 0.084 (in 3 folds) Global scores without abstention: Accuracy: 0.202 MCC: 0.042 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.192 +/- 0.067 (in 3 folds) MCC: 0.091 +/- 0.085 (in 3 folds) Unknown/abstention proportion: 0.065 +/- 0.006 (in 2 folds) ROC-AUC (weighted OvO): 0.643 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.642 +/- 0.000 (in 1 folds) 
au-PRC (weighted OvO): 0.677 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.666 +/- 0.000 (in 1 folds) Global scores with abstention: Accuracy: 0.194 MCC: 0.039 Unknown/abstention proportion: 0.042 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  20-30 0.28 0.29 0.28 35  30-40 0.20 0.09 0.12 23  40-50 0.15 0.25 0.18 28  50-60 0.19 0.21 0.20 39  60-70 0.14 0.15 0.14 27  70-80 0.00 0.00 0.00 4  <20 0.35 0.17 0.23 35  Unknown 0.00 0.00 0.00 0  accuracy 0.19 191  macro avg 0.16 0.14 0.14 191 weighted avg 0.22 0.19 0.20 191,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.555 +/- 0.073 (in 3 folds) ROC-AUC (macro OvO): 0.552 +/- 0.077 (in 3 folds) au-PRC (weighted OvO): 0.613 +/- 0.060 (in 3 folds) au-PRC (macro OvO): 0.607 +/- 0.060 (in 3 folds) Accuracy: 0.213 +/- 0.096 (in 3 folds) MCC: 0.074 +/- 0.105 (in 3 folds) Global scores without abstention: Accuracy: 0.214 MCC: 0.046 Per-fold scores with abstention (note that abstentions not included in probability-based scores): ROC-AUC (weighted OvO): 0.589 +/- 0.061 (in 2 folds) ROC-AUC (macro OvO): 0.590 +/- 0.058 (in 2 folds) au-PRC (weighted OvO): 0.643 +/- 0.044 (in 2 folds) au-PRC (macro OvO): 0.638 +/- 0.038 (in 2 folds) Accuracy: 0.208 +/- 0.097 (in 3 folds) MCC: 0.072 +/- 0.106 (in 3 folds) Unknown/abstention proportion: 0.069 +/- 0.000 (in 1 folds) Global scores with abstention: Accuracy: 0.209 MCC: 0.043 Unknown/abstention proportion: 0.021 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  20-30 0.22 0.23 0.23 35  30-40 0.10 0.04 0.06 23  40-50 0.09 0.07 0.08 28  50-60 0.22 0.44 0.29 39  60-70 0.17 0.15 0.16 27  70-80 0.00 0.00 0.00 4  <20 0.44 0.23 0.30 35  Unknown 0.00 0.00 0.00 0  accuracy 0.21 191  macro avg 0.16 0.14 0.14 191 weighted avg 0.22 0.21 0.20 191,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.555 +/- 0.073 (in 3 folds) ROC-AUC (macro OvO): 0.552 +/- 0.077 
(in 3 folds) au-PRC (weighted OvO): 0.613 +/- 0.060 (in 3 folds) au-PRC (macro OvO): 0.607 +/- 0.060 (in 3 folds) Accuracy: 0.218 +/- 0.021 (in 3 folds) MCC: 0.124 +/- 0.023 (in 3 folds) Global scores without abstention: Accuracy: 0.219 MCC: 0.074 Per-fold scores with abstention (note that abstentions not included in probability-based scores): ROC-AUC (weighted OvO): 0.589 +/- 0.061 (in 2 folds) ROC-AUC (macro OvO): 0.590 +/- 0.058 (in 2 folds) au-PRC (weighted OvO): 0.643 +/- 0.044 (in 2 folds) au-PRC (macro OvO): 0.638 +/- 0.038 (in 2 folds) Accuracy: 0.214 +/- 0.027 (in 3 folds) MCC: 0.125 +/- 0.022 (in 3 folds) Unknown/abstention proportion: 0.069 +/- 0.000 (in 1 folds) Global scores with abstention: Accuracy: 0.215 MCC: 0.072 Unknown/abstention proportion: 0.021 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  20-30 0.26 0.23 0.24 35  30-40 0.19 0.22 0.20 23  40-50 0.00 0.00 0.00 28  50-60 0.17 0.13 0.15 39  60-70 0.13 0.37 0.20 27  70-80 0.00 0.00 0.00 4  <20 0.57 0.37 0.45 35  Unknown 0.00 0.00 0.00 0  accuracy 0.21 191  macro avg 0.17 0.16 0.15 191 weighted avg 0.23 0.21 0.21 191
,,,


elasticnet_cv,elasticnet_cv.decision_thresholds_tuned,lasso_multiclass,lasso_multiclass.decision_thresholds_tuned
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.544 +/- 0.092 (in 3 folds) ROC-AUC (macro OvO): 0.539 +/- 0.095 (in 3 folds) au-PRC (weighted OvO): 0.607 +/- 0.062 (in 3 folds) au-PRC (macro OvO): 0.604 +/- 0.056 (in 3 folds) Accuracy: 0.108 +/- 0.099 (in 3 folds) MCC: 0.056 +/- 0.051 (in 3 folds) Global scores without abstention: Accuracy: 0.157 MCC: -0.008 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.105 +/- 0.098 (in 3 folds) MCC: 0.036 +/- 0.064 (in 3 folds) Unknown/abstention proportion: 0.487 +/- 0.603 (in 2 folds) ROC-AUC (weighted OvO): 0.645 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.644 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.678 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.668 +/- 0.000 (in 1 folds) Global scores with abstention: Accuracy: 0.110 MCC: -0.021 Unknown/abstention proportion: 0.298 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  20-30 0.23 0.20 0.21 35  30-40 0.00 0.00 0.00 23  40-50 0.00 0.00 0.00 28  50-60 0.11 0.15 0.13 39  60-70 0.11 0.15 0.13 27  70-80 0.00 0.00 0.00 4  <20 0.40 0.11 0.18 35  Unknown 0.00 0.00 0.00 0  accuracy 0.11 191  macro avg 0.11 0.08 0.08 191 weighted avg 0.15 0.11 0.12 191,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.544 +/- 0.092 (in 3 folds) ROC-AUC (macro OvO): 0.539 +/- 0.095 (in 3 folds) au-PRC (weighted OvO): 0.607 +/- 0.062 (in 3 folds) au-PRC (macro OvO): 0.604 +/- 0.056 (in 3 folds) Accuracy: 0.210 +/- 0.054 (in 3 folds) MCC: 0.081 +/- 0.100 (in 3 folds) Global scores without abstention: Accuracy: 0.216 MCC: 0.065 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.146 +/- 0.126 (in 3 folds) MCC: 0.068 +/- 0.112 (in 3 folds) Unknown/abstention proportion: 0.487 +/- 0.603 (in 2 folds) ROC-AUC (weighted OvO): 0.645 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.644 +/- 0.000 (in 1 folds) 
au-PRC (weighted OvO): 0.678 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.668 +/- 0.000 (in 1 folds) Global scores with abstention: Accuracy: 0.152 MCC: 0.035 Unknown/abstention proportion: 0.298 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  20-30 0.27 0.29 0.28 35  30-40 0.20 0.09 0.12 23  40-50 0.00 0.00 0.00 28  50-60 0.17 0.18 0.17 39  60-70 0.14 0.15 0.15 27  70-80 0.00 0.00 0.00 4  <20 0.35 0.17 0.23 35  Unknown 0.00 0.00 0.00 0  accuracy 0.15 191  macro avg 0.14 0.11 0.12 191 weighted avg 0.19 0.15 0.16 191,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.544 +/- 0.066 (in 3 folds) ROC-AUC (macro OvO): 0.541 +/- 0.070 (in 3 folds) au-PRC (weighted OvO): 0.600 +/- 0.053 (in 3 folds) au-PRC (macro OvO): 0.601 +/- 0.056 (in 3 folds) Accuracy: 0.201 +/- 0.010 (in 3 folds) MCC: 0.065 +/- 0.032 (in 3 folds) Global scores without abstention: Accuracy: 0.203 MCC: 0.052 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.168 +/- 0.055 (in 3 folds) MCC: 0.056 +/- 0.036 (in 3 folds) Unknown/abstention proportion: 0.254 +/- 0.262 (in 2 folds) ROC-AUC (weighted OvO): 0.619 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.621 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.648 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.649 +/- 0.000 (in 1 folds) Global scores with abstention: Accuracy: 0.168 MCC: 0.042 Unknown/abstention proportion: 0.173 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  20-30 0.30 0.17 0.22 35  30-40 0.07 0.04 0.05 23  40-50 0.18 0.14 0.16 28  50-60 0.35 0.33 0.34 39  60-70 0.15 0.22 0.18 27  70-80 0.00 0.00 0.00 4  <20 0.12 0.06 0.08 35  Unknown 0.00 0.00 0.00 0  accuracy 0.17 191  macro avg 0.15 0.12 0.13 191 weighted avg 0.20 0.17 0.18 191,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.544 +/- 0.066 (in 3 folds) ROC-AUC (macro OvO): 0.541 +/- 0.070 
(in 3 folds) au-PRC (weighted OvO): 0.600 +/- 0.053 (in 3 folds) au-PRC (macro OvO): 0.601 +/- 0.056 (in 3 folds) Accuracy: 0.200 +/- 0.048 (in 3 folds) MCC: 0.081 +/- 0.065 (in 3 folds) Global scores without abstention: Accuracy: 0.209 MCC: 0.050 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.172 +/- 0.081 (in 3 folds) MCC: 0.073 +/- 0.073 (in 3 folds) Unknown/abstention proportion: 0.254 +/- 0.262 (in 2 folds) ROC-AUC (weighted OvO): 0.619 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.621 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.648 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.649 +/- 0.000 (in 1 folds) Global scores with abstention: Accuracy: 0.173 MCC: 0.038 Unknown/abstention proportion: 0.173 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  20-30 0.28 0.29 0.28 35  30-40 0.00 0.00 0.00 23  40-50 0.00 0.00 0.00 28  50-60 0.14 0.13 0.14 39  60-70 0.16 0.33 0.22 27  70-80 0.00 0.00 0.00 4  <20 0.33 0.26 0.29 35  Unknown 0.00 0.00 0.00 0  accuracy 0.17 191  macro avg 0.11 0.13 0.12 191 weighted avg 0.16 0.17 0.16 191
,,,


ridge_cv,ridge_cv.decision_thresholds_tuned,xgboost,xgboost.decision_thresholds_tuned
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.537 +/- 0.015 (in 3 folds) ROC-AUC (macro OvO): 0.536 +/- 0.018 (in 3 folds) au-PRC (weighted OvO): 0.608 +/- 0.021 (in 3 folds) au-PRC (macro OvO): 0.614 +/- 0.025 (in 3 folds) Accuracy: 0.091 +/- 0.084 (in 3 folds) MCC: 0.000 +/- 0.000 (in 3 folds) Global scores without abstention: Accuracy: 0.108 MCC: -0.051 Per-fold scores with abstention (note that abstentions not included in probability-based scores): ROC-AUC (weighted OvO): 0.531 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.533 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.585 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.585 +/- 0.000 (in 1 folds) Accuracy: 0.045 +/- 0.055 (in 3 folds) MCC: -0.015 +/- 0.015 (in 3 folds) Unknown/abstention proportion: 0.867 +/- 0.066 (in 2 folds) Global scores with abstention: Accuracy: 0.047 MCC: -0.061 Unknown/abstention proportion: 0.565 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  20-30 0.00 0.00 0.00 35  30-40 0.00 0.00 0.00 23  40-50 0.00 0.00 0.00 28  50-60 0.12 0.23 0.15 39  60-70 0.00 0.00 0.00 27  70-80 0.00 0.00 0.00 4  <20 0.00 0.00 0.00 35  Unknown 0.00 0.00 0.00 0  accuracy 0.05 191  macro avg 0.01 0.03 0.02 191 weighted avg 0.02 0.05 0.03 191,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.537 +/- 0.015 (in 3 folds) ROC-AUC (macro OvO): 0.536 +/- 0.018 (in 3 folds) au-PRC (weighted OvO): 0.608 +/- 0.021 (in 3 folds) au-PRC (macro OvO): 0.614 +/- 0.025 (in 3 folds) Accuracy: 0.131 +/- 0.118 (in 3 folds) MCC: 0.039 +/- 0.068 (in 3 folds) Global scores without abstention: Accuracy: 0.205 MCC: 0.081 Per-fold scores with abstention (note that abstentions not included in probability-based scores): ROC-AUC (weighted OvO): 0.531 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.533 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.585 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.585 +/- 0.000 (in 1 folds) Accuracy: 0.086 +/- 0.124 (in 
3 folds) MCC: 0.025 +/- 0.081 (in 3 folds) Unknown/abstention proportion: 0.867 +/- 0.066 (in 2 folds) Global scores with abstention: Accuracy: 0.089 MCC: 0.008 Unknown/abstention proportion: 0.565 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  20-30 0.28 0.14 0.19 35  30-40 0.00 0.00 0.00 23  40-50 0.00 0.00 0.00 28  50-60 0.15 0.18 0.16 39  60-70 0.00 0.00 0.00 27  70-80 0.00 0.00 0.00 4  <20 0.50 0.14 0.22 35  Unknown 0.00 0.00 0.00 0  accuracy 0.09 191  macro avg 0.12 0.06 0.07 191 weighted avg 0.17 0.09 0.11 191,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.519 +/- 0.028 (in 3 folds) ROC-AUC (macro OvO): 0.519 +/- 0.034 (in 3 folds) au-PRC (weighted OvO): 0.577 +/- 0.019 (in 3 folds) au-PRC (macro OvO): 0.578 +/- 0.029 (in 3 folds) Accuracy: 0.191 +/- 0.060 (in 3 folds) MCC: 0.048 +/- 0.065 (in 3 folds) Global scores without abstention: Accuracy: 0.172 MCC: 0.005 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.116 +/- 0.069 (in 3 folds) MCC: 0.019 +/- 0.029 (in 3 folds) Unknown/abstention proportion: 0.317 +/- 0.437 (in 3 folds) Global scores with abstention: Accuracy: 0.115 MCC: 0.003 Unknown/abstention proportion: 0.330 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  20-30 0.19 0.11 0.14 35  30-40 0.00 0.00 0.00 23  40-50 0.19 0.18 0.19 28  50-60 0.14 0.10 0.12 39  60-70 0.33 0.11 0.17 27  70-80 0.00 0.00 0.00 4  <20 0.25 0.17 0.20 35  Unknown 0.00 0.00 0.00 0  accuracy 0.12 191  macro avg 0.14 0.08 0.10 191 weighted avg 0.19 0.12 0.14 191,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.519 +/- 0.028 (in 3 folds) ROC-AUC (macro OvO): 0.519 +/- 0.034 (in 3 folds) au-PRC (weighted OvO): 0.577 +/- 0.019 (in 3 folds) au-PRC (macro OvO): 0.578 +/- 0.029 (in 3 folds) Accuracy: 0.197 +/- 0.120 (in 3 folds) MCC: 0.048 +/- 0.105 (in 3 folds) Global scores 
without abstention: Accuracy: 0.148 MCC: -0.023 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.100 +/- 0.038 (in 3 folds) MCC: 0.014 +/- 0.039 (in 3 folds) Unknown/abstention proportion: 0.317 +/- 0.437 (in 3 folds) Global scores with abstention: Accuracy: 0.099 MCC: -0.018 Unknown/abstention proportion: 0.330 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  20-30 0.00 0.00 0.00 35  30-40 0.00 0.00 0.00 23  40-50 0.20 0.04 0.06 28  50-60 0.09 0.08 0.08 39  60-70 0.38 0.11 0.17 27  70-80 0.00 0.00 0.00 4  <20 0.25 0.34 0.29 35  Unknown 0.00 0.00 0.00 0  accuracy 0.10 191  macro avg 0.11 0.07 0.08 191 weighted avg 0.15 0.10 0.10 191
,,,


rf_multiclass,rf_multiclass.decision_thresholds_tuned
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.516 +/- 0.040 (in 3 folds) ROC-AUC (macro OvO): 0.512 +/- 0.044 (in 3 folds) au-PRC (weighted OvO): 0.561 +/- 0.028 (in 3 folds) au-PRC (macro OvO): 0.560 +/- 0.033 (in 3 folds) Accuracy: 0.139 +/- 0.045 (in 3 folds) MCC: -0.030 +/- 0.027 (in 3 folds) Global scores without abstention: Accuracy: 0.139 MCC: -0.069 Per-fold scores with abstention (note that abstentions not included in probability-based scores): ROC-AUC (weighted OvO): 0.531 +/- 0.042 (in 2 folds) ROC-AUC (macro OvO): 0.531 +/- 0.041 (in 2 folds) au-PRC (weighted OvO): 0.574 +/- 0.023 (in 2 folds) au-PRC (macro OvO): 0.576 +/- 0.023 (in 2 folds) Accuracy: 0.136 +/- 0.044 (in 3 folds) MCC: -0.029 +/- 0.028 (in 3 folds) Unknown/abstention proportion: 0.069 +/- 0.000 (in 1 folds) Global scores with abstention: Accuracy: 0.136 MCC: -0.067 Unknown/abstention proportion: 0.021 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  20-30 0.14 0.06 0.08 35  30-40 0.00 0.00 0.00 23  40-50 0.13 0.07 0.09 28  50-60 0.16 0.49 0.24 39  60-70 0.07 0.04 0.05 27  70-80 0.00 0.00 0.00 4  <20 0.11 0.06 0.08 35  Unknown 0.00 0.00 0.00 0  accuracy 0.14 191  macro avg 0.08 0.09 0.07 191 weighted avg 0.11 0.14 0.10 191,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.516 +/- 0.040 (in 3 folds) ROC-AUC (macro OvO): 0.512 +/- 0.044 (in 3 folds) au-PRC (weighted OvO): 0.561 +/- 0.028 (in 3 folds) au-PRC (macro OvO): 0.560 +/- 0.033 (in 3 folds) Accuracy: 0.172 +/- 0.090 (in 3 folds) MCC: 0.022 +/- 0.073 (in 3 folds) Global scores without abstention: Accuracy: 0.171 MCC: 0.005 Per-fold scores with abstention (note that abstentions not included in probability-based scores): ROC-AUC (weighted OvO): 0.531 +/- 0.042 (in 2 folds) ROC-AUC (macro OvO): 0.531 +/- 0.041 (in 2 folds) au-PRC (weighted OvO): 0.574 +/- 0.023 (in 2 folds) au-PRC (macro OvO): 0.576 +/- 0.023 (in 2 folds) Accuracy: 0.167 +/- 0.089 (in 
3 folds) MCC: 0.024 +/- 0.073 (in 3 folds) Unknown/abstention proportion: 0.069 +/- 0.000 (in 1 folds) Global scores with abstention: Accuracy: 0.168 MCC: 0.004 Unknown/abstention proportion: 0.021 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  20-30 0.19 0.17 0.18 35  30-40 0.12 0.09 0.10 23  40-50 0.00 0.00 0.00 28  50-60 0.07 0.08 0.07 39  60-70 0.15 0.15 0.15 27  70-80 0.00 0.00 0.00 4  <20 0.30 0.49 0.37 35  Unknown 0.00 0.00 0.00 0  accuracy 0.17 191  macro avg 0.10 0.12 0.11 191 weighted avg 0.14 0.17 0.15 191
,


---

# GeneLocus.BCR, TargetObsColumnEnum.age_group_binary_healthy_only trained on train_smaller set

## Specimen predictions on validation set

Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,Accuracy per fold with abstention,MCC per fold with abstention,Unknown/abstention proportion per fold with abstention,Accuracy global with abstention,MCC global with abstention,Unknown/abstention proportion global with abstention,Abstention label global with abstention,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes,ROC-AUC (weighted OvO) per fold with abstention,ROC-AUC (macro OvO) per fold with abstention,au-PRC (weighted OvO) per fold with abstention,au-PRC (macro OvO) per fold with abstention
xgboost,0.667 +/- 0.110 (in 3 folds),0.667 +/- 0.110 (in 3 folds),0.778 +/- 0.105 (in 3 folds),0.778 +/- 0.105 (in 3 folds),0.679 +/- 0.057 (in 3 folds),0.314 +/- 0.119 (in 3 folds),0.673,0.264,0.513 +/- 0.150 (in 3 folds),0.205 +/- 0.036 (in 3 folds),0.354 +/- 0.190 (in 2 folds),0.515,0.168,0.235,Unknown,101.0,31.0,132.0,0.234848,False,0.563 +/- 0.000 (in 1 folds),0.563 +/- 0.000 (in 1 folds),0.657 +/- 0.000 (in 1 folds),0.657 +/- 0.000 (in 1 folds)
rf_multiclass,0.616 +/- 0.156 (in 3 folds),0.616 +/- 0.156 (in 3 folds),0.756 +/- 0.062 (in 3 folds),0.756 +/- 0.062 (in 3 folds),0.674 +/- 0.065 (in 3 folds),0.252 +/- 0.196 (in 3 folds),0.664,0.212,0.554 +/- 0.156 (in 3 folds),0.168 +/- 0.095 (in 3 folds),0.489 +/- 0.000 (in 1 folds),0.553,0.153,0.167,Unknown,110.0,22.0,132.0,0.166667,False,0.543 +/- 0.129 (in 2 folds),0.543 +/- 0.129 (in 2 folds),0.720 +/- 0.009 (in 2 folds),0.720 +/- 0.009 (in 2 folds)
lasso_cv,0.608 +/- 0.106 (in 3 folds),0.608 +/- 0.106 (in 3 folds),0.736 +/- 0.129 (in 3 folds),0.736 +/- 0.129 (in 3 folds),0.538 +/- 0.116 (in 3 folds),0.115 +/- 0.099 (in 3 folds),0.565,0.11,0.367 +/- 0.190 (in 3 folds),0.080 +/- 0.043 (in 3 folds),0.350 +/- 0.243 (in 3 folds),0.364,0.061,0.356,Unknown,85.0,47.0,132.0,0.356061,False,,,,
lasso_multiclass,0.597 +/- 0.115 (in 3 folds),0.597 +/- 0.115 (in 3 folds),0.749 +/- 0.105 (in 3 folds),0.749 +/- 0.105 (in 3 folds),0.640 +/- 0.051 (in 3 folds),0.233 +/- 0.106 (in 3 folds),0.64,0.206,0.550 +/- 0.084 (in 3 folds),0.175 +/- 0.055 (in 3 folds),0.210 +/- 0.014 (in 2 folds),0.553,0.154,0.136,Unknown,114.0,18.0,132.0,0.136364,False,0.466 +/- 0.000 (in 1 folds),0.466 +/- 0.000 (in 1 folds),0.637 +/- 0.000 (in 1 folds),0.637 +/- 0.000 (in 1 folds)
linearsvm_ovr,0.596 +/- 0.117 (in 3 folds),0.596 +/- 0.117 (in 3 folds),0.747 +/- 0.108 (in 3 folds),0.747 +/- 0.108 (in 3 folds),0.647 +/- 0.051 (in 3 folds),0.249 +/- 0.087 (in 3 folds),0.649,0.221,0.557 +/- 0.094 (in 3 folds),0.191 +/- 0.047 (in 3 folds),0.210 +/- 0.014 (in 2 folds),0.561,0.164,0.136,Unknown,114.0,18.0,132.0,0.136364,False,0.461 +/- 0.000 (in 1 folds),0.461 +/- 0.000 (in 1 folds),0.631 +/- 0.000 (in 1 folds),0.631 +/- 0.000 (in 1 folds)
dummy_stratified,0.584 +/- 0.016 (in 3 folds),0.584 +/- 0.016 (in 3 folds),0.728 +/- 0.120 (in 3 folds),0.728 +/- 0.120 (in 3 folds),0.502 +/- 0.148 (in 3 folds),0.168 +/- 0.030 (in 3 folds),0.573,0.119,0.315 +/- 0.281 (in 3 folds),0.070 +/- 0.073 (in 3 folds),0.671 +/- 0.258 (in 2 folds),0.326,0.057,0.432,Unknown,75.0,57.0,132.0,0.431818,False,0.568 +/- 0.000 (in 1 folds),0.568 +/- 0.000 (in 1 folds),0.664 +/- 0.000 (in 1 folds),0.664 +/- 0.000 (in 1 folds)
elasticnet_cv,0.514 +/- 0.039 (in 3 folds),0.514 +/- 0.039 (in 3 folds),0.638 +/- 0.118 (in 3 folds),0.638 +/- 0.118 (in 3 folds),0.433 +/- 0.019 (in 3 folds),0.089 +/- 0.155 (in 3 folds),0.435,0.202,0.208 +/- 0.094 (in 3 folds),0.086 +/- 0.081 (in 3 folds),0.523 +/- 0.199 (in 3 folds),0.205,0.072,0.53,Unknown,62.0,70.0,132.0,0.530303,False,,,,
dummy_most_frequent,0.500 +/- 0.000 (in 3 folds),0.500 +/- 0.000 (in 3 folds),0.613 +/- 0.067 (in 3 folds),0.613 +/- 0.067 (in 3 folds),0.387 +/- 0.067 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.371,0.0,0.176 +/- 0.038 (in 3 folds),0.051 +/- 0.021 (in 3 folds),0.523 +/- 0.199 (in 3 folds),0.174,0.03,0.53,Unknown,62.0,70.0,132.0,0.530303,True,,,,
ridge_cv,0.495 +/- 0.009 (in 3 folds),0.495 +/- 0.009 (in 3 folds),0.610 +/- 0.071 (in 3 folds),0.610 +/- 0.071 (in 3 folds),0.387 +/- 0.067 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.371,0.0,0.176 +/- 0.038 (in 3 folds),0.051 +/- 0.021 (in 3 folds),0.523 +/- 0.199 (in 3 folds),0.174,0.03,0.53,Unknown,62.0,70.0,132.0,0.530303,True,,,,
"All results, sorted",,,,,,,,,,,,,,,,,,,,,,,,

Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,Accuracy per fold with abstention,MCC per fold with abstention,Unknown/abstention proportion per fold with abstention,Accuracy global with abstention,MCC global with abstention,Unknown/abstention proportion global with abstention,Abstention label global with abstention,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes,ROC-AUC (weighted OvO) per fold with abstention,ROC-AUC (macro OvO) per fold with abstention,au-PRC (weighted OvO) per fold with abstention,au-PRC (macro OvO) per fold with abstention
xgboost,0.667 +/- 0.110 (in 3 folds),0.667 +/- 0.110 (in 3 folds),0.778 +/- 0.105 (in 3 folds),0.778 +/- 0.105 (in 3 folds),0.679 +/- 0.057 (in 3 folds),0.314 +/- 0.119 (in 3 folds),0.673,0.264,0.513 +/- 0.150 (in 3 folds),0.205 +/- 0.036 (in 3 folds),0.354 +/- 0.190 (in 2 folds),0.515,0.168,0.235,Unknown,101,31,132,0.234848,False,0.563 +/- 0.000 (in 1 folds),0.563 +/- 0.000 (in 1 folds),0.657 +/- 0.000 (in 1 folds),0.657 +/- 0.000 (in 1 folds)
rf_multiclass,0.616 +/- 0.156 (in 3 folds),0.616 +/- 0.156 (in 3 folds),0.756 +/- 0.062 (in 3 folds),0.756 +/- 0.062 (in 3 folds),0.674 +/- 0.065 (in 3 folds),0.252 +/- 0.196 (in 3 folds),0.664,0.212,0.554 +/- 0.156 (in 3 folds),0.168 +/- 0.095 (in 3 folds),0.489 +/- 0.000 (in 1 folds),0.553,0.153,0.167,Unknown,110,22,132,0.166667,False,0.543 +/- 0.129 (in 2 folds),0.543 +/- 0.129 (in 2 folds),0.720 +/- 0.009 (in 2 folds),0.720 +/- 0.009 (in 2 folds)
lasso_cv,0.608 +/- 0.106 (in 3 folds),0.608 +/- 0.106 (in 3 folds),0.736 +/- 0.129 (in 3 folds),0.736 +/- 0.129 (in 3 folds),0.538 +/- 0.116 (in 3 folds),0.115 +/- 0.099 (in 3 folds),0.565,0.11,0.367 +/- 0.190 (in 3 folds),0.080 +/- 0.043 (in 3 folds),0.350 +/- 0.243 (in 3 folds),0.364,0.061,0.356,Unknown,85,47,132,0.356061,False,,,,
lasso_multiclass,0.597 +/- 0.115 (in 3 folds),0.597 +/- 0.115 (in 3 folds),0.749 +/- 0.105 (in 3 folds),0.749 +/- 0.105 (in 3 folds),0.640 +/- 0.051 (in 3 folds),0.233 +/- 0.106 (in 3 folds),0.64,0.206,0.550 +/- 0.084 (in 3 folds),0.175 +/- 0.055 (in 3 folds),0.210 +/- 0.014 (in 2 folds),0.553,0.154,0.136,Unknown,114,18,132,0.136364,False,0.466 +/- 0.000 (in 1 folds),0.466 +/- 0.000 (in 1 folds),0.637 +/- 0.000 (in 1 folds),0.637 +/- 0.000 (in 1 folds)
linearsvm_ovr,0.596 +/- 0.117 (in 3 folds),0.596 +/- 0.117 (in 3 folds),0.747 +/- 0.108 (in 3 folds),0.747 +/- 0.108 (in 3 folds),0.647 +/- 0.051 (in 3 folds),0.249 +/- 0.087 (in 3 folds),0.649,0.221,0.557 +/- 0.094 (in 3 folds),0.191 +/- 0.047 (in 3 folds),0.210 +/- 0.014 (in 2 folds),0.561,0.164,0.136,Unknown,114,18,132,0.136364,False,0.461 +/- 0.000 (in 1 folds),0.461 +/- 0.000 (in 1 folds),0.631 +/- 0.000 (in 1 folds),0.631 +/- 0.000 (in 1 folds)
dummy_stratified,0.584 +/- 0.016 (in 3 folds),0.584 +/- 0.016 (in 3 folds),0.728 +/- 0.120 (in 3 folds),0.728 +/- 0.120 (in 3 folds),0.502 +/- 0.148 (in 3 folds),0.168 +/- 0.030 (in 3 folds),0.573,0.119,0.315 +/- 0.281 (in 3 folds),0.070 +/- 0.073 (in 3 folds),0.671 +/- 0.258 (in 2 folds),0.326,0.057,0.432,Unknown,75,57,132,0.431818,False,0.568 +/- 0.000 (in 1 folds),0.568 +/- 0.000 (in 1 folds),0.664 +/- 0.000 (in 1 folds),0.664 +/- 0.000 (in 1 folds)
elasticnet_cv,0.514 +/- 0.039 (in 3 folds),0.514 +/- 0.039 (in 3 folds),0.638 +/- 0.118 (in 3 folds),0.638 +/- 0.118 (in 3 folds),0.433 +/- 0.019 (in 3 folds),0.089 +/- 0.155 (in 3 folds),0.435,0.202,0.208 +/- 0.094 (in 3 folds),0.086 +/- 0.081 (in 3 folds),0.523 +/- 0.199 (in 3 folds),0.205,0.072,0.53,Unknown,62,70,132,0.530303,False,,,,
dummy_most_frequent,0.500 +/- 0.000 (in 3 folds),0.500 +/- 0.000 (in 3 folds),0.613 +/- 0.067 (in 3 folds),0.613 +/- 0.067 (in 3 folds),0.387 +/- 0.067 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.371,0.0,0.176 +/- 0.038 (in 3 folds),0.051 +/- 0.021 (in 3 folds),0.523 +/- 0.199 (in 3 folds),0.174,0.03,0.53,Unknown,62,70,132,0.530303,True,,,,
ridge_cv,0.495 +/- 0.009 (in 3 folds),0.495 +/- 0.009 (in 3 folds),0.610 +/- 0.071 (in 3 folds),0.610 +/- 0.071 (in 3 folds),0.387 +/- 0.067 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.371,0.0,0.176 +/- 0.038 (in 3 folds),0.051 +/- 0.021 (in 3 folds),0.523 +/- 0.199 (in 3 folds),0.174,0.03,0.53,Unknown,62,70,132,0.530303,True,,,,


xgboost,rf_multiclass,lasso_cv,lasso_multiclass
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.667 +/- 0.110 (in 3 folds) ROC-AUC (macro OvO): 0.667 +/- 0.110 (in 3 folds) au-PRC (weighted OvO): 0.778 +/- 0.105 (in 3 folds) au-PRC (macro OvO): 0.778 +/- 0.105 (in 3 folds) Accuracy: 0.679 +/- 0.057 (in 3 folds) MCC: 0.314 +/- 0.119 (in 3 folds) Global scores without abstention: Accuracy: 0.673 MCC: 0.264 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.513 +/- 0.150 (in 3 folds) MCC: 0.205 +/- 0.036 (in 3 folds) Unknown/abstention proportion: 0.354 +/- 0.190 (in 2 folds) ROC-AUC (weighted OvO): 0.563 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.563 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.657 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.657 +/- 0.000 (in 1 folds) Global scores with abstention: Accuracy: 0.515 MCC: 0.168 Unknown/abstention proportion: 0.235 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  50+ 0.53 0.38 0.44 45  Unknown 0.00 0.00 0.00 0  under 50 0.74 0.59 0.65 87  accuracy 0.52 132  macro avg 0.42 0.32 0.37 132 weighted avg 0.67 0.52 0.58 132,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.616 +/- 0.156 (in 3 folds) ROC-AUC (macro OvO): 0.616 +/- 0.156 (in 3 folds) au-PRC (weighted OvO): 0.756 +/- 0.062 (in 3 folds) au-PRC (macro OvO): 0.756 +/- 0.062 (in 3 folds) Accuracy: 0.674 +/- 0.065 (in 3 folds) MCC: 0.252 +/- 0.196 (in 3 folds) Global scores without abstention: Accuracy: 0.664 MCC: 0.212 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.554 +/- 0.156 (in 3 folds) MCC: 0.168 +/- 0.095 (in 3 folds) Unknown/abstention proportion: 0.489 +/- 0.000 (in 1 folds) ROC-AUC (weighted OvO): 0.543 +/- 0.129 (in 2 folds) ROC-AUC (macro OvO): 0.543 +/- 0.129 (in 2 folds) au-PRC (weighted OvO): 0.720 +/- 0.009 (in 2 folds) au-PRC (macro OvO): 0.720 +/- 0.009 (in 2 folds) Global scores with 
abstention: Accuracy: 0.553 MCC: 0.153 Unknown/abstention proportion: 0.167 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  50+ 0.50 0.33 0.40 45  Unknown 0.00 0.00 0.00 0  under 50 0.72 0.67 0.69 87  accuracy 0.55 132  macro avg 0.41 0.33 0.36 132 weighted avg 0.65 0.55 0.59 132,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.608 +/- 0.106 (in 3 folds) ROC-AUC (macro OvO): 0.608 +/- 0.106 (in 3 folds) au-PRC (weighted OvO): 0.736 +/- 0.129 (in 3 folds) au-PRC (macro OvO): 0.736 +/- 0.129 (in 3 folds) Accuracy: 0.538 +/- 0.116 (in 3 folds) MCC: 0.115 +/- 0.099 (in 3 folds) Global scores without abstention: Accuracy: 0.565 MCC: 0.110 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.367 +/- 0.190 (in 3 folds) MCC: 0.080 +/- 0.043 (in 3 folds) Unknown/abstention proportion: 0.350 +/- 0.243 (in 3 folds) Global scores with abstention: Accuracy: 0.364 MCC: 0.061 Unknown/abstention proportion: 0.356 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  50+ 0.41 0.36 0.38 45  Unknown 0.00 0.00 0.00 0  under 50 0.70 0.37 0.48 87  accuracy 0.36 132  macro avg 0.37 0.24 0.29 132 weighted avg 0.60 0.36 0.45 132,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.597 +/- 0.115 (in 3 folds) ROC-AUC (macro OvO): 0.597 +/- 0.115 (in 3 folds) au-PRC (weighted OvO): 0.749 +/- 0.105 (in 3 folds) au-PRC (macro OvO): 0.749 +/- 0.105 (in 3 folds) Accuracy: 0.640 +/- 0.051 (in 3 folds) MCC: 0.233 +/- 0.106 (in 3 folds) Global scores without abstention: Accuracy: 0.640 MCC: 0.206 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.550 +/- 0.084 (in 3 folds) MCC: 0.175 +/- 0.055 (in 3 folds) Unknown/abstention proportion: 0.210 +/- 0.014 (in 2 folds) ROC-AUC (weighted OvO): 0.466 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.466 +/- 
0.000 (in 1 folds) au-PRC (weighted OvO): 0.637 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.637 +/- 0.000 (in 1 folds) Global scores with abstention: Accuracy: 0.553 MCC: 0.154 Unknown/abstention proportion: 0.136 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  50+ 0.49 0.42 0.45 45  Unknown 0.00 0.00 0.00 0  under 50 0.72 0.62 0.67 87  accuracy 0.55 132  macro avg 0.40 0.35 0.37 132 weighted avg 0.64 0.55 0.59 132
,,,


linearsvm_ovr,dummy_stratified,elasticnet_cv,dummy_most_frequent
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.596 +/- 0.117 (in 3 folds) ROC-AUC (macro OvO): 0.596 +/- 0.117 (in 3 folds) au-PRC (weighted OvO): 0.747 +/- 0.108 (in 3 folds) au-PRC (macro OvO): 0.747 +/- 0.108 (in 3 folds) Accuracy: 0.647 +/- 0.051 (in 3 folds) MCC: 0.249 +/- 0.087 (in 3 folds) Global scores without abstention: Accuracy: 0.649 MCC: 0.221 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.557 +/- 0.094 (in 3 folds) MCC: 0.191 +/- 0.047 (in 3 folds) Unknown/abstention proportion: 0.210 +/- 0.014 (in 2 folds) ROC-AUC (weighted OvO): 0.461 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.461 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.631 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.631 +/- 0.000 (in 1 folds) Global scores with abstention: Accuracy: 0.561 MCC: 0.164 Unknown/abstention proportion: 0.136 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  50+ 0.50 0.42 0.46 45  Unknown 0.00 0.00 0.00 0  under 50 0.72 0.63 0.67 87  accuracy 0.56 132  macro avg 0.41 0.35 0.38 132 weighted avg 0.65 0.56 0.60 132,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.584 +/- 0.016 (in 3 folds) ROC-AUC (macro OvO): 0.584 +/- 0.016 (in 3 folds) au-PRC (weighted OvO): 0.728 +/- 0.120 (in 3 folds) au-PRC (macro OvO): 0.728 +/- 0.120 (in 3 folds) Accuracy: 0.502 +/- 0.148 (in 3 folds) MCC: 0.168 +/- 0.030 (in 3 folds) Global scores without abstention: Accuracy: 0.573 MCC: 0.119 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.315 +/- 0.281 (in 3 folds) MCC: 0.070 +/- 0.073 (in 3 folds) Unknown/abstention proportion: 0.671 +/- 0.258 (in 2 folds) ROC-AUC (weighted OvO): 0.568 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.568 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.664 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.664 +/- 0.000 (in 1 folds) Global scores with 
abstention: Accuracy: 0.326 MCC: 0.057 Unknown/abstention proportion: 0.432 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  50+ 0.42 0.31 0.36 45  Unknown 0.00 0.00 0.00 0  under 50 0.69 0.33 0.45 87  accuracy 0.33 132  macro avg 0.37 0.21 0.27 132 weighted avg 0.60 0.33 0.42 132,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.514 +/- 0.039 (in 3 folds) ROC-AUC (macro OvO): 0.514 +/- 0.039 (in 3 folds) au-PRC (weighted OvO): 0.638 +/- 0.118 (in 3 folds) au-PRC (macro OvO): 0.638 +/- 0.118 (in 3 folds) Accuracy: 0.433 +/- 0.019 (in 3 folds) MCC: 0.089 +/- 0.155 (in 3 folds) Global scores without abstention: Accuracy: 0.435 MCC: 0.202 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.208 +/- 0.094 (in 3 folds) MCC: 0.086 +/- 0.081 (in 3 folds) Unknown/abstention proportion: 0.523 +/- 0.199 (in 3 folds) Global scores with abstention: Accuracy: 0.205 MCC: 0.072 Unknown/abstention proportion: 0.530 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  50+ 0.40 0.51 0.45 45  Unknown 0.00 0.00 0.00 0  under 50 1.00 0.05 0.09 87  accuracy 0.20 132  macro avg 0.47 0.19 0.18 132 weighted avg 0.79 0.20 0.21 132,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.500 +/- 0.000 (in 3 folds) ROC-AUC (macro OvO): 0.500 +/- 0.000 (in 3 folds) au-PRC (weighted OvO): 0.613 +/- 0.067 (in 3 folds) au-PRC (macro OvO): 0.613 +/- 0.067 (in 3 folds) Accuracy: 0.387 +/- 0.067 (in 3 folds) MCC: 0.000 +/- 0.000 (in 3 folds) Global scores without abstention: Accuracy: 0.371 MCC: 0.000 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.176 +/- 0.038 (in 3 folds) MCC: 0.051 +/- 0.021 (in 3 folds) Unknown/abstention proportion: 0.523 +/- 0.199 (in 3 folds) Global scores with abstention: Accuracy: 0.174 MCC: 0.030 Unknown/abstention proportion: 
0.530 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  50+ 0.37 0.51 0.43 45  Unknown 0.00 0.00 0.00 0  under 50 0.00 0.00 0.00 87  accuracy 0.17 132  macro avg 0.12 0.17 0.14 132 weighted avg 0.13 0.17 0.15 132
,,,


ridge_cv
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.495 +/- 0.009 (in 3 folds) ROC-AUC (macro OvO): 0.495 +/- 0.009 (in 3 folds) au-PRC (weighted OvO): 0.610 +/- 0.071 (in 3 folds) au-PRC (macro OvO): 0.610 +/- 0.071 (in 3 folds) Accuracy: 0.387 +/- 0.067 (in 3 folds) MCC: 0.000 +/- 0.000 (in 3 folds) Global scores without abstention: Accuracy: 0.371 MCC: 0.000 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.176 +/- 0.038 (in 3 folds) MCC: 0.051 +/- 0.021 (in 3 folds) Unknown/abstention proportion: 0.523 +/- 0.199 (in 3 folds) Global scores with abstention: Accuracy: 0.174 MCC: 0.030 Unknown/abstention proportion: 0.530 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  50+ 0.37 0.51 0.43 45  Unknown 0.00 0.00 0.00 0  under 50 0.00 0.00 0.00 87  accuracy 0.17 132  macro avg 0.12 0.17 0.14 132 weighted avg 0.13 0.17 0.15 132


## Apply train-smaller model -- Test set performance - With and without tuning on validation set

Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,Accuracy per fold with abstention,MCC per fold with abstention,Unknown/abstention proportion per fold with abstention,Accuracy global with abstention,MCC global with abstention,Unknown/abstention proportion global with abstention,Abstention label global with abstention,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
rf_multiclass,0.608 +/- 0.048 (in 3 folds),0.608 +/- 0.048 (in 3 folds),0.701 +/- 0.111 (in 3 folds),0.701 +/- 0.111 (in 3 folds),0.602 +/- 0.027 (in 3 folds),0.159 +/- 0.028 (in 3 folds),0.605,0.142,0.532 +/- 0.126 (in 3 folds),0.133 +/- 0.052 (in 3 folds),0.120 +/- 0.180 (in 3 folds),0.529,0.109,0.126,Unknown,167.0,24.0,191.0,0.125654,False
rf_multiclass.decision_thresholds_tuned,0.608 +/- 0.048 (in 3 folds),0.608 +/- 0.048 (in 3 folds),0.701 +/- 0.111 (in 3 folds),0.701 +/- 0.111 (in 3 folds),0.608 +/- 0.027 (in 3 folds),0.167 +/- 0.047 (in 3 folds),0.611,0.142,0.538 +/- 0.130 (in 3 folds),0.140 +/- 0.062 (in 3 folds),0.120 +/- 0.180 (in 3 folds),0.534,0.107,0.126,Unknown,167.0,24.0,191.0,0.125654,False
xgboost,0.607 +/- 0.069 (in 3 folds),0.607 +/- 0.069 (in 3 folds),0.698 +/- 0.112 (in 3 folds),0.698 +/- 0.112 (in 3 folds),0.581 +/- 0.004 (in 3 folds),0.172 +/- 0.072 (in 3 folds),0.581,0.137,0.476 +/- 0.091 (in 3 folds),0.128 +/- 0.058 (in 3 folds),0.181 +/- 0.156 (in 3 folds),0.471,0.096,0.188,Unknown,155.0,36.0,191.0,0.188482,False
xgboost.decision_thresholds_tuned,0.607 +/- 0.069 (in 3 folds),0.607 +/- 0.069 (in 3 folds),0.698 +/- 0.112 (in 3 folds),0.698 +/- 0.112 (in 3 folds),0.549 +/- 0.067 (in 3 folds),0.173 +/- 0.046 (in 3 folds),0.548,0.098,0.451 +/- 0.117 (in 3 folds),0.130 +/- 0.048 (in 3 folds),0.181 +/- 0.156 (in 3 folds),0.445,0.071,0.188,Unknown,155.0,36.0,191.0,0.188482,False
lasso_cv,0.598 +/- 0.100 (in 3 folds),0.598 +/- 0.100 (in 3 folds),0.704 +/- 0.124 (in 3 folds),0.704 +/- 0.124 (in 3 folds),0.531 +/- 0.082 (in 3 folds),0.048 +/- 0.135 (in 3 folds),0.56,0.086,0.356 +/- 0.205 (in 3 folds),0.029 +/- 0.106 (in 3 folds),0.362 +/- 0.314 (in 3 folds),0.366,0.049,0.346,Unknown,125.0,66.0,191.0,0.34555,False
lasso_cv.decision_thresholds_tuned,0.598 +/- 0.100 (in 3 folds),0.598 +/- 0.100 (in 3 folds),0.704 +/- 0.124 (in 3 folds),0.704 +/- 0.124 (in 3 folds),0.541 +/- 0.062 (in 3 folds),0.118 +/- 0.110 (in 3 folds),0.536,0.096,0.342 +/- 0.172 (in 3 folds),0.088 +/- 0.076 (in 3 folds),0.362 +/- 0.314 (in 3 folds),0.351,0.054,0.346,Unknown,125.0,66.0,191.0,0.34555,False
elasticnet_cv,0.576 +/- 0.083 (in 3 folds),0.576 +/- 0.083 (in 3 folds),0.653 +/- 0.082 (in 3 folds),0.653 +/- 0.082 (in 3 folds),0.400 +/- 0.040 (in 3 folds),0.009 +/- 0.015 (in 3 folds),0.396,0.019,0.186 +/- 0.089 (in 3 folds),0.035 +/- 0.056 (in 3 folds),0.531 +/- 0.223 (in 3 folds),0.188,0.02,0.524,Unknown,91.0,100.0,191.0,0.52356,False
elasticnet_cv.decision_thresholds_tuned,0.576 +/- 0.083 (in 3 folds),0.576 +/- 0.083 (in 3 folds),0.653 +/- 0.082 (in 3 folds),0.653 +/- 0.082 (in 3 folds),0.537 +/- 0.121 (in 3 folds),0.036 +/- 0.042 (in 3 folds),0.505,0.014,0.237 +/- 0.072 (in 3 folds),0.038 +/- 0.053 (in 3 folds),0.531 +/- 0.223 (in 3 folds),0.241,0.006,0.524,Unknown,91.0,100.0,191.0,0.52356,False
linearsvm_ovr,0.573 +/- 0.073 (in 3 folds),0.573 +/- 0.073 (in 3 folds),0.680 +/- 0.116 (in 3 folds),0.680 +/- 0.116 (in 3 folds),0.583 +/- 0.043 (in 3 folds),0.152 +/- 0.086 (in 3 folds),0.584,0.13,0.513 +/- 0.096 (in 3 folds),0.127 +/- 0.093 (in 3 folds),0.126 +/- 0.096 (in 3 folds),0.508,0.097,0.131,Unknown,166.0,25.0,191.0,0.13089,False
linearsvm_ovr.decision_thresholds_tuned,0.573 +/- 0.073 (in 3 folds),0.573 +/- 0.073 (in 3 folds),0.680 +/- 0.116 (in 3 folds),0.680 +/- 0.116 (in 3 folds),0.535 +/- 0.055 (in 3 folds),0.091 +/- 0.005 (in 3 folds),0.536,0.024,0.469 +/- 0.087 (in 3 folds),0.067 +/- 0.012 (in 3 folds),0.126 +/- 0.096 (in 3 folds),0.466,0.012,0.131,Unknown,166.0,25.0,191.0,0.13089,False

Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,Accuracy per fold with abstention,MCC per fold with abstention,Unknown/abstention proportion per fold with abstention,Accuracy global with abstention,MCC global with abstention,Unknown/abstention proportion global with abstention,Abstention label global with abstention,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
rf_multiclass,0.608 +/- 0.048 (in 3 folds),0.608 +/- 0.048 (in 3 folds),0.701 +/- 0.111 (in 3 folds),0.701 +/- 0.111 (in 3 folds),0.602 +/- 0.027 (in 3 folds),0.159 +/- 0.028 (in 3 folds),0.605,0.142,0.532 +/- 0.126 (in 3 folds),0.133 +/- 0.052 (in 3 folds),0.120 +/- 0.180 (in 3 folds),0.529,0.109,0.126,Unknown,167,24,191,0.125654,False
rf_multiclass.decision_thresholds_tuned,0.608 +/- 0.048 (in 3 folds),0.608 +/- 0.048 (in 3 folds),0.701 +/- 0.111 (in 3 folds),0.701 +/- 0.111 (in 3 folds),0.608 +/- 0.027 (in 3 folds),0.167 +/- 0.047 (in 3 folds),0.611,0.142,0.538 +/- 0.130 (in 3 folds),0.140 +/- 0.062 (in 3 folds),0.120 +/- 0.180 (in 3 folds),0.534,0.107,0.126,Unknown,167,24,191,0.125654,False
xgboost,0.607 +/- 0.069 (in 3 folds),0.607 +/- 0.069 (in 3 folds),0.698 +/- 0.112 (in 3 folds),0.698 +/- 0.112 (in 3 folds),0.581 +/- 0.004 (in 3 folds),0.172 +/- 0.072 (in 3 folds),0.581,0.137,0.476 +/- 0.091 (in 3 folds),0.128 +/- 0.058 (in 3 folds),0.181 +/- 0.156 (in 3 folds),0.471,0.096,0.188,Unknown,155,36,191,0.188482,False
xgboost.decision_thresholds_tuned,0.607 +/- 0.069 (in 3 folds),0.607 +/- 0.069 (in 3 folds),0.698 +/- 0.112 (in 3 folds),0.698 +/- 0.112 (in 3 folds),0.549 +/- 0.067 (in 3 folds),0.173 +/- 0.046 (in 3 folds),0.548,0.098,0.451 +/- 0.117 (in 3 folds),0.130 +/- 0.048 (in 3 folds),0.181 +/- 0.156 (in 3 folds),0.445,0.071,0.188,Unknown,155,36,191,0.188482,False
lasso_cv,0.598 +/- 0.100 (in 3 folds),0.598 +/- 0.100 (in 3 folds),0.704 +/- 0.124 (in 3 folds),0.704 +/- 0.124 (in 3 folds),0.531 +/- 0.082 (in 3 folds),0.048 +/- 0.135 (in 3 folds),0.56,0.086,0.356 +/- 0.205 (in 3 folds),0.029 +/- 0.106 (in 3 folds),0.362 +/- 0.314 (in 3 folds),0.366,0.049,0.346,Unknown,125,66,191,0.34555,False
lasso_cv.decision_thresholds_tuned,0.598 +/- 0.100 (in 3 folds),0.598 +/- 0.100 (in 3 folds),0.704 +/- 0.124 (in 3 folds),0.704 +/- 0.124 (in 3 folds),0.541 +/- 0.062 (in 3 folds),0.118 +/- 0.110 (in 3 folds),0.536,0.096,0.342 +/- 0.172 (in 3 folds),0.088 +/- 0.076 (in 3 folds),0.362 +/- 0.314 (in 3 folds),0.351,0.054,0.346,Unknown,125,66,191,0.34555,False
elasticnet_cv,0.576 +/- 0.083 (in 3 folds),0.576 +/- 0.083 (in 3 folds),0.653 +/- 0.082 (in 3 folds),0.653 +/- 0.082 (in 3 folds),0.400 +/- 0.040 (in 3 folds),0.009 +/- 0.015 (in 3 folds),0.396,0.019,0.186 +/- 0.089 (in 3 folds),0.035 +/- 0.056 (in 3 folds),0.531 +/- 0.223 (in 3 folds),0.188,0.02,0.524,Unknown,91,100,191,0.52356,False
elasticnet_cv.decision_thresholds_tuned,0.576 +/- 0.083 (in 3 folds),0.576 +/- 0.083 (in 3 folds),0.653 +/- 0.082 (in 3 folds),0.653 +/- 0.082 (in 3 folds),0.537 +/- 0.121 (in 3 folds),0.036 +/- 0.042 (in 3 folds),0.505,0.014,0.237 +/- 0.072 (in 3 folds),0.038 +/- 0.053 (in 3 folds),0.531 +/- 0.223 (in 3 folds),0.241,0.006,0.524,Unknown,91,100,191,0.52356,False
linearsvm_ovr,0.573 +/- 0.073 (in 3 folds),0.573 +/- 0.073 (in 3 folds),0.680 +/- 0.116 (in 3 folds),0.680 +/- 0.116 (in 3 folds),0.583 +/- 0.043 (in 3 folds),0.152 +/- 0.086 (in 3 folds),0.584,0.13,0.513 +/- 0.096 (in 3 folds),0.127 +/- 0.093 (in 3 folds),0.126 +/- 0.096 (in 3 folds),0.508,0.097,0.131,Unknown,166,25,191,0.13089,False
linearsvm_ovr.decision_thresholds_tuned,0.573 +/- 0.073 (in 3 folds),0.573 +/- 0.073 (in 3 folds),0.680 +/- 0.116 (in 3 folds),0.680 +/- 0.116 (in 3 folds),0.535 +/- 0.055 (in 3 folds),0.091 +/- 0.005 (in 3 folds),0.536,0.024,0.469 +/- 0.087 (in 3 folds),0.067 +/- 0.012 (in 3 folds),0.126 +/- 0.096 (in 3 folds),0.466,0.012,0.131,Unknown,166,25,191,0.13089,False


rf_multiclass,rf_multiclass.decision_thresholds_tuned,xgboost,xgboost.decision_thresholds_tuned
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.608 +/- 0.048 (in 3 folds) ROC-AUC (macro OvO): 0.608 +/- 0.048 (in 3 folds) au-PRC (weighted OvO): 0.701 +/- 0.111 (in 3 folds) au-PRC (macro OvO): 0.701 +/- 0.111 (in 3 folds) Accuracy: 0.602 +/- 0.027 (in 3 folds) MCC: 0.159 +/- 0.028 (in 3 folds) Global scores without abstention: Accuracy: 0.605 MCC: 0.142 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.532 +/- 0.126 (in 3 folds) MCC: 0.133 +/- 0.052 (in 3 folds) Unknown/abstention proportion: 0.120 +/- 0.180 (in 3 folds) Global scores with abstention: Accuracy: 0.529 MCC: 0.109 Unknown/abstention proportion: 0.126 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  50+ 0.47 0.39 0.42 70  Unknown 0.00 0.00 0.00 0  under 50 0.68 0.61 0.64 121  accuracy 0.53 191  macro avg 0.38 0.33 0.36 191 weighted avg 0.60 0.53 0.56 191,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.608 +/- 0.048 (in 3 folds) ROC-AUC (macro OvO): 0.608 +/- 0.048 (in 3 folds) au-PRC (weighted OvO): 0.701 +/- 0.111 (in 3 folds) au-PRC (macro OvO): 0.701 +/- 0.111 (in 3 folds) Accuracy: 0.608 +/- 0.027 (in 3 folds) MCC: 0.167 +/- 0.047 (in 3 folds) Global scores without abstention: Accuracy: 0.611 MCC: 0.142 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.538 +/- 0.130 (in 3 folds) MCC: 0.140 +/- 0.062 (in 3 folds) Unknown/abstention proportion: 0.120 +/- 0.180 (in 3 folds) Global scores with abstention: Accuracy: 0.534 MCC: 0.107 Unknown/abstention proportion: 0.126 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  50+ 0.47 0.36 0.41 70  Unknown 0.00 0.00 0.00 0  under 50 0.68 0.64 0.66 121  accuracy 0.53 191  macro avg 0.38 0.33 0.35 191 weighted avg 0.60 0.53 0.56 191,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.607 
+/- 0.069 (in 3 folds) ROC-AUC (macro OvO): 0.607 +/- 0.069 (in 3 folds) au-PRC (weighted OvO): 0.698 +/- 0.112 (in 3 folds) au-PRC (macro OvO): 0.698 +/- 0.112 (in 3 folds) Accuracy: 0.581 +/- 0.004 (in 3 folds) MCC: 0.172 +/- 0.072 (in 3 folds) Global scores without abstention: Accuracy: 0.581 MCC: 0.137 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.476 +/- 0.091 (in 3 folds) MCC: 0.128 +/- 0.058 (in 3 folds) Unknown/abstention proportion: 0.181 +/- 0.156 (in 3 folds) Global scores with abstention: Accuracy: 0.471 MCC: 0.096 Unknown/abstention proportion: 0.188 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  50+ 0.46 0.44 0.45 70  Unknown 0.00 0.00 0.00 0  under 50 0.68 0.49 0.57 121  accuracy 0.47 191  macro avg 0.38 0.31 0.34 191 weighted avg 0.60 0.47 0.52 191,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.607 +/- 0.069 (in 3 folds) ROC-AUC (macro OvO): 0.607 +/- 0.069 (in 3 folds) au-PRC (weighted OvO): 0.698 +/- 0.112 (in 3 folds) au-PRC (macro OvO): 0.698 +/- 0.112 (in 3 folds) Accuracy: 0.549 +/- 0.067 (in 3 folds) MCC: 0.173 +/- 0.046 (in 3 folds) Global scores without abstention: Accuracy: 0.548 MCC: 0.098 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.451 +/- 0.117 (in 3 folds) MCC: 0.130 +/- 0.048 (in 3 folds) Unknown/abstention proportion: 0.181 +/- 0.156 (in 3 folds) Global scores with abstention: Accuracy: 0.445 MCC: 0.071 Unknown/abstention proportion: 0.188 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  50+ 0.43 0.47 0.45 70  Unknown 0.00 0.00 0.00 0  under 50 0.67 0.43 0.52 121  accuracy 0.45 191  macro avg 0.37 0.30 0.32 191 weighted avg 0.58 0.45 0.50 191
,,,


lasso_cv,lasso_cv.decision_thresholds_tuned,elasticnet_cv,elasticnet_cv.decision_thresholds_tuned
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.598 +/- 0.100 (in 3 folds) ROC-AUC (macro OvO): 0.598 +/- 0.100 (in 3 folds) au-PRC (weighted OvO): 0.704 +/- 0.124 (in 3 folds) au-PRC (macro OvO): 0.704 +/- 0.124 (in 3 folds) Accuracy: 0.531 +/- 0.082 (in 3 folds) MCC: 0.048 +/- 0.135 (in 3 folds) Global scores without abstention: Accuracy: 0.560 MCC: 0.086 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.356 +/- 0.205 (in 3 folds) MCC: 0.029 +/- 0.106 (in 3 folds) Unknown/abstention proportion: 0.362 +/- 0.314 (in 3 folds) Global scores with abstention: Accuracy: 0.366 MCC: 0.049 Unknown/abstention proportion: 0.346 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  50+ 0.41 0.31 0.35 70  Unknown 0.00 0.00 0.00 0  under 50 0.68 0.40 0.50 121  accuracy 0.37 191  macro avg 0.36 0.24 0.28 191 weighted avg 0.58 0.37 0.45 191,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.598 +/- 0.100 (in 3 folds) ROC-AUC (macro OvO): 0.598 +/- 0.100 (in 3 folds) au-PRC (weighted OvO): 0.704 +/- 0.124 (in 3 folds) au-PRC (macro OvO): 0.704 +/- 0.124 (in 3 folds) Accuracy: 0.541 +/- 0.062 (in 3 folds) MCC: 0.118 +/- 0.110 (in 3 folds) Global scores without abstention: Accuracy: 0.536 MCC: 0.096 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.342 +/- 0.172 (in 3 folds) MCC: 0.088 +/- 0.076 (in 3 folds) Unknown/abstention proportion: 0.362 +/- 0.314 (in 3 folds) Global scores with abstention: Accuracy: 0.351 MCC: 0.054 Unknown/abstention proportion: 0.346 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  50+ 0.40 0.39 0.39 70  Unknown 0.00 0.00 0.00 0  under 50 0.69 0.33 0.45 121  accuracy 0.35 191  macro avg 0.36 0.24 0.28 191 weighted avg 0.58 0.35 0.43 191,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.576 
+/- 0.083 (in 3 folds) ROC-AUC (macro OvO): 0.576 +/- 0.083 (in 3 folds) au-PRC (weighted OvO): 0.653 +/- 0.082 (in 3 folds) au-PRC (macro OvO): 0.653 +/- 0.082 (in 3 folds) Accuracy: 0.400 +/- 0.040 (in 3 folds) MCC: 0.009 +/- 0.015 (in 3 folds) Global scores without abstention: Accuracy: 0.396 MCC: 0.019 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.186 +/- 0.089 (in 3 folds) MCC: 0.035 +/- 0.056 (in 3 folds) Unknown/abstention proportion: 0.531 +/- 0.223 (in 3 folds) Global scores with abstention: Accuracy: 0.188 MCC: 0.020 Unknown/abstention proportion: 0.524 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  50+ 0.39 0.49 0.43 70  Unknown 0.00 0.00 0.00 0  under 50 0.67 0.02 0.03 121  accuracy 0.19 191  macro avg 0.35 0.17 0.15 191 weighted avg 0.56 0.19 0.18 191,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.576 +/- 0.083 (in 3 folds) ROC-AUC (macro OvO): 0.576 +/- 0.083 (in 3 folds) au-PRC (weighted OvO): 0.653 +/- 0.082 (in 3 folds) au-PRC (macro OvO): 0.653 +/- 0.082 (in 3 folds) Accuracy: 0.537 +/- 0.121 (in 3 folds) MCC: 0.036 +/- 0.042 (in 3 folds) Global scores without abstention: Accuracy: 0.505 MCC: 0.014 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.237 +/- 0.072 (in 3 folds) MCC: 0.038 +/- 0.053 (in 3 folds) Unknown/abstention proportion: 0.531 +/- 0.223 (in 3 folds) Global scores with abstention: Accuracy: 0.241 MCC: 0.006 Unknown/abstention proportion: 0.524 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  50+ 0.39 0.26 0.31 70  Unknown 0.00 0.00 0.00 0  under 50 0.62 0.23 0.34 121  accuracy 0.24 191  macro avg 0.34 0.16 0.22 191 weighted avg 0.54 0.24 0.33 191
,,,


linearsvm_ovr,linearsvm_ovr.decision_thresholds_tuned,lasso_multiclass,lasso_multiclass.decision_thresholds_tuned
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.573 +/- 0.073 (in 3 folds) ROC-AUC (macro OvO): 0.573 +/- 0.073 (in 3 folds) au-PRC (weighted OvO): 0.680 +/- 0.116 (in 3 folds) au-PRC (macro OvO): 0.680 +/- 0.116 (in 3 folds) Accuracy: 0.583 +/- 0.043 (in 3 folds) MCC: 0.152 +/- 0.086 (in 3 folds) Global scores without abstention: Accuracy: 0.584 MCC: 0.130 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.513 +/- 0.096 (in 3 folds) MCC: 0.127 +/- 0.093 (in 3 folds) Unknown/abstention proportion: 0.126 +/- 0.096 (in 3 folds) Global scores with abstention: Accuracy: 0.508 MCC: 0.097 Unknown/abstention proportion: 0.131 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  50+ 0.46 0.44 0.45 70  Unknown 0.00 0.00 0.00 0  under 50 0.67 0.55 0.60 121  accuracy 0.51 191  macro avg 0.38 0.33 0.35 191 weighted avg 0.59 0.51 0.55 191,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.573 +/- 0.073 (in 3 folds) ROC-AUC (macro OvO): 0.573 +/- 0.073 (in 3 folds) au-PRC (weighted OvO): 0.680 +/- 0.116 (in 3 folds) au-PRC (macro OvO): 0.680 +/- 0.116 (in 3 folds) Accuracy: 0.535 +/- 0.055 (in 3 folds) MCC: 0.091 +/- 0.005 (in 3 folds) Global scores without abstention: Accuracy: 0.536 MCC: 0.024 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.469 +/- 0.087 (in 3 folds) MCC: 0.067 +/- 0.012 (in 3 folds) Unknown/abstention proportion: 0.126 +/- 0.096 (in 3 folds) Global scores with abstention: Accuracy: 0.466 MCC: 0.012 Unknown/abstention proportion: 0.131 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  50+ 0.40 0.37 0.39 70  Unknown 0.00 0.00 0.00 0  under 50 0.62 0.52 0.57 121  accuracy 0.47 191  macro avg 0.34 0.30 0.32 191 weighted avg 0.54 0.47 0.50 191,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.572 
+/- 0.074 (in 3 folds) ROC-AUC (macro OvO): 0.572 +/- 0.074 (in 3 folds) au-PRC (weighted OvO): 0.680 +/- 0.116 (in 3 folds) au-PRC (macro OvO): 0.680 +/- 0.116 (in 3 folds) Accuracy: 0.578 +/- 0.034 (in 3 folds) MCC: 0.139 +/- 0.065 (in 3 folds) Global scores without abstention: Accuracy: 0.578 MCC: 0.120 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.507 +/- 0.086 (in 3 folds) MCC: 0.115 +/- 0.073 (in 3 folds) Unknown/abstention proportion: 0.126 +/- 0.096 (in 3 folds) Global scores with abstention: Accuracy: 0.503 MCC: 0.090 Unknown/abstention proportion: 0.131 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  50+ 0.46 0.44 0.45 70  Unknown 0.00 0.00 0.00 0  under 50 0.66 0.54 0.59 121  accuracy 0.50 191  macro avg 0.37 0.33 0.35 191 weighted avg 0.59 0.50 0.54 191,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.572 +/- 0.074 (in 3 folds) ROC-AUC (macro OvO): 0.572 +/- 0.074 (in 3 folds) au-PRC (weighted OvO): 0.680 +/- 0.116 (in 3 folds) au-PRC (macro OvO): 0.680 +/- 0.116 (in 3 folds) Accuracy: 0.535 +/- 0.055 (in 3 folds) MCC: 0.091 +/- 0.005 (in 3 folds) Global scores without abstention: Accuracy: 0.536 MCC: 0.024 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.469 +/- 0.087 (in 3 folds) MCC: 0.067 +/- 0.012 (in 3 folds) Unknown/abstention proportion: 0.126 +/- 0.096 (in 3 folds) Global scores with abstention: Accuracy: 0.466 MCC: 0.012 Unknown/abstention proportion: 0.131 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  50+ 0.40 0.37 0.39 70  Unknown 0.00 0.00 0.00 0  under 50 0.62 0.52 0.57 121  accuracy 0.47 191  macro avg 0.34 0.30 0.32 191 weighted avg 0.54 0.47 0.50 191
,,,


ridge_cv,ridge_cv.decision_thresholds_tuned
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.521 +/- 0.037 (in 3 folds) ROC-AUC (macro OvO): 0.521 +/- 0.037 (in 3 folds) au-PRC (weighted OvO): 0.618 +/- 0.056 (in 3 folds) au-PRC (macro OvO): 0.618 +/- 0.056 (in 3 folds) Accuracy: 0.393 +/- 0.041 (in 3 folds) MCC: 0.000 +/- 0.000 (in 3 folds) Global scores without abstention: Accuracy: 0.385 MCC: 0.000 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.181 +/- 0.081 (in 3 folds) MCC: 0.038 +/- 0.062 (in 3 folds) Unknown/abstention proportion: 0.531 +/- 0.223 (in 3 folds) Global scores with abstention: Accuracy: 0.183 MCC: 0.018 Unknown/abstention proportion: 0.524 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  50+ 0.38 0.50 0.43 70  Unknown 0.00 0.00 0.00 0  under 50 0.00 0.00 0.00 121  accuracy 0.18 191  macro avg 0.13 0.17 0.14 191 weighted avg 0.14 0.18 0.16 191,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.521 +/- 0.037 (in 3 folds) ROC-AUC (macro OvO): 0.521 +/- 0.037 (in 3 folds) au-PRC (weighted OvO): 0.618 +/- 0.056 (in 3 folds) au-PRC (macro OvO): 0.618 +/- 0.056 (in 3 folds) Accuracy: 0.434 +/- 0.112 (in 3 folds) MCC: 0.000 +/- 0.000 (in 3 folds) Global scores without abstention: Accuracy: 0.407 MCC: -0.050 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.192 +/- 0.070 (in 3 folds) MCC: 0.043 +/- 0.058 (in 3 folds) Unknown/abstention proportion: 0.531 +/- 0.223 (in 3 folds) Global scores with abstention: Accuracy: 0.194 MCC: -0.006 Unknown/abstention proportion: 0.524 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  50+ 0.37 0.40 0.39 70  Unknown 0.00 0.00 0.00 0  under 50 0.56 0.07 0.13 121  accuracy 0.19 191  macro avg 0.31 0.16 0.17 191 weighted avg 0.49 0.19 0.22 191
,


---

# GeneLocus.BCR, TargetObsColumnEnum.age_group_pediatric_healthy_only trained on train_smaller set

## Specimen predictions on validation set

Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,Accuracy per fold with abstention,MCC per fold with abstention,Unknown/abstention proportion per fold with abstention,Accuracy global with abstention,MCC global with abstention,Unknown/abstention proportion global with abstention,Abstention label global with abstention,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
ridge_cv,0.813 +/- 0.132 (in 3 folds),0.813 +/- 0.132 (in 3 folds),0.383 +/- 0.206 (in 3 folds),0.383 +/- 0.206 (in 3 folds),0.733 +/- 0.243 (in 3 folds),0.096 +/- 0.167 (in 3 folds),0.819,0.113,0.523 +/- 0.362 (in 3 folds),0.028 +/- 0.040 (in 3 folds),0.363 +/- 0.346 (in 3 folds),0.515,0.064,0.371,Unknown,83.0,49.0,132.0,0.371212,False
linearsvm_ovr,0.762 +/- 0.164 (in 3 folds),0.762 +/- 0.164 (in 3 folds),0.371 +/- 0.174 (in 3 folds),0.371 +/- 0.174 (in 3 folds),0.835 +/- 0.050 (in 3 folds),0.191 +/- 0.251 (in 3 folds),0.837,0.19,0.661 +/- 0.103 (in 3 folds),0.079 +/- 0.077 (in 3 folds),0.211 +/- 0.087 (in 3 folds),0.659,0.1,0.212,Unknown,104.0,28.0,132.0,0.212121,False
xgboost,0.727 +/- 0.017 (in 3 folds),0.727 +/- 0.017 (in 3 folds),0.262 +/- 0.072 (in 3 folds),0.262 +/- 0.072 (in 3 folds),0.815 +/- 0.050 (in 3 folds),0.116 +/- 0.152 (in 3 folds),0.821,0.17,0.587 +/- 0.151 (in 3 folds),0.057 +/- 0.057 (in 3 folds),0.284 +/- 0.142 (in 3 folds),0.591,0.078,0.28,Unknown,95.0,37.0,132.0,0.280303,False
lasso_cv,0.679 +/- 0.044 (in 3 folds),0.679 +/- 0.044 (in 3 folds),0.227 +/- 0.043 (in 3 folds),0.227 +/- 0.043 (in 3 folds),0.733 +/- 0.243 (in 3 folds),0.096 +/- 0.167 (in 3 folds),0.819,0.113,0.523 +/- 0.362 (in 3 folds),0.028 +/- 0.040 (in 3 folds),0.363 +/- 0.346 (in 3 folds),0.515,0.064,0.371,Unknown,83.0,49.0,132.0,0.371212,False
elasticnet_cv,0.679 +/- 0.044 (in 3 folds),0.679 +/- 0.044 (in 3 folds),0.227 +/- 0.043 (in 3 folds),0.227 +/- 0.043 (in 3 folds),0.733 +/- 0.243 (in 3 folds),0.096 +/- 0.167 (in 3 folds),0.819,0.113,0.523 +/- 0.362 (in 3 folds),0.028 +/- 0.040 (in 3 folds),0.363 +/- 0.346 (in 3 folds),0.515,0.064,0.371,Unknown,83.0,49.0,132.0,0.371212,False
lasso_multiclass,0.670 +/- 0.128 (in 2 folds),0.670 +/- 0.128 (in 2 folds),0.251 +/- 0.056 (in 2 folds),0.251 +/- 0.056 (in 2 folds),0.884 +/- 0.110 (in 3 folds),0.060 +/- 0.154 (in 3 folds),0.836,0.171,0.449 +/- 0.363 (in 3 folds),0.059 +/- 0.056 (in 3 folds),0.463 +/- 0.431 (in 3 folds),0.462,0.066,0.447,Unknown,73.0,59.0,132.0,0.44697,False
dummy_stratified,0.595 +/- 0.071 (in 3 folds),0.595 +/- 0.071 (in 3 folds),0.193 +/- 0.071 (in 3 folds),0.193 +/- 0.071 (in 3 folds),0.704 +/- 0.073 (in 3 folds),0.152 +/- 0.101 (in 3 folds),0.716,0.156,0.511 +/- 0.151 (in 3 folds),0.091 +/- 0.042 (in 3 folds),0.284 +/- 0.142 (in 3 folds),0.515,0.093,0.28,Unknown,95.0,37.0,132.0,0.280303,False
rf_multiclass,0.546 +/- 0.069 (in 3 folds),0.546 +/- 0.069 (in 3 folds),0.227 +/- 0.113 (in 3 folds),0.227 +/- 0.113 (in 3 folds),0.852 +/- 0.062 (in 3 folds),0.218 +/- 0.210 (in 3 folds),0.856,0.251,0.676 +/- 0.120 (in 3 folds),0.094 +/- 0.051 (in 3 folds),0.211 +/- 0.087 (in 3 folds),0.674,0.116,0.212,Unknown,104.0,28.0,132.0,0.212121,False
dummy_most_frequent,0.500 +/- 0.000 (in 3 folds),0.500 +/- 0.000 (in 3 folds),0.147 +/- 0.043 (in 3 folds),0.147 +/- 0.043 (in 3 folds),0.853 +/- 0.043 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.856,0.0,0.675 +/- 0.106 (in 3 folds),0.012 +/- 0.025 (in 3 folds),0.211 +/- 0.087 (in 3 folds),0.674,0.02,0.212,Unknown,104.0,28.0,132.0,0.212121,True
"All results, sorted",,,,,,,,,,,,,,,,,,,,

Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,Accuracy per fold with abstention,MCC per fold with abstention,Unknown/abstention proportion per fold with abstention,Accuracy global with abstention,MCC global with abstention,Unknown/abstention proportion global with abstention,Abstention label global with abstention,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
ridge_cv,0.813 +/- 0.132 (in 3 folds),0.813 +/- 0.132 (in 3 folds),0.383 +/- 0.206 (in 3 folds),0.383 +/- 0.206 (in 3 folds),0.733 +/- 0.243 (in 3 folds),0.096 +/- 0.167 (in 3 folds),0.819,0.113,0.523 +/- 0.362 (in 3 folds),0.028 +/- 0.040 (in 3 folds),0.363 +/- 0.346 (in 3 folds),0.515,0.064,0.371,Unknown,83,49,132,0.371212,False
linearsvm_ovr,0.762 +/- 0.164 (in 3 folds),0.762 +/- 0.164 (in 3 folds),0.371 +/- 0.174 (in 3 folds),0.371 +/- 0.174 (in 3 folds),0.835 +/- 0.050 (in 3 folds),0.191 +/- 0.251 (in 3 folds),0.837,0.19,0.661 +/- 0.103 (in 3 folds),0.079 +/- 0.077 (in 3 folds),0.211 +/- 0.087 (in 3 folds),0.659,0.1,0.212,Unknown,104,28,132,0.212121,False
xgboost,0.727 +/- 0.017 (in 3 folds),0.727 +/- 0.017 (in 3 folds),0.262 +/- 0.072 (in 3 folds),0.262 +/- 0.072 (in 3 folds),0.815 +/- 0.050 (in 3 folds),0.116 +/- 0.152 (in 3 folds),0.821,0.17,0.587 +/- 0.151 (in 3 folds),0.057 +/- 0.057 (in 3 folds),0.284 +/- 0.142 (in 3 folds),0.591,0.078,0.28,Unknown,95,37,132,0.280303,False
lasso_cv,0.679 +/- 0.044 (in 3 folds),0.679 +/- 0.044 (in 3 folds),0.227 +/- 0.043 (in 3 folds),0.227 +/- 0.043 (in 3 folds),0.733 +/- 0.243 (in 3 folds),0.096 +/- 0.167 (in 3 folds),0.819,0.113,0.523 +/- 0.362 (in 3 folds),0.028 +/- 0.040 (in 3 folds),0.363 +/- 0.346 (in 3 folds),0.515,0.064,0.371,Unknown,83,49,132,0.371212,False
elasticnet_cv,0.679 +/- 0.044 (in 3 folds),0.679 +/- 0.044 (in 3 folds),0.227 +/- 0.043 (in 3 folds),0.227 +/- 0.043 (in 3 folds),0.733 +/- 0.243 (in 3 folds),0.096 +/- 0.167 (in 3 folds),0.819,0.113,0.523 +/- 0.362 (in 3 folds),0.028 +/- 0.040 (in 3 folds),0.363 +/- 0.346 (in 3 folds),0.515,0.064,0.371,Unknown,83,49,132,0.371212,False
lasso_multiclass,0.670 +/- 0.128 (in 2 folds),0.670 +/- 0.128 (in 2 folds),0.251 +/- 0.056 (in 2 folds),0.251 +/- 0.056 (in 2 folds),0.884 +/- 0.110 (in 3 folds),0.060 +/- 0.154 (in 3 folds),0.836,0.171,0.449 +/- 0.363 (in 3 folds),0.059 +/- 0.056 (in 3 folds),0.463 +/- 0.431 (in 3 folds),0.462,0.066,0.447,Unknown,73,59,132,0.44697,False
dummy_stratified,0.595 +/- 0.071 (in 3 folds),0.595 +/- 0.071 (in 3 folds),0.193 +/- 0.071 (in 3 folds),0.193 +/- 0.071 (in 3 folds),0.704 +/- 0.073 (in 3 folds),0.152 +/- 0.101 (in 3 folds),0.716,0.156,0.511 +/- 0.151 (in 3 folds),0.091 +/- 0.042 (in 3 folds),0.284 +/- 0.142 (in 3 folds),0.515,0.093,0.28,Unknown,95,37,132,0.280303,False
rf_multiclass,0.546 +/- 0.069 (in 3 folds),0.546 +/- 0.069 (in 3 folds),0.227 +/- 0.113 (in 3 folds),0.227 +/- 0.113 (in 3 folds),0.852 +/- 0.062 (in 3 folds),0.218 +/- 0.210 (in 3 folds),0.856,0.251,0.676 +/- 0.120 (in 3 folds),0.094 +/- 0.051 (in 3 folds),0.211 +/- 0.087 (in 3 folds),0.674,0.116,0.212,Unknown,104,28,132,0.212121,False
dummy_most_frequent,0.500 +/- 0.000 (in 3 folds),0.500 +/- 0.000 (in 3 folds),0.147 +/- 0.043 (in 3 folds),0.147 +/- 0.043 (in 3 folds),0.853 +/- 0.043 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.856,0.0,0.675 +/- 0.106 (in 3 folds),0.012 +/- 0.025 (in 3 folds),0.211 +/- 0.087 (in 3 folds),0.674,0.02,0.212,Unknown,104,28,132,0.212121,True


ridge_cv,linearsvm_ovr,xgboost,lasso_cv
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.813 +/- 0.132 (in 3 folds) ROC-AUC (macro OvO): 0.813 +/- 0.132 (in 3 folds) au-PRC (weighted OvO): 0.383 +/- 0.206 (in 3 folds) au-PRC (macro OvO): 0.383 +/- 0.206 (in 3 folds) Accuracy: 0.733 +/- 0.243 (in 3 folds) MCC: 0.096 +/- 0.167 (in 3 folds) Global scores without abstention: Accuracy: 0.819 MCC: 0.113 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.523 +/- 0.362 (in 3 folds) MCC: 0.028 +/- 0.040 (in 3 folds) Unknown/abstention proportion: 0.363 +/- 0.346 (in 3 folds) Global scores with abstention: Accuracy: 0.515 MCC: 0.064 Unknown/abstention proportion: 0.371 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  18+ 0.88 0.59 0.71 112  Unknown 0.00 0.00 0.00 0  under 18 0.25 0.10 0.14 20  accuracy 0.52 132  macro avg 0.38 0.23 0.28 132 weighted avg 0.78 0.52 0.62 132,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.762 +/- 0.164 (in 3 folds) ROC-AUC (macro OvO): 0.762 +/- 0.164 (in 3 folds) au-PRC (weighted OvO): 0.371 +/- 0.174 (in 3 folds) au-PRC (macro OvO): 0.371 +/- 0.174 (in 3 folds) Accuracy: 0.835 +/- 0.050 (in 3 folds) MCC: 0.191 +/- 0.251 (in 3 folds) Global scores without abstention: Accuracy: 0.837 MCC: 0.190 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.661 +/- 0.103 (in 3 folds) MCC: 0.079 +/- 0.077 (in 3 folds) Unknown/abstention proportion: 0.211 +/- 0.087 (in 3 folds) Global scores with abstention: Accuracy: 0.659 MCC: 0.100 Unknown/abstention proportion: 0.212 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  18+ 0.88 0.75 0.81 112  Unknown 0.00 0.00 0.00 0  under 18 0.38 0.15 0.21 20  accuracy 0.66 132  macro avg 0.42 0.30 0.34 132 weighted avg 0.80 0.66 0.72 132,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.727 
+/- 0.017 (in 3 folds) ROC-AUC (macro OvO): 0.727 +/- 0.017 (in 3 folds) au-PRC (weighted OvO): 0.262 +/- 0.072 (in 3 folds) au-PRC (macro OvO): 0.262 +/- 0.072 (in 3 folds) Accuracy: 0.815 +/- 0.050 (in 3 folds) MCC: 0.116 +/- 0.152 (in 3 folds) Global scores without abstention: Accuracy: 0.821 MCC: 0.170 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.587 +/- 0.151 (in 3 folds) MCC: 0.057 +/- 0.057 (in 3 folds) Unknown/abstention proportion: 0.284 +/- 0.142 (in 3 folds) Global scores with abstention: Accuracy: 0.591 MCC: 0.078 Unknown/abstention proportion: 0.280 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  18+ 0.87 0.67 0.76 112  Unknown 0.00 0.00 0.00 0  under 18 0.33 0.15 0.21 20  accuracy 0.59 132  macro avg 0.40 0.27 0.32 132 weighted avg 0.79 0.59 0.67 132,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.679 +/- 0.044 (in 3 folds) ROC-AUC (macro OvO): 0.679 +/- 0.044 (in 3 folds) au-PRC (weighted OvO): 0.227 +/- 0.043 (in 3 folds) au-PRC (macro OvO): 0.227 +/- 0.043 (in 3 folds) Accuracy: 0.733 +/- 0.243 (in 3 folds) MCC: 0.096 +/- 0.167 (in 3 folds) Global scores without abstention: Accuracy: 0.819 MCC: 0.113 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.523 +/- 0.362 (in 3 folds) MCC: 0.028 +/- 0.040 (in 3 folds) Unknown/abstention proportion: 0.363 +/- 0.346 (in 3 folds) Global scores with abstention: Accuracy: 0.515 MCC: 0.064 Unknown/abstention proportion: 0.371 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  18+ 0.88 0.59 0.71 112  Unknown 0.00 0.00 0.00 0  under 18 0.25 0.10 0.14 20  accuracy 0.52 132  macro avg 0.38 0.23 0.28 132 weighted avg 0.78 0.52 0.62 132
,,,


elasticnet_cv,lasso_multiclass,dummy_stratified,rf_multiclass
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.679 +/- 0.044 (in 3 folds) ROC-AUC (macro OvO): 0.679 +/- 0.044 (in 3 folds) au-PRC (weighted OvO): 0.227 +/- 0.043 (in 3 folds) au-PRC (macro OvO): 0.227 +/- 0.043 (in 3 folds) Accuracy: 0.733 +/- 0.243 (in 3 folds) MCC: 0.096 +/- 0.167 (in 3 folds) Global scores without abstention: Accuracy: 0.819 MCC: 0.113 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.523 +/- 0.362 (in 3 folds) MCC: 0.028 +/- 0.040 (in 3 folds) Unknown/abstention proportion: 0.363 +/- 0.346 (in 3 folds) Global scores with abstention: Accuracy: 0.515 MCC: 0.064 Unknown/abstention proportion: 0.371 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  18+ 0.88 0.59 0.71 112  Unknown 0.00 0.00 0.00 0  under 18 0.25 0.10 0.14 20  accuracy 0.52 132  macro avg 0.38 0.23 0.28 132 weighted avg 0.78 0.52 0.62 132,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.670 +/- 0.128 (in 2 folds) ROC-AUC (macro OvO): 0.670 +/- 0.128 (in 2 folds) au-PRC (weighted OvO): 0.251 +/- 0.056 (in 2 folds) au-PRC (macro OvO): 0.251 +/- 0.056 (in 2 folds) Accuracy: 0.884 +/- 0.110 (in 3 folds) MCC: 0.060 +/- 0.154 (in 3 folds) Global scores without abstention: Accuracy: 0.836 MCC: 0.171 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.449 +/- 0.363 (in 3 folds) MCC: 0.059 +/- 0.056 (in 3 folds) Unknown/abstention proportion: 0.463 +/- 0.431 (in 3 folds) Global scores with abstention: Accuracy: 0.462 MCC: 0.066 Unknown/abstention proportion: 0.447 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  18+ 0.88 0.53 0.66 112  Unknown 0.00 0.00 0.00 0  under 18 0.33 0.10 0.15 20  accuracy 0.46 132  macro avg 0.40 0.21 0.27 132 weighted avg 0.80 0.46 0.58 132,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.595 
+/- 0.071 (in 3 folds) ROC-AUC (macro OvO): 0.595 +/- 0.071 (in 3 folds) au-PRC (weighted OvO): 0.193 +/- 0.071 (in 3 folds) au-PRC (macro OvO): 0.193 +/- 0.071 (in 3 folds) Accuracy: 0.704 +/- 0.073 (in 3 folds) MCC: 0.152 +/- 0.101 (in 3 folds) Global scores without abstention: Accuracy: 0.716 MCC: 0.156 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.511 +/- 0.151 (in 3 folds) MCC: 0.091 +/- 0.042 (in 3 folds) Unknown/abstention proportion: 0.284 +/- 0.142 (in 3 folds) Global scores with abstention: Accuracy: 0.515 MCC: 0.093 Unknown/abstention proportion: 0.280 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  18+ 0.89 0.55 0.68 112  Unknown 0.00 0.00 0.00 0  under 18 0.24 0.30 0.27 20  accuracy 0.52 132  macro avg 0.38 0.28 0.32 132 weighted avg 0.79 0.52 0.62 132,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.546 +/- 0.069 (in 3 folds) ROC-AUC (macro OvO): 0.546 +/- 0.069 (in 3 folds) au-PRC (weighted OvO): 0.227 +/- 0.113 (in 3 folds) au-PRC (macro OvO): 0.227 +/- 0.113 (in 3 folds) Accuracy: 0.852 +/- 0.062 (in 3 folds) MCC: 0.218 +/- 0.210 (in 3 folds) Global scores without abstention: Accuracy: 0.856 MCC: 0.251 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.676 +/- 0.120 (in 3 folds) MCC: 0.094 +/- 0.051 (in 3 folds) Unknown/abstention proportion: 0.211 +/- 0.087 (in 3 folds) Global scores with abstention: Accuracy: 0.674 MCC: 0.116 Unknown/abstention proportion: 0.212 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  18+ 0.88 0.77 0.82 112  Unknown 0.00 0.00 0.00 0  under 18 0.50 0.15 0.23 20  accuracy 0.67 132  macro avg 0.46 0.31 0.35 132 weighted avg 0.82 0.67 0.73 132
,,,


dummy_most_frequent
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.500 +/- 0.000 (in 3 folds) ROC-AUC (macro OvO): 0.500 +/- 0.000 (in 3 folds) au-PRC (weighted OvO): 0.147 +/- 0.043 (in 3 folds) au-PRC (macro OvO): 0.147 +/- 0.043 (in 3 folds) Accuracy: 0.853 +/- 0.043 (in 3 folds) MCC: 0.000 +/- 0.000 (in 3 folds) Global scores without abstention: Accuracy: 0.856 MCC: 0.000 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.675 +/- 0.106 (in 3 folds) MCC: 0.012 +/- 0.025 (in 3 folds) Unknown/abstention proportion: 0.211 +/- 0.087 (in 3 folds) Global scores with abstention: Accuracy: 0.674 MCC: 0.020 Unknown/abstention proportion: 0.212 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  18+ 0.86 0.79 0.82 112  Unknown 0.00 0.00 0.00 0  under 18 0.00 0.00 0.00 20  accuracy 0.67 132  macro avg 0.29 0.26 0.27 132 weighted avg 0.73 0.67 0.70 132


## Apply train-smaller model -- Test set performance - With and without tuning on validation set



---

# GeneLocus.BCR, TargetObsColumnEnum.sex_healthy_only trained on train_smaller set

## Specimen predictions on validation set

Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,Accuracy per fold with abstention,MCC per fold with abstention,Unknown/abstention proportion per fold with abstention,Accuracy global with abstention,MCC global with abstention,Unknown/abstention proportion global with abstention,Abstention label global with abstention,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
dummy_stratified,0.564 +/- 0.053 (in 3 folds),0.564 +/- 0.053 (in 3 folds),0.514 +/- 0.230 (in 3 folds),0.514 +/- 0.230 (in 3 folds),0.491 +/- 0.101 (in 3 folds),0.135 +/- 0.103 (in 3 folds),0.491,-0.007,0.193 +/- 0.184 (in 3 folds),0.031 +/- 0.073 (in 3 folds),0.605 +/- 0.392 (in 3 folds),0.197,-0.009,0.598,Unknown,53.0,79.0,132.0,0.598485,False
rf_multiclass,0.560 +/- 0.029 (in 3 folds),0.560 +/- 0.029 (in 3 folds),0.568 +/- 0.192 (in 3 folds),0.568 +/- 0.192 (in 3 folds),0.537 +/- 0.059 (in 3 folds),0.194 +/- 0.069 (in 3 folds),0.541,0.078,0.452 +/- 0.130 (in 3 folds),0.128 +/- 0.053 (in 3 folds),0.169 +/- 0.151 (in 3 folds),0.447,0.048,0.174,Unknown,109.0,23.0,132.0,0.174242,False
elasticnet_cv,0.556 +/- 0.069 (in 3 folds),0.556 +/- 0.069 (in 3 folds),0.579 +/- 0.179 (in 3 folds),0.579 +/- 0.179 (in 3 folds),0.537 +/- 0.047 (in 3 folds),0.191 +/- 0.099 (in 3 folds),0.541,0.08,0.451 +/- 0.118 (in 3 folds),0.123 +/- 0.047 (in 3 folds),0.169 +/- 0.151 (in 3 folds),0.447,0.054,0.174,Unknown,109.0,23.0,132.0,0.174242,False
linearsvm_ovr,0.555 +/- 0.063 (in 3 folds),0.555 +/- 0.063 (in 3 folds),0.537 +/- 0.157 (in 3 folds),0.537 +/- 0.157 (in 3 folds),0.580 +/- 0.009 (in 3 folds),0.173 +/- 0.064 (in 3 folds),0.581,0.15,0.546 +/- 0.041 (in 3 folds),0.156 +/- 0.062 (in 3 folds),0.059 +/- 0.062 (in 3 folds),0.545,0.134,0.061,Unknown,124.0,8.0,132.0,0.060606,False
lasso_multiclass,0.554 +/- 0.058 (in 3 folds),0.554 +/- 0.058 (in 3 folds),0.536 +/- 0.148 (in 3 folds),0.536 +/- 0.148 (in 3 folds),0.556 +/- 0.027 (in 3 folds),0.123 +/- 0.099 (in 3 folds),0.556,0.098,0.523 +/- 0.029 (in 3 folds),0.110 +/- 0.084 (in 3 folds),0.059 +/- 0.062 (in 3 folds),0.523,0.087,0.061,Unknown,124.0,8.0,132.0,0.060606,False
lasso_cv,0.547 +/- 0.084 (in 3 folds),0.547 +/- 0.084 (in 3 folds),0.581 +/- 0.187 (in 3 folds),0.581 +/- 0.187 (in 3 folds),0.521 +/- 0.130 (in 3 folds),0.240 +/- 0.079 (in 3 folds),0.49,-0.014,0.376 +/- 0.087 (in 3 folds),0.147 +/- 0.021 (in 3 folds),0.238 +/- 0.267 (in 3 folds),0.379,0.002,0.227,Unknown,102.0,30.0,132.0,0.227273,False
ridge_cv,0.533 +/- 0.084 (in 3 folds),0.533 +/- 0.084 (in 3 folds),0.581 +/- 0.187 (in 3 folds),0.581 +/- 0.187 (in 3 folds),0.471 +/- 0.120 (in 3 folds),0.102 +/- 0.176 (in 3 folds),0.451,-0.1,0.346 +/- 0.113 (in 3 folds),0.092 +/- 0.064 (in 3 folds),0.238 +/- 0.267 (in 3 folds),0.348,-0.046,0.227,Unknown,102.0,30.0,132.0,0.227273,False
xgboost,0.515 +/- 0.065 (in 3 folds),0.515 +/- 0.065 (in 3 folds),0.633 +/- 0.165 (in 3 folds),0.633 +/- 0.165 (in 3 folds),0.609 +/- 0.050 (in 3 folds),0.108 +/- 0.101 (in 3 folds),0.59,0.191,0.356 +/- 0.216 (in 3 folds),0.136 +/- 0.039 (in 3 folds),0.395 +/- 0.391 (in 3 folds),0.348,0.09,0.409,Unknown,78.0,54.0,132.0,0.409091,False
dummy_most_frequent,0.500 +/- 0.000 (in 3 folds),0.500 +/- 0.000 (in 3 folds),0.628 +/- 0.088 (in 3 folds),0.628 +/- 0.088 (in 3 folds),0.628 +/- 0.088 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.632,0.0,0.273 +/- 0.159 (in 3 folds),0.120 +/- 0.060 (in 3 folds),0.565 +/- 0.226 (in 3 folds),0.273,0.148,0.568,Unknown,57.0,75.0,132.0,0.568182,True
"All results, sorted",,,,,,,,,,,,,,,,,,,,

Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,Accuracy per fold with abstention,MCC per fold with abstention,Unknown/abstention proportion per fold with abstention,Accuracy global with abstention,MCC global with abstention,Unknown/abstention proportion global with abstention,Abstention label global with abstention,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
dummy_stratified,0.564 +/- 0.053 (in 3 folds),0.564 +/- 0.053 (in 3 folds),0.514 +/- 0.230 (in 3 folds),0.514 +/- 0.230 (in 3 folds),0.491 +/- 0.101 (in 3 folds),0.135 +/- 0.103 (in 3 folds),0.491,-0.007,0.193 +/- 0.184 (in 3 folds),0.031 +/- 0.073 (in 3 folds),0.605 +/- 0.392 (in 3 folds),0.197,-0.009,0.598,Unknown,53,79,132,0.598485,False
rf_multiclass,0.560 +/- 0.029 (in 3 folds),0.560 +/- 0.029 (in 3 folds),0.568 +/- 0.192 (in 3 folds),0.568 +/- 0.192 (in 3 folds),0.537 +/- 0.059 (in 3 folds),0.194 +/- 0.069 (in 3 folds),0.541,0.078,0.452 +/- 0.130 (in 3 folds),0.128 +/- 0.053 (in 3 folds),0.169 +/- 0.151 (in 3 folds),0.447,0.048,0.174,Unknown,109,23,132,0.174242,False
elasticnet_cv,0.556 +/- 0.069 (in 3 folds),0.556 +/- 0.069 (in 3 folds),0.579 +/- 0.179 (in 3 folds),0.579 +/- 0.179 (in 3 folds),0.537 +/- 0.047 (in 3 folds),0.191 +/- 0.099 (in 3 folds),0.541,0.08,0.451 +/- 0.118 (in 3 folds),0.123 +/- 0.047 (in 3 folds),0.169 +/- 0.151 (in 3 folds),0.447,0.054,0.174,Unknown,109,23,132,0.174242,False
linearsvm_ovr,0.555 +/- 0.063 (in 3 folds),0.555 +/- 0.063 (in 3 folds),0.537 +/- 0.157 (in 3 folds),0.537 +/- 0.157 (in 3 folds),0.580 +/- 0.009 (in 3 folds),0.173 +/- 0.064 (in 3 folds),0.581,0.15,0.546 +/- 0.041 (in 3 folds),0.156 +/- 0.062 (in 3 folds),0.059 +/- 0.062 (in 3 folds),0.545,0.134,0.061,Unknown,124,8,132,0.060606,False
lasso_multiclass,0.554 +/- 0.058 (in 3 folds),0.554 +/- 0.058 (in 3 folds),0.536 +/- 0.148 (in 3 folds),0.536 +/- 0.148 (in 3 folds),0.556 +/- 0.027 (in 3 folds),0.123 +/- 0.099 (in 3 folds),0.556,0.098,0.523 +/- 0.029 (in 3 folds),0.110 +/- 0.084 (in 3 folds),0.059 +/- 0.062 (in 3 folds),0.523,0.087,0.061,Unknown,124,8,132,0.060606,False
lasso_cv,0.547 +/- 0.084 (in 3 folds),0.547 +/- 0.084 (in 3 folds),0.581 +/- 0.187 (in 3 folds),0.581 +/- 0.187 (in 3 folds),0.521 +/- 0.130 (in 3 folds),0.240 +/- 0.079 (in 3 folds),0.49,-0.014,0.376 +/- 0.087 (in 3 folds),0.147 +/- 0.021 (in 3 folds),0.238 +/- 0.267 (in 3 folds),0.379,0.002,0.227,Unknown,102,30,132,0.227273,False
ridge_cv,0.533 +/- 0.084 (in 3 folds),0.533 +/- 0.084 (in 3 folds),0.581 +/- 0.187 (in 3 folds),0.581 +/- 0.187 (in 3 folds),0.471 +/- 0.120 (in 3 folds),0.102 +/- 0.176 (in 3 folds),0.451,-0.1,0.346 +/- 0.113 (in 3 folds),0.092 +/- 0.064 (in 3 folds),0.238 +/- 0.267 (in 3 folds),0.348,-0.046,0.227,Unknown,102,30,132,0.227273,False
xgboost,0.515 +/- 0.065 (in 3 folds),0.515 +/- 0.065 (in 3 folds),0.633 +/- 0.165 (in 3 folds),0.633 +/- 0.165 (in 3 folds),0.609 +/- 0.050 (in 3 folds),0.108 +/- 0.101 (in 3 folds),0.59,0.191,0.356 +/- 0.216 (in 3 folds),0.136 +/- 0.039 (in 3 folds),0.395 +/- 0.391 (in 3 folds),0.348,0.09,0.409,Unknown,78,54,132,0.409091,False
dummy_most_frequent,0.500 +/- 0.000 (in 3 folds),0.500 +/- 0.000 (in 3 folds),0.628 +/- 0.088 (in 3 folds),0.628 +/- 0.088 (in 3 folds),0.628 +/- 0.088 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.632,0.0,0.273 +/- 0.159 (in 3 folds),0.120 +/- 0.060 (in 3 folds),0.565 +/- 0.226 (in 3 folds),0.273,0.148,0.568,Unknown,57,75,132,0.568182,True


dummy_stratified,rf_multiclass,elasticnet_cv,linearsvm_ovr
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.564 +/- 0.053 (in 3 folds) ROC-AUC (macro OvO): 0.564 +/- 0.053 (in 3 folds) au-PRC (weighted OvO): 0.514 +/- 0.230 (in 3 folds) au-PRC (macro OvO): 0.514 +/- 0.230 (in 3 folds) Accuracy: 0.491 +/- 0.101 (in 3 folds) MCC: 0.135 +/- 0.103 (in 3 folds) Global scores without abstention: Accuracy: 0.491 MCC: -0.007 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.193 +/- 0.184 (in 3 folds) MCC: 0.031 +/- 0.073 (in 3 folds) Unknown/abstention proportion: 0.605 +/- 0.392 (in 3 folds) Global scores with abstention: Accuracy: 0.197 MCC: -0.009 Unknown/abstention proportion: 0.598 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  F 0.39 0.15 0.22 71  M 0.60 0.25 0.35 61  Unknown 0.00 0.00 0.00 0  accuracy 0.20 132  macro avg 0.33 0.13 0.19 132 weighted avg 0.49 0.20 0.28 132,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.560 +/- 0.029 (in 3 folds) ROC-AUC (macro OvO): 0.560 +/- 0.029 (in 3 folds) au-PRC (weighted OvO): 0.568 +/- 0.192 (in 3 folds) au-PRC (macro OvO): 0.568 +/- 0.192 (in 3 folds) Accuracy: 0.537 +/- 0.059 (in 3 folds) MCC: 0.194 +/- 0.069 (in 3 folds) Global scores without abstention: Accuracy: 0.541 MCC: 0.078 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.452 +/- 0.130 (in 3 folds) MCC: 0.128 +/- 0.053 (in 3 folds) Unknown/abstention proportion: 0.169 +/- 0.151 (in 3 folds) Global scores with abstention: Accuracy: 0.447 MCC: 0.048 Unknown/abstention proportion: 0.174 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  F 0.54 0.52 0.53 71  M 0.54 0.36 0.43 61  Unknown 0.00 0.00 0.00 0  accuracy 0.45 132  macro avg 0.36 0.29 0.32 132 weighted avg 0.54 0.45 0.49 132,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.556 +/- 0.069 (in 3 
folds) ROC-AUC (macro OvO): 0.556 +/- 0.069 (in 3 folds) au-PRC (weighted OvO): 0.579 +/- 0.179 (in 3 folds) au-PRC (macro OvO): 0.579 +/- 0.179 (in 3 folds) Accuracy: 0.537 +/- 0.047 (in 3 folds) MCC: 0.191 +/- 0.099 (in 3 folds) Global scores without abstention: Accuracy: 0.541 MCC: 0.080 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.451 +/- 0.118 (in 3 folds) MCC: 0.123 +/- 0.047 (in 3 folds) Unknown/abstention proportion: 0.169 +/- 0.151 (in 3 folds) Global scores with abstention: Accuracy: 0.447 MCC: 0.054 Unknown/abstention proportion: 0.174 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  F 0.55 0.48 0.51 71  M 0.53 0.41 0.46 61  Unknown 0.00 0.00 0.00 0  accuracy 0.45 132  macro avg 0.36 0.30 0.32 132 weighted avg 0.54 0.45 0.49 132,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.555 +/- 0.063 (in 3 folds) ROC-AUC (macro OvO): 0.555 +/- 0.063 (in 3 folds) au-PRC (weighted OvO): 0.537 +/- 0.157 (in 3 folds) au-PRC (macro OvO): 0.537 +/- 0.157 (in 3 folds) Accuracy: 0.580 +/- 0.009 (in 3 folds) MCC: 0.173 +/- 0.064 (in 3 folds) Global scores without abstention: Accuracy: 0.581 MCC: 0.150 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.546 +/- 0.041 (in 3 folds) MCC: 0.156 +/- 0.062 (in 3 folds) Unknown/abstention proportion: 0.059 +/- 0.062 (in 3 folds) Global scores with abstention: Accuracy: 0.545 MCC: 0.134 Unknown/abstention proportion: 0.061 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  F 0.60 0.62 0.61 71  M 0.55 0.46 0.50 61  Unknown 0.00 0.00 0.00 0  accuracy 0.55 132  macro avg 0.38 0.36 0.37 132 weighted avg 0.58 0.55 0.56 132
,,,


lasso_multiclass,lasso_cv,ridge_cv,xgboost
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.554 +/- 0.058 (in 3 folds) ROC-AUC (macro OvO): 0.554 +/- 0.058 (in 3 folds) au-PRC (weighted OvO): 0.536 +/- 0.148 (in 3 folds) au-PRC (macro OvO): 0.536 +/- 0.148 (in 3 folds) Accuracy: 0.556 +/- 0.027 (in 3 folds) MCC: 0.123 +/- 0.099 (in 3 folds) Global scores without abstention: Accuracy: 0.556 MCC: 0.098 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.523 +/- 0.029 (in 3 folds) MCC: 0.110 +/- 0.084 (in 3 folds) Unknown/abstention proportion: 0.059 +/- 0.062 (in 3 folds) Global scores with abstention: Accuracy: 0.523 MCC: 0.087 Unknown/abstention proportion: 0.061 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  F 0.58 0.62 0.60 71  M 0.52 0.41 0.46 61  Unknown 0.00 0.00 0.00 0  accuracy 0.52 132  macro avg 0.37 0.34 0.35 132 weighted avg 0.55 0.52 0.53 132,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.547 +/- 0.084 (in 3 folds) ROC-AUC (macro OvO): 0.547 +/- 0.084 (in 3 folds) au-PRC (weighted OvO): 0.581 +/- 0.187 (in 3 folds) au-PRC (macro OvO): 0.581 +/- 0.187 (in 3 folds) Accuracy: 0.521 +/- 0.130 (in 3 folds) MCC: 0.240 +/- 0.079 (in 3 folds) Global scores without abstention: Accuracy: 0.490 MCC: -0.014 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.376 +/- 0.087 (in 3 folds) MCC: 0.147 +/- 0.021 (in 3 folds) Unknown/abstention proportion: 0.238 +/- 0.267 (in 3 folds) Global scores with abstention: Accuracy: 0.379 MCC: 0.002 Unknown/abstention proportion: 0.227 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  F 0.50 0.25 0.34 71  M 0.48 0.52 0.50 61  Unknown 0.00 0.00 0.00 0  accuracy 0.38 132  macro avg 0.33 0.26 0.28 132 weighted avg 0.49 0.38 0.41 132,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.533 +/- 0.084 (in 3 
folds) ROC-AUC (macro OvO): 0.533 +/- 0.084 (in 3 folds) au-PRC (weighted OvO): 0.581 +/- 0.187 (in 3 folds) au-PRC (macro OvO): 0.581 +/- 0.187 (in 3 folds) Accuracy: 0.471 +/- 0.120 (in 3 folds) MCC: 0.102 +/- 0.176 (in 3 folds) Global scores without abstention: Accuracy: 0.451 MCC: -0.100 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.346 +/- 0.113 (in 3 folds) MCC: 0.092 +/- 0.064 (in 3 folds) Unknown/abstention proportion: 0.238 +/- 0.267 (in 3 folds) Global scores with abstention: Accuracy: 0.348 MCC: -0.046 Unknown/abstention proportion: 0.227 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  F 0.43 0.17 0.24 71  M 0.46 0.56 0.50 61  Unknown 0.00 0.00 0.00 0  accuracy 0.35 132  macro avg 0.30 0.24 0.25 132 weighted avg 0.44 0.35 0.36 132,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.515 +/- 0.065 (in 3 folds) ROC-AUC (macro OvO): 0.515 +/- 0.065 (in 3 folds) au-PRC (weighted OvO): 0.633 +/- 0.165 (in 3 folds) au-PRC (macro OvO): 0.633 +/- 0.165 (in 3 folds) Accuracy: 0.609 +/- 0.050 (in 3 folds) MCC: 0.108 +/- 0.101 (in 3 folds) Global scores without abstention: Accuracy: 0.590 MCC: 0.191 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.356 +/- 0.216 (in 3 folds) MCC: 0.136 +/- 0.039 (in 3 folds) Unknown/abstention proportion: 0.395 +/- 0.391 (in 3 folds) Global scores with abstention: Accuracy: 0.348 MCC: 0.090 Unknown/abstention proportion: 0.409 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  F 0.52 0.31 0.39 71  M 0.67 0.39 0.49 61  Unknown 0.00 0.00 0.00 0  accuracy 0.35 132  macro avg 0.40 0.23 0.29 132 weighted avg 0.59 0.35 0.44 132
,,,


dummy_most_frequent
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.500 +/- 0.000 (in 3 folds) ROC-AUC (macro OvO): 0.500 +/- 0.000 (in 3 folds) au-PRC (weighted OvO): 0.628 +/- 0.088 (in 3 folds) au-PRC (macro OvO): 0.628 +/- 0.088 (in 3 folds) Accuracy: 0.628 +/- 0.088 (in 3 folds) MCC: 0.000 +/- 0.000 (in 3 folds) Global scores without abstention: Accuracy: 0.632 MCC: 0.000 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.273 +/- 0.159 (in 3 folds) MCC: 0.120 +/- 0.060 (in 3 folds) Unknown/abstention proportion: 0.565 +/- 0.226 (in 3 folds) Global scores with abstention: Accuracy: 0.273 MCC: 0.148 Unknown/abstention proportion: 0.568 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  F 0.00 0.00 0.00 71  M 0.63 0.59 0.61 61  Unknown 0.00 0.00 0.00 0  accuracy 0.27 132  macro avg 0.21 0.20 0.20 132 weighted avg 0.29 0.27 0.28 132


## Apply train-smaller model -- Test set performance - With and without tuning on validation set

Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,Accuracy per fold with abstention,MCC per fold with abstention,Unknown/abstention proportion per fold with abstention,ROC-AUC (weighted OvO) per fold with abstention,ROC-AUC (macro OvO) per fold with abstention,au-PRC (weighted OvO) per fold with abstention,au-PRC (macro OvO) per fold with abstention,Accuracy global with abstention,MCC global with abstention,Unknown/abstention proportion global with abstention,Abstention label global with abstention,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
elasticnet_cv,0.549 +/- 0.090 (in 3 folds),0.549 +/- 0.090 (in 3 folds),0.551 +/- 0.093 (in 3 folds),0.551 +/- 0.093 (in 3 folds),0.553 +/- 0.073 (in 3 folds),0.082 +/- 0.156 (in 3 folds),0.542,0.075,0.470 +/- 0.019 (in 3 folds),0.048 +/- 0.097 (in 3 folds),0.138 +/- 0.142 (in 3 folds),,,,,0.471,0.062,0.131,Unknown,166.0,25.0,191.0,0.13089,False
elasticnet_cv.decision_thresholds_tuned,0.549 +/- 0.090 (in 3 folds),0.549 +/- 0.090 (in 3 folds),0.551 +/- 0.093 (in 3 folds),0.551 +/- 0.093 (in 3 folds),0.496 +/- 0.035 (in 3 folds),-0.021 +/- 0.049 (in 3 folds),0.5,-0.04,0.430 +/- 0.089 (in 3 folds),-0.010 +/- 0.057 (in 3 folds),0.138 +/- 0.142 (in 3 folds),,,,,0.435,-0.018,0.131,Unknown,166.0,25.0,191.0,0.13089,False
lasso_multiclass,0.545 +/- 0.054 (in 3 folds),0.545 +/- 0.054 (in 3 folds),0.561 +/- 0.054 (in 3 folds),0.561 +/- 0.054 (in 3 folds),0.546 +/- 0.040 (in 3 folds),0.086 +/- 0.109 (in 3 folds),0.543,0.081,0.530 +/- 0.019 (in 3 folds),0.075 +/- 0.094 (in 3 folds),0.042 +/- 0.038 (in 2 folds),0.542 +/- 0.000 (in 1 folds),0.542 +/- 0.000 (in 1 folds),0.536 +/- 0.000 (in 1 folds),0.536 +/- 0.000 (in 1 folds),0.529,0.076,0.026,Unknown,186.0,5.0,191.0,0.026178,False
lasso_multiclass.decision_thresholds_tuned,0.545 +/- 0.054 (in 3 folds),0.545 +/- 0.054 (in 3 folds),0.561 +/- 0.054 (in 3 folds),0.561 +/- 0.054 (in 3 folds),0.490 +/- 0.063 (in 3 folds),-0.039 +/- 0.134 (in 3 folds),0.495,-0.027,0.478 +/- 0.078 (in 3 folds),-0.016 +/- 0.107 (in 3 folds),0.042 +/- 0.038 (in 2 folds),0.542 +/- 0.000 (in 1 folds),0.542 +/- 0.000 (in 1 folds),0.536 +/- 0.000 (in 1 folds),0.536 +/- 0.000 (in 1 folds),0.482,-0.027,0.026,Unknown,186.0,5.0,191.0,0.026178,False
rf_multiclass,0.542 +/- 0.082 (in 3 folds),0.542 +/- 0.082 (in 3 folds),0.522 +/- 0.099 (in 3 folds),0.522 +/- 0.099 (in 3 folds),0.559 +/- 0.071 (in 3 folds),0.096 +/- 0.157 (in 3 folds),0.548,0.089,0.475 +/- 0.024 (in 3 folds),0.056 +/- 0.105 (in 3 folds),0.138 +/- 0.142 (in 3 folds),,,,,0.476,0.072,0.131,Unknown,166.0,25.0,191.0,0.13089,False
rf_multiclass.decision_thresholds_tuned,0.542 +/- 0.082 (in 3 folds),0.542 +/- 0.082 (in 3 folds),0.522 +/- 0.099 (in 3 folds),0.522 +/- 0.099 (in 3 folds),0.534 +/- 0.042 (in 3 folds),0.090 +/- 0.086 (in 3 folds),0.536,0.047,0.461 +/- 0.087 (in 3 folds),0.060 +/- 0.066 (in 3 folds),0.138 +/- 0.142 (in 3 folds),,,,,0.466,0.046,0.131,Unknown,166.0,25.0,191.0,0.13089,False
linearsvm_ovr,0.532 +/- 0.072 (in 3 folds),0.532 +/- 0.072 (in 3 folds),0.554 +/- 0.062 (in 3 folds),0.554 +/- 0.062 (in 3 folds),0.541 +/- 0.050 (in 3 folds),0.081 +/- 0.125 (in 3 folds),0.538,0.071,0.525 +/- 0.035 (in 3 folds),0.072 +/- 0.111 (in 3 folds),0.042 +/- 0.038 (in 2 folds),0.540 +/- 0.000 (in 1 folds),0.540 +/- 0.000 (in 1 folds),0.537 +/- 0.000 (in 1 folds),0.537 +/- 0.000 (in 1 folds),0.524,0.067,0.026,Unknown,186.0,5.0,191.0,0.026178,False
linearsvm_ovr.decision_thresholds_tuned,0.532 +/- 0.072 (in 3 folds),0.532 +/- 0.072 (in 3 folds),0.554 +/- 0.062 (in 3 folds),0.554 +/- 0.062 (in 3 folds),0.485 +/- 0.056 (in 3 folds),-0.031 +/- 0.125 (in 3 folds),0.489,-0.031,0.473 +/- 0.071 (in 3 folds),-0.008 +/- 0.093 (in 3 folds),0.042 +/- 0.038 (in 2 folds),0.540 +/- 0.000 (in 1 folds),0.540 +/- 0.000 (in 1 folds),0.537 +/- 0.000 (in 1 folds),0.537 +/- 0.000 (in 1 folds),0.476,-0.03,0.026,Unknown,186.0,5.0,191.0,0.026178,False
ridge_cv,0.488 +/- 0.030 (in 3 folds),0.488 +/- 0.030 (in 3 folds),0.544 +/- 0.069 (in 3 folds),0.544 +/- 0.069 (in 3 folds),0.548 +/- 0.014 (in 3 folds),0.009 +/- 0.015 (in 3 folds),0.547,0.092,0.429 +/- 0.153 (in 3 folds),0.069 +/- 0.037 (in 3 folds),0.217 +/- 0.275 (in 3 folds),,,,,0.424,0.078,0.225,Unknown,148.0,43.0,191.0,0.225131,False
ridge_cv.decision_thresholds_tuned,0.488 +/- 0.030 (in 3 folds),0.488 +/- 0.030 (in 3 folds),0.544 +/- 0.069 (in 3 folds),0.544 +/- 0.069 (in 3 folds),0.479 +/- 0.060 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.466,-0.076,0.364 +/- 0.093 (in 3 folds),-0.002 +/- 0.093 (in 3 folds),0.217 +/- 0.275 (in 3 folds),,,,,0.361,-0.041,0.225,Unknown,148.0,43.0,191.0,0.225131,False

Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,Accuracy per fold with abstention,MCC per fold with abstention,Unknown/abstention proportion per fold with abstention,ROC-AUC (weighted OvO) per fold with abstention,ROC-AUC (macro OvO) per fold with abstention,au-PRC (weighted OvO) per fold with abstention,au-PRC (macro OvO) per fold with abstention,Accuracy global with abstention,MCC global with abstention,Unknown/abstention proportion global with abstention,Abstention label global with abstention,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
elasticnet_cv,0.549 +/- 0.090 (in 3 folds),0.549 +/- 0.090 (in 3 folds),0.551 +/- 0.093 (in 3 folds),0.551 +/- 0.093 (in 3 folds),0.553 +/- 0.073 (in 3 folds),0.082 +/- 0.156 (in 3 folds),0.542,0.075,0.470 +/- 0.019 (in 3 folds),0.048 +/- 0.097 (in 3 folds),0.138 +/- 0.142 (in 3 folds),,,,,0.471,0.062,0.131,Unknown,166,25,191,0.13089,False
elasticnet_cv.decision_thresholds_tuned,0.549 +/- 0.090 (in 3 folds),0.549 +/- 0.090 (in 3 folds),0.551 +/- 0.093 (in 3 folds),0.551 +/- 0.093 (in 3 folds),0.496 +/- 0.035 (in 3 folds),-0.021 +/- 0.049 (in 3 folds),0.5,-0.04,0.430 +/- 0.089 (in 3 folds),-0.010 +/- 0.057 (in 3 folds),0.138 +/- 0.142 (in 3 folds),,,,,0.435,-0.018,0.131,Unknown,166,25,191,0.13089,False
lasso_multiclass,0.545 +/- 0.054 (in 3 folds),0.545 +/- 0.054 (in 3 folds),0.561 +/- 0.054 (in 3 folds),0.561 +/- 0.054 (in 3 folds),0.546 +/- 0.040 (in 3 folds),0.086 +/- 0.109 (in 3 folds),0.543,0.081,0.530 +/- 0.019 (in 3 folds),0.075 +/- 0.094 (in 3 folds),0.042 +/- 0.038 (in 2 folds),0.542 +/- 0.000 (in 1 folds),0.542 +/- 0.000 (in 1 folds),0.536 +/- 0.000 (in 1 folds),0.536 +/- 0.000 (in 1 folds),0.529,0.076,0.026,Unknown,186,5,191,0.026178,False
lasso_multiclass.decision_thresholds_tuned,0.545 +/- 0.054 (in 3 folds),0.545 +/- 0.054 (in 3 folds),0.561 +/- 0.054 (in 3 folds),0.561 +/- 0.054 (in 3 folds),0.490 +/- 0.063 (in 3 folds),-0.039 +/- 0.134 (in 3 folds),0.495,-0.027,0.478 +/- 0.078 (in 3 folds),-0.016 +/- 0.107 (in 3 folds),0.042 +/- 0.038 (in 2 folds),0.542 +/- 0.000 (in 1 folds),0.542 +/- 0.000 (in 1 folds),0.536 +/- 0.000 (in 1 folds),0.536 +/- 0.000 (in 1 folds),0.482,-0.027,0.026,Unknown,186,5,191,0.026178,False
rf_multiclass,0.542 +/- 0.082 (in 3 folds),0.542 +/- 0.082 (in 3 folds),0.522 +/- 0.099 (in 3 folds),0.522 +/- 0.099 (in 3 folds),0.559 +/- 0.071 (in 3 folds),0.096 +/- 0.157 (in 3 folds),0.548,0.089,0.475 +/- 0.024 (in 3 folds),0.056 +/- 0.105 (in 3 folds),0.138 +/- 0.142 (in 3 folds),,,,,0.476,0.072,0.131,Unknown,166,25,191,0.13089,False
rf_multiclass.decision_thresholds_tuned,0.542 +/- 0.082 (in 3 folds),0.542 +/- 0.082 (in 3 folds),0.522 +/- 0.099 (in 3 folds),0.522 +/- 0.099 (in 3 folds),0.534 +/- 0.042 (in 3 folds),0.090 +/- 0.086 (in 3 folds),0.536,0.047,0.461 +/- 0.087 (in 3 folds),0.060 +/- 0.066 (in 3 folds),0.138 +/- 0.142 (in 3 folds),,,,,0.466,0.046,0.131,Unknown,166,25,191,0.13089,False
linearsvm_ovr,0.532 +/- 0.072 (in 3 folds),0.532 +/- 0.072 (in 3 folds),0.554 +/- 0.062 (in 3 folds),0.554 +/- 0.062 (in 3 folds),0.541 +/- 0.050 (in 3 folds),0.081 +/- 0.125 (in 3 folds),0.538,0.071,0.525 +/- 0.035 (in 3 folds),0.072 +/- 0.111 (in 3 folds),0.042 +/- 0.038 (in 2 folds),0.540 +/- 0.000 (in 1 folds),0.540 +/- 0.000 (in 1 folds),0.537 +/- 0.000 (in 1 folds),0.537 +/- 0.000 (in 1 folds),0.524,0.067,0.026,Unknown,186,5,191,0.026178,False
linearsvm_ovr.decision_thresholds_tuned,0.532 +/- 0.072 (in 3 folds),0.532 +/- 0.072 (in 3 folds),0.554 +/- 0.062 (in 3 folds),0.554 +/- 0.062 (in 3 folds),0.485 +/- 0.056 (in 3 folds),-0.031 +/- 0.125 (in 3 folds),0.489,-0.031,0.473 +/- 0.071 (in 3 folds),-0.008 +/- 0.093 (in 3 folds),0.042 +/- 0.038 (in 2 folds),0.540 +/- 0.000 (in 1 folds),0.540 +/- 0.000 (in 1 folds),0.537 +/- 0.000 (in 1 folds),0.537 +/- 0.000 (in 1 folds),0.476,-0.03,0.026,Unknown,186,5,191,0.026178,False
ridge_cv,0.488 +/- 0.030 (in 3 folds),0.488 +/- 0.030 (in 3 folds),0.544 +/- 0.069 (in 3 folds),0.544 +/- 0.069 (in 3 folds),0.548 +/- 0.014 (in 3 folds),0.009 +/- 0.015 (in 3 folds),0.547,0.092,0.429 +/- 0.153 (in 3 folds),0.069 +/- 0.037 (in 3 folds),0.217 +/- 0.275 (in 3 folds),,,,,0.424,0.078,0.225,Unknown,148,43,191,0.225131,False
ridge_cv.decision_thresholds_tuned,0.488 +/- 0.030 (in 3 folds),0.488 +/- 0.030 (in 3 folds),0.544 +/- 0.069 (in 3 folds),0.544 +/- 0.069 (in 3 folds),0.479 +/- 0.060 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.466,-0.076,0.364 +/- 0.093 (in 3 folds),-0.002 +/- 0.093 (in 3 folds),0.217 +/- 0.275 (in 3 folds),,,,,0.361,-0.041,0.225,Unknown,148,43,191,0.225131,False


elasticnet_cv,elasticnet_cv.decision_thresholds_tuned,lasso_multiclass,lasso_multiclass.decision_thresholds_tuned
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.549 +/- 0.090 (in 3 folds) ROC-AUC (macro OvO): 0.549 +/- 0.090 (in 3 folds) au-PRC (weighted OvO): 0.551 +/- 0.093 (in 3 folds) au-PRC (macro OvO): 0.551 +/- 0.093 (in 3 folds) Accuracy: 0.553 +/- 0.073 (in 3 folds) MCC: 0.082 +/- 0.156 (in 3 folds) Global scores without abstention: Accuracy: 0.542 MCC: 0.075 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.470 +/- 0.019 (in 3 folds) MCC: 0.048 +/- 0.097 (in 3 folds) Unknown/abstention proportion: 0.138 +/- 0.142 (in 3 folds) Global scores with abstention: Accuracy: 0.471 MCC: 0.062 Unknown/abstention proportion: 0.131 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  F 0.56 0.56 0.56 99  M 0.51 0.38 0.44 92  Unknown 0.00 0.00 0.00 0  accuracy 0.47 191  macro avg 0.36 0.31 0.33 191 weighted avg 0.54 0.47 0.50 191,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.549 +/- 0.090 (in 3 folds) ROC-AUC (macro OvO): 0.549 +/- 0.090 (in 3 folds) au-PRC (weighted OvO): 0.551 +/- 0.093 (in 3 folds) au-PRC (macro OvO): 0.551 +/- 0.093 (in 3 folds) Accuracy: 0.496 +/- 0.035 (in 3 folds) MCC: -0.021 +/- 0.049 (in 3 folds) Global scores without abstention: Accuracy: 0.500 MCC: -0.040 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.430 +/- 0.089 (in 3 folds) MCC: -0.010 +/- 0.057 (in 3 folds) Unknown/abstention proportion: 0.138 +/- 0.142 (in 3 folds) Global scores with abstention: Accuracy: 0.435 MCC: -0.018 Unknown/abstention proportion: 0.131 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  F 0.52 0.68 0.59 99  M 0.43 0.17 0.25 92  Unknown 0.00 0.00 0.00 0  accuracy 0.43 191  macro avg 0.32 0.28 0.28 191 weighted avg 0.48 0.43 0.42 191,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.545 +/- 0.054 (in 3 
folds) ROC-AUC (macro OvO): 0.545 +/- 0.054 (in 3 folds) au-PRC (weighted OvO): 0.561 +/- 0.054 (in 3 folds) au-PRC (macro OvO): 0.561 +/- 0.054 (in 3 folds) Accuracy: 0.546 +/- 0.040 (in 3 folds) MCC: 0.086 +/- 0.109 (in 3 folds) Global scores without abstention: Accuracy: 0.543 MCC: 0.081 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.530 +/- 0.019 (in 3 folds) MCC: 0.075 +/- 0.094 (in 3 folds) Unknown/abstention proportion: 0.042 +/- 0.038 (in 2 folds) ROC-AUC (weighted OvO): 0.542 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.542 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.536 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.536 +/- 0.000 (in 1 folds) Global scores with abstention: Accuracy: 0.529 MCC: 0.076 Unknown/abstention proportion: 0.026 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  F 0.55 0.63 0.58 99  M 0.53 0.42 0.47 92  Unknown 0.00 0.00 0.00 0  accuracy 0.53 191  macro avg 0.36 0.35 0.35 191 weighted avg 0.54 0.53 0.53 191,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.545 +/- 0.054 (in 3 folds) ROC-AUC (macro OvO): 0.545 +/- 0.054 (in 3 folds) au-PRC (weighted OvO): 0.561 +/- 0.054 (in 3 folds) au-PRC (macro OvO): 0.561 +/- 0.054 (in 3 folds) Accuracy: 0.490 +/- 0.063 (in 3 folds) MCC: -0.039 +/- 0.134 (in 3 folds) Global scores without abstention: Accuracy: 0.495 MCC: -0.027 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.478 +/- 0.078 (in 3 folds) MCC: -0.016 +/- 0.107 (in 3 folds) Unknown/abstention proportion: 0.042 +/- 0.038 (in 2 folds) ROC-AUC (weighted OvO): 0.542 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.542 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.536 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.536 +/- 0.000 (in 1 folds) Global scores with abstention: Accuracy: 0.482 MCC: -0.027 Unknown/abstention proportion: 0.026 Abstention 
label: Unknown Global classification report with abstention:  precision recall f1-score support  F 0.51 0.68 0.58 99  M 0.46 0.27 0.34 92  Unknown 0.00 0.00 0.00 0  accuracy 0.48 191  macro avg 0.32 0.32 0.31 191 weighted avg 0.49 0.48 0.47 191
,,,


rf_multiclass,rf_multiclass.decision_thresholds_tuned,linearsvm_ovr,linearsvm_ovr.decision_thresholds_tuned
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.542 +/- 0.082 (in 3 folds) ROC-AUC (macro OvO): 0.542 +/- 0.082 (in 3 folds) au-PRC (weighted OvO): 0.522 +/- 0.099 (in 3 folds) au-PRC (macro OvO): 0.522 +/- 0.099 (in 3 folds) Accuracy: 0.559 +/- 0.071 (in 3 folds) MCC: 0.096 +/- 0.157 (in 3 folds) Global scores without abstention: Accuracy: 0.548 MCC: 0.089 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.475 +/- 0.024 (in 3 folds) MCC: 0.056 +/- 0.105 (in 3 folds) Unknown/abstention proportion: 0.138 +/- 0.142 (in 3 folds) Global scores with abstention: Accuracy: 0.476 MCC: 0.072 Unknown/abstention proportion: 0.131 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  F 0.57 0.55 0.56 99  M 0.52 0.40 0.45 92  Unknown 0.00 0.00 0.00 0  accuracy 0.48 191  macro avg 0.36 0.32 0.34 191 weighted avg 0.55 0.48 0.51 191,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.542 +/- 0.082 (in 3 folds) ROC-AUC (macro OvO): 0.542 +/- 0.082 (in 3 folds) au-PRC (weighted OvO): 0.522 +/- 0.099 (in 3 folds) au-PRC (macro OvO): 0.522 +/- 0.099 (in 3 folds) Accuracy: 0.534 +/- 0.042 (in 3 folds) MCC: 0.090 +/- 0.086 (in 3 folds) Global scores without abstention: Accuracy: 0.536 MCC: 0.047 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.461 +/- 0.087 (in 3 folds) MCC: 0.060 +/- 0.066 (in 3 folds) Unknown/abstention proportion: 0.138 +/- 0.142 (in 3 folds) Global scores with abstention: Accuracy: 0.466 MCC: 0.046 Unknown/abstention proportion: 0.131 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  F 0.54 0.71 0.61 99  M 0.51 0.21 0.29 92  Unknown 0.00 0.00 0.00 0  accuracy 0.47 191  macro avg 0.35 0.30 0.30 191 weighted avg 0.53 0.47 0.46 191,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.532 +/- 0.072 (in 3 
folds) ROC-AUC (macro OvO): 0.532 +/- 0.072 (in 3 folds) au-PRC (weighted OvO): 0.554 +/- 0.062 (in 3 folds) au-PRC (macro OvO): 0.554 +/- 0.062 (in 3 folds) Accuracy: 0.541 +/- 0.050 (in 3 folds) MCC: 0.081 +/- 0.125 (in 3 folds) Global scores without abstention: Accuracy: 0.538 MCC: 0.071 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.525 +/- 0.035 (in 3 folds) MCC: 0.072 +/- 0.111 (in 3 folds) Unknown/abstention proportion: 0.042 +/- 0.038 (in 2 folds) ROC-AUC (weighted OvO): 0.540 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.540 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.537 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.537 +/- 0.000 (in 1 folds) Global scores with abstention: Accuracy: 0.524 MCC: 0.067 Unknown/abstention proportion: 0.026 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  F 0.55 0.59 0.57 99  M 0.53 0.46 0.49 92  Unknown 0.00 0.00 0.00 0  accuracy 0.52 191  macro avg 0.36 0.35 0.35 191 weighted avg 0.54 0.52 0.53 191,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.532 +/- 0.072 (in 3 folds) ROC-AUC (macro OvO): 0.532 +/- 0.072 (in 3 folds) au-PRC (weighted OvO): 0.554 +/- 0.062 (in 3 folds) au-PRC (macro OvO): 0.554 +/- 0.062 (in 3 folds) Accuracy: 0.485 +/- 0.056 (in 3 folds) MCC: -0.031 +/- 0.125 (in 3 folds) Global scores without abstention: Accuracy: 0.489 MCC: -0.031 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.473 +/- 0.071 (in 3 folds) MCC: -0.008 +/- 0.093 (in 3 folds) Unknown/abstention proportion: 0.042 +/- 0.038 (in 2 folds) ROC-AUC (weighted OvO): 0.540 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.540 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.537 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.537 +/- 0.000 (in 1 folds) Global scores with abstention: Accuracy: 0.476 MCC: -0.030 Unknown/abstention proportion: 0.026 Abstention 
label: Unknown Global classification report with abstention:  precision recall f1-score support  F 0.50 0.60 0.55 99  M 0.46 0.35 0.40 92  Unknown 0.00 0.00 0.00 0  accuracy 0.48 191  macro avg 0.32 0.31 0.31 191 weighted avg 0.48 0.48 0.47 191
,,,


ridge_cv,ridge_cv.decision_thresholds_tuned,lasso_cv,lasso_cv.decision_thresholds_tuned
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.488 +/- 0.030 (in 3 folds) ROC-AUC (macro OvO): 0.488 +/- 0.030 (in 3 folds) au-PRC (weighted OvO): 0.544 +/- 0.069 (in 3 folds) au-PRC (macro OvO): 0.544 +/- 0.069 (in 3 folds) Accuracy: 0.548 +/- 0.014 (in 3 folds) MCC: 0.009 +/- 0.015 (in 3 folds) Global scores without abstention: Accuracy: 0.547 MCC: 0.092 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.429 +/- 0.153 (in 3 folds) MCC: 0.069 +/- 0.037 (in 3 folds) Unknown/abstention proportion: 0.217 +/- 0.275 (in 3 folds) Global scores with abstention: Accuracy: 0.424 MCC: 0.078 Unknown/abstention proportion: 0.225 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  F 0.56 0.24 0.34 99  M 0.54 0.62 0.58 92  Unknown 0.00 0.00 0.00 0  accuracy 0.42 191  macro avg 0.37 0.29 0.31 191 weighted avg 0.55 0.42 0.45 191,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.488 +/- 0.030 (in 3 folds) ROC-AUC (macro OvO): 0.488 +/- 0.030 (in 3 folds) au-PRC (weighted OvO): 0.544 +/- 0.069 (in 3 folds) au-PRC (macro OvO): 0.544 +/- 0.069 (in 3 folds) Accuracy: 0.479 +/- 0.060 (in 3 folds) MCC: 0.000 +/- 0.000 (in 3 folds) Global scores without abstention: Accuracy: 0.466 MCC: -0.076 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.364 +/- 0.093 (in 3 folds) MCC: -0.002 +/- 0.093 (in 3 folds) Unknown/abstention proportion: 0.217 +/- 0.275 (in 3 folds) Global scores with abstention: Accuracy: 0.361 MCC: -0.041 Unknown/abstention proportion: 0.225 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  F 0.44 0.25 0.32 99  M 0.48 0.48 0.48 92  Unknown 0.00 0.00 0.00 0  accuracy 0.36 191  macro avg 0.31 0.24 0.27 191 weighted avg 0.46 0.36 0.40 191,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.482 +/- 0.019 (in 3 
folds) ROC-AUC (macro OvO): 0.482 +/- 0.019 (in 3 folds) au-PRC (weighted OvO): 0.538 +/- 0.057 (in 3 folds) au-PRC (macro OvO): 0.538 +/- 0.057 (in 3 folds) Accuracy: 0.535 +/- 0.045 (in 3 folds) MCC: -0.028 +/- 0.194 (in 3 folds) Global scores without abstention: Accuracy: 0.527 MCC: 0.049 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.411 +/- 0.120 (in 3 folds) MCC: -0.021 +/- 0.146 (in 3 folds) Unknown/abstention proportion: 0.217 +/- 0.275 (in 3 folds) Global scores with abstention: Accuracy: 0.408 MCC: 0.043 Unknown/abstention proportion: 0.225 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  F 0.52 0.29 0.37 99  M 0.53 0.53 0.53 92  Unknown 0.00 0.00 0.00 0  accuracy 0.41 191  macro avg 0.35 0.28 0.30 191 weighted avg 0.52 0.41 0.45 191,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.482 +/- 0.019 (in 3 folds) ROC-AUC (macro OvO): 0.482 +/- 0.019 (in 3 folds) au-PRC (weighted OvO): 0.538 +/- 0.057 (in 3 folds) au-PRC (macro OvO): 0.538 +/- 0.057 (in 3 folds) Accuracy: 0.541 +/- 0.037 (in 3 folds) MCC: 0.080 +/- 0.054 (in 3 folds) Global scores without abstention: Accuracy: 0.534 MCC: 0.077 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.417 +/- 0.125 (in 3 folds) MCC: 0.063 +/- 0.031 (in 3 folds) Unknown/abstention proportion: 0.217 +/- 0.275 (in 3 folds) Global scores with abstention: Accuracy: 0.414 MCC: 0.040 Unknown/abstention proportion: 0.225 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  F 0.52 0.48 0.50 99  M 0.56 0.34 0.42 92  Unknown 0.00 0.00 0.00 0  accuracy 0.41 191  macro avg 0.36 0.27 0.31 191 weighted avg 0.54 0.41 0.46 191
,,,


xgboost,xgboost.decision_thresholds_tuned
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.482 +/- 0.016 (in 3 folds) ROC-AUC (macro OvO): 0.482 +/- 0.016 (in 3 folds) au-PRC (weighted OvO): 0.458 +/- 0.013 (in 3 folds) au-PRC (macro OvO): 0.458 +/- 0.013 (in 3 folds) Accuracy: 0.463 +/- 0.023 (in 3 folds) MCC: -0.046 +/- 0.060 (in 3 folds) Global scores without abstention: Accuracy: 0.463 MCC: -0.070 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.290 +/- 0.183 (in 3 folds) MCC: -0.058 +/- 0.048 (in 3 folds) Unknown/abstention proportion: 0.375 +/- 0.403 (in 3 folds) Global scores with abstention: Accuracy: 0.298 MCC: -0.040 Unknown/abstention proportion: 0.356 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  F 0.51 0.30 0.38 99  M 0.42 0.29 0.35 92  Unknown 0.00 0.00 0.00 0  accuracy 0.30 191  macro avg 0.31 0.20 0.24 191 weighted avg 0.47 0.30 0.36 191,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.482 +/- 0.016 (in 3 folds) ROC-AUC (macro OvO): 0.482 +/- 0.016 (in 3 folds) au-PRC (weighted OvO): 0.458 +/- 0.013 (in 3 folds) au-PRC (macro OvO): 0.458 +/- 0.013 (in 3 folds) Accuracy: 0.485 +/- 0.060 (in 3 folds) MCC: -0.003 +/- 0.109 (in 3 folds) Global scores without abstention: Accuracy: 0.488 MCC: -0.050 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.305 +/- 0.191 (in 3 folds) MCC: -0.043 +/- 0.070 (in 3 folds) Unknown/abstention proportion: 0.375 +/- 0.403 (in 3 folds) Global scores with abstention: Accuracy: 0.314 MCC: -0.019 Unknown/abstention proportion: 0.356 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  F 0.53 0.41 0.46 99  M 0.42 0.21 0.28 92  Unknown 0.00 0.00 0.00 0  accuracy 0.31 191  macro avg 0.32 0.21 0.25 191 weighted avg 0.48 0.31 0.37 191
,


---

# GeneLocus.BCR, TargetObsColumnEnum.covid_vs_healthy trained on train_smaller set

## Specimen predictions on validation set

Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,ROC-AUC (weighted OvO) per fold with abstention,ROC-AUC (macro OvO) per fold with abstention,au-PRC (weighted OvO) per fold with abstention,au-PRC (macro OvO) per fold with abstention,Accuracy per fold with abstention,MCC per fold with abstention,Unknown/abstention proportion per fold with abstention,Accuracy global with abstention,MCC global with abstention,Unknown/abstention proportion global with abstention,Abstention label global with abstention,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
linearsvm_ovr,0.994 +/- 0.001 (in 3 folds),0.994 +/- 0.001 (in 3 folds),0.998 +/- 0.000 (in 3 folds),0.998 +/- 0.000 (in 3 folds),0.963 +/- 0.018 (in 3 folds),0.903 +/- 0.041 (in 3 folds),0.963,0.898,0.994 +/- 0.000 (in 1 folds),0.994 +/- 0.000 (in 1 folds),0.998 +/- 0.000 (in 1 folds),0.998 +/- 0.000 (in 1 folds),0.953 +/- 0.016 (in 3 folds),0.876 +/- 0.031 (in 3 folds),0.016 +/- 0.000 (in 2 folds),0.953,0.873,0.01,Unknown,189.0,2.0,191.0,0.010471,False
ridge_cv,0.992 +/- 0.004 (in 3 folds),0.992 +/- 0.004 (in 3 folds),0.998 +/- 0.001 (in 3 folds),0.998 +/- 0.001 (in 3 folds),0.789 +/- 0.013 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.789,0.0,,,,,0.764 +/- 0.004 (in 3 folds),0.070 +/- 0.040 (in 3 folds),0.031 +/- 0.016 (in 3 folds),0.764,0.061,0.031,Unknown,185.0,6.0,191.0,0.031414,True
lasso_multiclass,0.992 +/- 0.003 (in 3 folds),0.992 +/- 0.003 (in 3 folds),0.998 +/- 0.000 (in 3 folds),0.998 +/- 0.000 (in 3 folds),0.963 +/- 0.018 (in 3 folds),0.897 +/- 0.048 (in 3 folds),0.963,0.892,0.993 +/- 0.000 (in 1 folds),0.993 +/- 0.000 (in 1 folds),0.998 +/- 0.000 (in 1 folds),0.998 +/- 0.000 (in 1 folds),0.953 +/- 0.016 (in 3 folds),0.870 +/- 0.041 (in 3 folds),0.016 +/- 0.000 (in 2 folds),0.953,0.866,0.01,Unknown,189.0,2.0,191.0,0.010471,False
elasticnet_cv,0.990 +/- 0.008 (in 3 folds),0.990 +/- 0.008 (in 3 folds),0.997 +/- 0.002 (in 3 folds),0.997 +/- 0.002 (in 3 folds),0.803 +/- 0.017 (in 3 folds),0.275 +/- 0.057 (in 3 folds),0.803,0.279,0.986 +/- 0.004 (in 2 folds),0.986 +/- 0.004 (in 2 folds),0.996 +/- 0.001 (in 2 folds),0.996 +/- 0.001 (in 2 folds),0.790 +/- 0.038 (in 3 folds),0.242 +/- 0.102 (in 3 folds),0.048 +/- 0.000 (in 1 folds),0.791,0.22,0.016,Unknown,188.0,3.0,191.0,0.015707,False
rf_multiclass,0.989 +/- 0.004 (in 3 folds),0.989 +/- 0.004 (in 3 folds),0.997 +/- 0.001 (in 3 folds),0.997 +/- 0.001 (in 3 folds),0.947 +/- 0.025 (in 3 folds),0.853 +/- 0.064 (in 3 folds),0.947,0.851,0.989 +/- 0.000 (in 1 folds),0.989 +/- 0.000 (in 1 folds),0.997 +/- 0.000 (in 1 folds),0.997 +/- 0.000 (in 1 folds),0.937 +/- 0.032 (in 3 folds),0.831 +/- 0.079 (in 3 folds),0.016 +/- 0.000 (in 2 folds),0.937,0.828,0.01,Unknown,189.0,2.0,191.0,0.010471,False
lasso_cv,0.988 +/- 0.010 (in 3 folds),0.988 +/- 0.010 (in 3 folds),0.996 +/- 0.003 (in 3 folds),0.996 +/- 0.003 (in 3 folds),0.867 +/- 0.043 (in 3 folds),0.559 +/- 0.185 (in 3 folds),0.868,0.578,0.989 +/- 0.000 (in 1 folds),0.989 +/- 0.000 (in 1 folds),0.996 +/- 0.000 (in 1 folds),0.996 +/- 0.000 (in 1 folds),0.858 +/- 0.049 (in 3 folds),0.523 +/- 0.228 (in 3 folds),0.016 +/- 0.000 (in 2 folds),0.859,0.549,0.01,Unknown,189.0,2.0,191.0,0.010471,False
xgboost,0.981 +/- 0.020 (in 3 folds),0.981 +/- 0.020 (in 3 folds),0.993 +/- 0.006 (in 3 folds),0.993 +/- 0.006 (in 3 folds),0.958 +/- 0.033 (in 3 folds),0.869 +/- 0.110 (in 3 folds),0.957,0.872,0.975 +/- 0.023 (in 2 folds),0.975 +/- 0.023 (in 2 folds),0.992 +/- 0.007 (in 2 folds),0.992 +/- 0.007 (in 2 folds),0.937 +/- 0.028 (in 3 folds),0.820 +/- 0.083 (in 3 folds),0.063 +/- 0.000 (in 1 folds),0.937,0.817,0.021,Unknown,187.0,4.0,191.0,0.020942,False
dummy_most_frequent,0.500 +/- 0.000 (in 3 folds),0.500 +/- 0.000 (in 3 folds),0.789 +/- 0.013 (in 3 folds),0.789 +/- 0.013 (in 3 folds),0.789 +/- 0.013 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.789,0.0,,,,,0.764 +/- 0.004 (in 3 folds),0.070 +/- 0.040 (in 3 folds),0.031 +/- 0.016 (in 3 folds),0.764,0.061,0.031,Unknown,185.0,6.0,191.0,0.031414,True
dummy_stratified,0.428 +/- 0.020 (in 3 folds),0.428 +/- 0.020 (in 3 folds),0.764 +/- 0.021 (in 3 folds),0.764 +/- 0.021 (in 3 folds),0.629 +/- 0.033 (in 3 folds),-0.150 +/- 0.034 (in 3 folds),0.628,-0.151,,,,,0.602 +/- 0.028 (in 3 folds),-0.120 +/- 0.034 (in 3 folds),0.042 +/- 0.010 (in 3 folds),0.602,-0.121,0.042,Unknown,183.0,8.0,191.0,0.041885,False
"All results, sorted",,,,,,,,,,,,,,,,,,,,,,,,

Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,ROC-AUC (weighted OvO) per fold with abstention,ROC-AUC (macro OvO) per fold with abstention,au-PRC (weighted OvO) per fold with abstention,au-PRC (macro OvO) per fold with abstention,Accuracy per fold with abstention,MCC per fold with abstention,Unknown/abstention proportion per fold with abstention,Accuracy global with abstention,MCC global with abstention,Unknown/abstention proportion global with abstention,Abstention label global with abstention,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
linearsvm_ovr,0.994 +/- 0.001 (in 3 folds),0.994 +/- 0.001 (in 3 folds),0.998 +/- 0.000 (in 3 folds),0.998 +/- 0.000 (in 3 folds),0.963 +/- 0.018 (in 3 folds),0.903 +/- 0.041 (in 3 folds),0.963,0.898,0.994 +/- 0.000 (in 1 folds),0.994 +/- 0.000 (in 1 folds),0.998 +/- 0.000 (in 1 folds),0.998 +/- 0.000 (in 1 folds),0.953 +/- 0.016 (in 3 folds),0.876 +/- 0.031 (in 3 folds),0.016 +/- 0.000 (in 2 folds),0.953,0.873,0.01,Unknown,189,2,191,0.010471,False
ridge_cv,0.992 +/- 0.004 (in 3 folds),0.992 +/- 0.004 (in 3 folds),0.998 +/- 0.001 (in 3 folds),0.998 +/- 0.001 (in 3 folds),0.789 +/- 0.013 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.789,0.0,,,,,0.764 +/- 0.004 (in 3 folds),0.070 +/- 0.040 (in 3 folds),0.031 +/- 0.016 (in 3 folds),0.764,0.061,0.031,Unknown,185,6,191,0.031414,True
lasso_multiclass,0.992 +/- 0.003 (in 3 folds),0.992 +/- 0.003 (in 3 folds),0.998 +/- 0.000 (in 3 folds),0.998 +/- 0.000 (in 3 folds),0.963 +/- 0.018 (in 3 folds),0.897 +/- 0.048 (in 3 folds),0.963,0.892,0.993 +/- 0.000 (in 1 folds),0.993 +/- 0.000 (in 1 folds),0.998 +/- 0.000 (in 1 folds),0.998 +/- 0.000 (in 1 folds),0.953 +/- 0.016 (in 3 folds),0.870 +/- 0.041 (in 3 folds),0.016 +/- 0.000 (in 2 folds),0.953,0.866,0.01,Unknown,189,2,191,0.010471,False
elasticnet_cv,0.990 +/- 0.008 (in 3 folds),0.990 +/- 0.008 (in 3 folds),0.997 +/- 0.002 (in 3 folds),0.997 +/- 0.002 (in 3 folds),0.803 +/- 0.017 (in 3 folds),0.275 +/- 0.057 (in 3 folds),0.803,0.279,0.986 +/- 0.004 (in 2 folds),0.986 +/- 0.004 (in 2 folds),0.996 +/- 0.001 (in 2 folds),0.996 +/- 0.001 (in 2 folds),0.790 +/- 0.038 (in 3 folds),0.242 +/- 0.102 (in 3 folds),0.048 +/- 0.000 (in 1 folds),0.791,0.22,0.016,Unknown,188,3,191,0.015707,False
rf_multiclass,0.989 +/- 0.004 (in 3 folds),0.989 +/- 0.004 (in 3 folds),0.997 +/- 0.001 (in 3 folds),0.997 +/- 0.001 (in 3 folds),0.947 +/- 0.025 (in 3 folds),0.853 +/- 0.064 (in 3 folds),0.947,0.851,0.989 +/- 0.000 (in 1 folds),0.989 +/- 0.000 (in 1 folds),0.997 +/- 0.000 (in 1 folds),0.997 +/- 0.000 (in 1 folds),0.937 +/- 0.032 (in 3 folds),0.831 +/- 0.079 (in 3 folds),0.016 +/- 0.000 (in 2 folds),0.937,0.828,0.01,Unknown,189,2,191,0.010471,False
lasso_cv,0.988 +/- 0.010 (in 3 folds),0.988 +/- 0.010 (in 3 folds),0.996 +/- 0.003 (in 3 folds),0.996 +/- 0.003 (in 3 folds),0.867 +/- 0.043 (in 3 folds),0.559 +/- 0.185 (in 3 folds),0.868,0.578,0.989 +/- 0.000 (in 1 folds),0.989 +/- 0.000 (in 1 folds),0.996 +/- 0.000 (in 1 folds),0.996 +/- 0.000 (in 1 folds),0.858 +/- 0.049 (in 3 folds),0.523 +/- 0.228 (in 3 folds),0.016 +/- 0.000 (in 2 folds),0.859,0.549,0.01,Unknown,189,2,191,0.010471,False
xgboost,0.981 +/- 0.020 (in 3 folds),0.981 +/- 0.020 (in 3 folds),0.993 +/- 0.006 (in 3 folds),0.993 +/- 0.006 (in 3 folds),0.958 +/- 0.033 (in 3 folds),0.869 +/- 0.110 (in 3 folds),0.957,0.872,0.975 +/- 0.023 (in 2 folds),0.975 +/- 0.023 (in 2 folds),0.992 +/- 0.007 (in 2 folds),0.992 +/- 0.007 (in 2 folds),0.937 +/- 0.028 (in 3 folds),0.820 +/- 0.083 (in 3 folds),0.063 +/- 0.000 (in 1 folds),0.937,0.817,0.021,Unknown,187,4,191,0.020942,False
dummy_most_frequent,0.500 +/- 0.000 (in 3 folds),0.500 +/- 0.000 (in 3 folds),0.789 +/- 0.013 (in 3 folds),0.789 +/- 0.013 (in 3 folds),0.789 +/- 0.013 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.789,0.0,,,,,0.764 +/- 0.004 (in 3 folds),0.070 +/- 0.040 (in 3 folds),0.031 +/- 0.016 (in 3 folds),0.764,0.061,0.031,Unknown,185,6,191,0.031414,True
dummy_stratified,0.428 +/- 0.020 (in 3 folds),0.428 +/- 0.020 (in 3 folds),0.764 +/- 0.021 (in 3 folds),0.764 +/- 0.021 (in 3 folds),0.629 +/- 0.033 (in 3 folds),-0.150 +/- 0.034 (in 3 folds),0.628,-0.151,,,,,0.602 +/- 0.028 (in 3 folds),-0.120 +/- 0.034 (in 3 folds),0.042 +/- 0.010 (in 3 folds),0.602,-0.121,0.042,Unknown,183,8,191,0.041885,False


linearsvm_ovr,ridge_cv,lasso_multiclass,elasticnet_cv
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.994 +/- 0.001 (in 3 folds) ROC-AUC (macro OvO): 0.994 +/- 0.001 (in 3 folds) au-PRC (weighted OvO): 0.998 +/- 0.000 (in 3 folds) au-PRC (macro OvO): 0.998 +/- 0.000 (in 3 folds) Accuracy: 0.963 +/- 0.018 (in 3 folds) MCC: 0.903 +/- 0.041 (in 3 folds) Global scores without abstention: Accuracy: 0.963 MCC: 0.898 Per-fold scores with abstention (note that abstentions not included in probability-based scores): ROC-AUC (weighted OvO): 0.994 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.994 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.998 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.998 +/- 0.000 (in 1 folds) Accuracy: 0.953 +/- 0.016 (in 3 folds) MCC: 0.876 +/- 0.031 (in 3 folds) Unknown/abstention proportion: 0.016 +/- 0.000 (in 2 folds) Global scores with abstention: Accuracy: 0.953 MCC: 0.873 Unknown/abstention proportion: 0.010 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  Covid19 0.87 0.95 0.91 42 Healthy/Background 0.99 0.95 0.97 149  Unknown 0.00 0.00 0.00 0  accuracy 0.95 191  macro avg 0.62 0.64 0.63 191  weighted avg 0.97 0.95 0.96 191,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.992 +/- 0.004 (in 3 folds) ROC-AUC (macro OvO): 0.992 +/- 0.004 (in 3 folds) au-PRC (weighted OvO): 0.998 +/- 0.001 (in 3 folds) au-PRC (macro OvO): 0.998 +/- 0.001 (in 3 folds) Accuracy: 0.789 +/- 0.013 (in 3 folds) MCC: 0.000 +/- 0.000 (in 3 folds) Global scores without abstention: Accuracy: 0.789 MCC: 0.000 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.764 +/- 0.004 (in 3 folds) MCC: 0.070 +/- 0.040 (in 3 folds) Unknown/abstention proportion: 0.031 +/- 0.016 (in 3 folds) Global scores with abstention: Accuracy: 0.764 MCC: 0.061 Unknown/abstention proportion: 0.031 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  Covid19 
0.00 0.00 0.00 42 Healthy/Background 0.79 0.98 0.87 149  Unknown 0.00 0.00 0.00 0  accuracy 0.76 191  macro avg 0.26 0.33 0.29 191  weighted avg 0.62 0.76 0.68 191,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.992 +/- 0.003 (in 3 folds) ROC-AUC (macro OvO): 0.992 +/- 0.003 (in 3 folds) au-PRC (weighted OvO): 0.998 +/- 0.000 (in 3 folds) au-PRC (macro OvO): 0.998 +/- 0.000 (in 3 folds) Accuracy: 0.963 +/- 0.018 (in 3 folds) MCC: 0.897 +/- 0.048 (in 3 folds) Global scores without abstention: Accuracy: 0.963 MCC: 0.892 Per-fold scores with abstention (note that abstentions not included in probability-based scores): ROC-AUC (weighted OvO): 0.993 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.993 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.998 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.998 +/- 0.000 (in 1 folds) Accuracy: 0.953 +/- 0.016 (in 3 folds) MCC: 0.870 +/- 0.041 (in 3 folds) Unknown/abstention proportion: 0.016 +/- 0.000 (in 2 folds) Global scores with abstention: Accuracy: 0.953 MCC: 0.866 Unknown/abstention proportion: 0.010 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  Covid19 0.90 0.90 0.90 42 Healthy/Background 0.98 0.97 0.97 149  Unknown 0.00 0.00 0.00 0  accuracy 0.95 191  macro avg 0.63 0.62 0.63 191  weighted avg 0.96 0.95 0.96 191,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.990 +/- 0.008 (in 3 folds) ROC-AUC (macro OvO): 0.990 +/- 0.008 (in 3 folds) au-PRC (weighted OvO): 0.997 +/- 0.002 (in 3 folds) au-PRC (macro OvO): 0.997 +/- 0.002 (in 3 folds) Accuracy: 0.803 +/- 0.017 (in 3 folds) MCC: 0.275 +/- 0.057 (in 3 folds) Global scores without abstention: Accuracy: 0.803 MCC: 0.279 Per-fold scores with abstention (note that abstentions not included in probability-based scores): ROC-AUC (weighted OvO): 0.986 +/- 0.004 (in 2 folds) ROC-AUC (macro OvO): 0.986 +/- 0.004 (in 2 folds) au-PRC (weighted OvO): 0.996 +/- 0.001 (in 2 folds) au-PRC (macro OvO): 
0.996 +/- 0.001 (in 2 folds) Accuracy: 0.790 +/- 0.038 (in 3 folds) MCC: 0.242 +/- 0.102 (in 3 folds) Unknown/abstention proportion: 0.048 +/- 0.000 (in 1 folds) Global scores with abstention: Accuracy: 0.791 MCC: 0.220 Unknown/abstention proportion: 0.016 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  Covid19 1.00 0.10 0.17 42 Healthy/Background 0.80 0.99 0.88 149  Unknown 0.00 0.00 0.00 0  accuracy 0.79 191  macro avg 0.60 0.36 0.35 191  weighted avg 0.84 0.79 0.73 191
,,,


rf_multiclass,lasso_cv,xgboost,dummy_most_frequent
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.989 +/- 0.004 (in 3 folds) ROC-AUC (macro OvO): 0.989 +/- 0.004 (in 3 folds) au-PRC (weighted OvO): 0.997 +/- 0.001 (in 3 folds) au-PRC (macro OvO): 0.997 +/- 0.001 (in 3 folds) Accuracy: 0.947 +/- 0.025 (in 3 folds) MCC: 0.853 +/- 0.064 (in 3 folds) Global scores without abstention: Accuracy: 0.947 MCC: 0.851 Per-fold scores with abstention (note that abstentions not included in probability-based scores): ROC-AUC (weighted OvO): 0.989 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.989 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.997 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.997 +/- 0.000 (in 1 folds) Accuracy: 0.937 +/- 0.032 (in 3 folds) MCC: 0.831 +/- 0.079 (in 3 folds) Unknown/abstention proportion: 0.016 +/- 0.000 (in 2 folds) Global scores with abstention: Accuracy: 0.937 MCC: 0.828 Unknown/abstention proportion: 0.010 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  Covid19 0.84 0.90 0.87 42 Healthy/Background 0.98 0.95 0.96 149  Unknown 0.00 0.00 0.00 0  accuracy 0.94 191  macro avg 0.61 0.62 0.61 191  weighted avg 0.95 0.94 0.94 191,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.988 +/- 0.010 (in 3 folds) ROC-AUC (macro OvO): 0.988 +/- 0.010 (in 3 folds) au-PRC (weighted OvO): 0.996 +/- 0.003 (in 3 folds) au-PRC (macro OvO): 0.996 +/- 0.003 (in 3 folds) Accuracy: 0.867 +/- 0.043 (in 3 folds) MCC: 0.559 +/- 0.185 (in 3 folds) Global scores without abstention: Accuracy: 0.868 MCC: 0.578 Per-fold scores with abstention (note that abstentions not included in probability-based scores): ROC-AUC (weighted OvO): 0.989 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.989 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.996 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.996 +/- 0.000 (in 1 folds) Accuracy: 0.858 +/- 0.049 (in 3 folds) MCC: 0.523 +/- 0.228 (in 3 folds) Unknown/abstention proportion: 0.016 +/- 0.000 (in 2 folds) Global 
scores with abstention: Accuracy: 0.859 MCC: 0.549 Unknown/abstention proportion: 0.010 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  Covid19 1.00 0.38 0.55 42 Healthy/Background 0.86 0.99 0.92 149  Unknown 0.00 0.00 0.00 0  accuracy 0.86 191  macro avg 0.62 0.46 0.49 191  weighted avg 0.89 0.86 0.84 191,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.981 +/- 0.020 (in 3 folds) ROC-AUC (macro OvO): 0.981 +/- 0.020 (in 3 folds) au-PRC (weighted OvO): 0.993 +/- 0.006 (in 3 folds) au-PRC (macro OvO): 0.993 +/- 0.006 (in 3 folds) Accuracy: 0.958 +/- 0.033 (in 3 folds) MCC: 0.869 +/- 0.110 (in 3 folds) Global scores without abstention: Accuracy: 0.957 MCC: 0.872 Per-fold scores with abstention (note that abstentions not included in probability-based scores): ROC-AUC (weighted OvO): 0.975 +/- 0.023 (in 2 folds) ROC-AUC (macro OvO): 0.975 +/- 0.023 (in 2 folds) au-PRC (weighted OvO): 0.992 +/- 0.007 (in 2 folds) au-PRC (macro OvO): 0.992 +/- 0.007 (in 2 folds) Accuracy: 0.937 +/- 0.028 (in 3 folds) MCC: 0.820 +/- 0.083 (in 3 folds) Unknown/abstention proportion: 0.063 +/- 0.000 (in 1 folds) Global scores with abstention: Accuracy: 0.937 MCC: 0.817 Unknown/abstention proportion: 0.021 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  Covid19 0.97 0.81 0.88 42 Healthy/Background 0.95 0.97 0.96 149  Unknown 0.00 0.00 0.00 0  accuracy 0.94 191  macro avg 0.64 0.59 0.62 191  weighted avg 0.96 0.94 0.95 191,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.500 +/- 0.000 (in 3 folds) ROC-AUC (macro OvO): 0.500 +/- 0.000 (in 3 folds) au-PRC (weighted OvO): 0.789 +/- 0.013 (in 3 folds) au-PRC (macro OvO): 0.789 +/- 0.013 (in 3 folds) Accuracy: 0.789 +/- 0.013 (in 3 folds) MCC: 0.000 +/- 0.000 (in 3 folds) Global scores without abstention: Accuracy: 0.789 MCC: 0.000 Per-fold scores with abstention (note that abstentions not included in 
probability-based scores): Accuracy: 0.764 +/- 0.004 (in 3 folds) MCC: 0.070 +/- 0.040 (in 3 folds) Unknown/abstention proportion: 0.031 +/- 0.016 (in 3 folds) Global scores with abstention: Accuracy: 0.764 MCC: 0.061 Unknown/abstention proportion: 0.031 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  Covid19 0.00 0.00 0.00 42 Healthy/Background 0.79 0.98 0.87 149  Unknown 0.00 0.00 0.00 0  accuracy 0.76 191  macro avg 0.26 0.33 0.29 191  weighted avg 0.62 0.76 0.68 191
,,,


dummy_stratified
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.428 +/- 0.020 (in 3 folds) ROC-AUC (macro OvO): 0.428 +/- 0.020 (in 3 folds) au-PRC (weighted OvO): 0.764 +/- 0.021 (in 3 folds) au-PRC (macro OvO): 0.764 +/- 0.021 (in 3 folds) Accuracy: 0.629 +/- 0.033 (in 3 folds) MCC: -0.150 +/- 0.034 (in 3 folds) Global scores without abstention: Accuracy: 0.628 MCC: -0.151 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.602 +/- 0.028 (in 3 folds) MCC: -0.120 +/- 0.034 (in 3 folds) Unknown/abstention proportion: 0.042 +/- 0.010 (in 3 folds) Global scores with abstention: Accuracy: 0.602 MCC: -0.121 Unknown/abstention proportion: 0.042 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  Covid19 0.09 0.07 0.08 42 Healthy/Background 0.76 0.75 0.75 149  Unknown 0.00 0.00 0.00 0  accuracy 0.60 191  macro avg 0.28 0.27 0.28 191  weighted avg 0.61 0.60 0.61 191


## Apply train-smaller model -- Test set performance - With and without tuning on validation set

Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,Global evaluation column name global,Accuracy per fold with abstention,MCC per fold with abstention,Unknown/abstention proportion per fold with abstention,ROC-AUC (weighted OvO) per fold with abstention,ROC-AUC (macro OvO) per fold with abstention,au-PRC (weighted OvO) per fold with abstention,au-PRC (macro OvO) per fold with abstention,Accuracy global with abstention,MCC global with abstention,Unknown/abstention proportion global with abstention,Abstention label global with abstention,Global evaluation column name global with abstention,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
ridge_cv,0.991 +/- 0.007 (in 3 folds),0.991 +/- 0.007 (in 3 folds),0.997 +/- 0.002 (in 3 folds),0.997 +/- 0.002 (in 3 folds),0.776 +/- 0.010 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.776,0.0,disease.separate_past_exposures,0.757 +/- 0.010 (in 3 folds),-0.018 +/- 0.036 (in 3 folds),0.025 +/- 0.007 (in 3 folds),,,,,0.757,-0.015,0.025,Unknown,disease.separate_past_exposures,277.0,7.0,284.0,0.024648,True
ridge_cv.decision_thresholds_tuned,0.991 +/- 0.007 (in 3 folds),0.991 +/- 0.007 (in 3 folds),0.997 +/- 0.002 (in 3 folds),0.997 +/- 0.002 (in 3 folds),0.776 +/- 0.010 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.776,0.0,disease.separate_past_exposures,0.757 +/- 0.010 (in 3 folds),-0.018 +/- 0.036 (in 3 folds),0.025 +/- 0.007 (in 3 folds),,,,,0.757,-0.015,0.025,Unknown,disease.separate_past_exposures,277.0,7.0,284.0,0.024648,True
linearsvm_ovr,0.988 +/- 0.005 (in 3 folds),0.988 +/- 0.005 (in 3 folds),0.996 +/- 0.001 (in 3 folds),0.996 +/- 0.001 (in 3 folds),0.946 +/- 0.023 (in 3 folds),0.849 +/- 0.067 (in 3 folds),0.946,0.85,disease.separate_past_exposures,0.933 +/- 0.033 (in 3 folds),0.819 +/- 0.089 (in 3 folds),0.021 +/- 0.000 (in 2 folds),0.993 +/- 0.000 (in 1 folds),0.993 +/- 0.000 (in 1 folds),0.997 +/- 0.000 (in 1 folds),0.997 +/- 0.000 (in 1 folds),0.933,0.819,0.014,Unknown,disease.separate_past_exposures,280.0,4.0,284.0,0.014085,False
linearsvm_ovr.decision_thresholds_tuned,0.988 +/- 0.005 (in 3 folds),0.988 +/- 0.005 (in 3 folds),0.996 +/- 0.001 (in 3 folds),0.996 +/- 0.001 (in 3 folds),0.953 +/- 0.036 (in 3 folds),0.862 +/- 0.110 (in 3 folds),0.954,0.865,disease.separate_past_exposures,0.940 +/- 0.041 (in 3 folds),0.829 +/- 0.119 (in 3 folds),0.021 +/- 0.000 (in 2 folds),0.993 +/- 0.000 (in 1 folds),0.993 +/- 0.000 (in 1 folds),0.997 +/- 0.000 (in 1 folds),0.997 +/- 0.000 (in 1 folds),0.94,0.831,0.014,Unknown,disease.separate_past_exposures,280.0,4.0,284.0,0.014085,False
lasso_cv,0.988 +/- 0.003 (in 3 folds),0.988 +/- 0.003 (in 3 folds),0.996 +/- 0.001 (in 3 folds),0.996 +/- 0.001 (in 3 folds),0.868 +/- 0.025 (in 3 folds),0.580 +/- 0.109 (in 3 folds),0.868,0.587,disease.separate_past_exposures,0.856 +/- 0.032 (in 3 folds),0.532 +/- 0.150 (in 3 folds),0.021 +/- 0.000 (in 2 folds),0.989 +/- 0.000 (in 1 folds),0.989 +/- 0.000 (in 1 folds),0.996 +/- 0.000 (in 1 folds),0.996 +/- 0.000 (in 1 folds),0.856,0.542,0.014,Unknown,disease.separate_past_exposures,280.0,4.0,284.0,0.014085,False
lasso_cv.decision_thresholds_tuned,0.988 +/- 0.003 (in 3 folds),0.988 +/- 0.003 (in 3 folds),0.996 +/- 0.001 (in 3 folds),0.996 +/- 0.001 (in 3 folds),0.940 +/- 0.042 (in 3 folds),0.843 +/- 0.091 (in 3 folds),0.939,0.827,disease.separate_past_exposures,0.926 +/- 0.031 (in 3 folds),0.806 +/- 0.066 (in 3 folds),0.021 +/- 0.000 (in 2 folds),0.989 +/- 0.000 (in 1 folds),0.989 +/- 0.000 (in 1 folds),0.996 +/- 0.000 (in 1 folds),0.996 +/- 0.000 (in 1 folds),0.926,0.796,0.014,Unknown,disease.separate_past_exposures,280.0,4.0,284.0,0.014085,False
lasso_multiclass,0.986 +/- 0.010 (in 3 folds),0.986 +/- 0.010 (in 3 folds),0.996 +/- 0.002 (in 3 folds),0.996 +/- 0.002 (in 3 folds),0.949 +/- 0.042 (in 3 folds),0.852 +/- 0.126 (in 3 folds),0.95,0.855,disease.separate_past_exposures,0.936 +/- 0.047 (in 3 folds),0.821 +/- 0.134 (in 3 folds),0.021 +/- 0.000 (in 2 folds),0.993 +/- 0.000 (in 1 folds),0.993 +/- 0.000 (in 1 folds),0.997 +/- 0.000 (in 1 folds),0.997 +/- 0.000 (in 1 folds),0.937,0.822,0.014,Unknown,disease.separate_past_exposures,280.0,4.0,284.0,0.014085,False
lasso_multiclass.decision_thresholds_tuned,0.986 +/- 0.010 (in 3 folds),0.986 +/- 0.010 (in 3 folds),0.996 +/- 0.002 (in 3 folds),0.996 +/- 0.002 (in 3 folds),0.924 +/- 0.040 (in 3 folds),0.797 +/- 0.101 (in 3 folds),0.925,0.793,disease.separate_past_exposures,0.912 +/- 0.050 (in 3 folds),0.771 +/- 0.124 (in 3 folds),0.021 +/- 0.000 (in 2 folds),0.993 +/- 0.000 (in 1 folds),0.993 +/- 0.000 (in 1 folds),0.997 +/- 0.000 (in 1 folds),0.997 +/- 0.000 (in 1 folds),0.912,0.764,0.014,Unknown,disease.separate_past_exposures,280.0,4.0,284.0,0.014085,False
elasticnet_cv,0.985 +/- 0.006 (in 3 folds),0.985 +/- 0.006 (in 3 folds),0.995 +/- 0.002 (in 3 folds),0.995 +/- 0.002 (in 3 folds),0.801 +/- 0.020 (in 3 folds),0.230 +/- 0.048 (in 3 folds),0.801,0.233,disease.separate_past_exposures,0.778 +/- 0.009 (in 3 folds),0.194 +/- 0.034 (in 3 folds),0.042 +/- 0.029 (in 2 folds),0.992 +/- 0.000 (in 1 folds),0.992 +/- 0.000 (in 1 folds),0.997 +/- 0.000 (in 1 folds),0.997 +/- 0.000 (in 1 folds),0.778,0.177,0.028,Unknown,disease.separate_past_exposures,276.0,8.0,284.0,0.028169,False
elasticnet_cv.decision_thresholds_tuned,0.985 +/- 0.006 (in 3 folds),0.985 +/- 0.006 (in 3 folds),0.995 +/- 0.002 (in 3 folds),0.995 +/- 0.002 (in 3 folds),0.945 +/- 0.024 (in 3 folds),0.833 +/- 0.081 (in 3 folds),0.946,0.837,disease.separate_past_exposures,0.919 +/- 0.053 (in 3 folds),0.778 +/- 0.138 (in 3 folds),0.042 +/- 0.029 (in 2 folds),0.992 +/- 0.000 (in 1 folds),0.992 +/- 0.000 (in 1 folds),0.997 +/- 0.000 (in 1 folds),0.997 +/- 0.000 (in 1 folds),0.919,0.775,0.028,Unknown,disease.separate_past_exposures,276.0,8.0,284.0,0.028169,False

Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,Global evaluation column name global,Accuracy per fold with abstention,MCC per fold with abstention,Unknown/abstention proportion per fold with abstention,ROC-AUC (weighted OvO) per fold with abstention,ROC-AUC (macro OvO) per fold with abstention,au-PRC (weighted OvO) per fold with abstention,au-PRC (macro OvO) per fold with abstention,Accuracy global with abstention,MCC global with abstention,Unknown/abstention proportion global with abstention,Abstention label global with abstention,Global evaluation column name global with abstention,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
ridge_cv,0.991 +/- 0.007 (in 3 folds),0.991 +/- 0.007 (in 3 folds),0.997 +/- 0.002 (in 3 folds),0.997 +/- 0.002 (in 3 folds),0.776 +/- 0.010 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.776,0.0,disease.separate_past_exposures,0.757 +/- 0.010 (in 3 folds),-0.018 +/- 0.036 (in 3 folds),0.025 +/- 0.007 (in 3 folds),,,,,0.757,-0.015,0.025,Unknown,disease.separate_past_exposures,277,7,284,0.024648,True
ridge_cv.decision_thresholds_tuned,0.991 +/- 0.007 (in 3 folds),0.991 +/- 0.007 (in 3 folds),0.997 +/- 0.002 (in 3 folds),0.997 +/- 0.002 (in 3 folds),0.776 +/- 0.010 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.776,0.0,disease.separate_past_exposures,0.757 +/- 0.010 (in 3 folds),-0.018 +/- 0.036 (in 3 folds),0.025 +/- 0.007 (in 3 folds),,,,,0.757,-0.015,0.025,Unknown,disease.separate_past_exposures,277,7,284,0.024648,True
linearsvm_ovr,0.988 +/- 0.005 (in 3 folds),0.988 +/- 0.005 (in 3 folds),0.996 +/- 0.001 (in 3 folds),0.996 +/- 0.001 (in 3 folds),0.946 +/- 0.023 (in 3 folds),0.849 +/- 0.067 (in 3 folds),0.946,0.85,disease.separate_past_exposures,0.933 +/- 0.033 (in 3 folds),0.819 +/- 0.089 (in 3 folds),0.021 +/- 0.000 (in 2 folds),0.993 +/- 0.000 (in 1 folds),0.993 +/- 0.000 (in 1 folds),0.997 +/- 0.000 (in 1 folds),0.997 +/- 0.000 (in 1 folds),0.933,0.819,0.014,Unknown,disease.separate_past_exposures,280,4,284,0.014085,False
linearsvm_ovr.decision_thresholds_tuned,0.988 +/- 0.005 (in 3 folds),0.988 +/- 0.005 (in 3 folds),0.996 +/- 0.001 (in 3 folds),0.996 +/- 0.001 (in 3 folds),0.953 +/- 0.036 (in 3 folds),0.862 +/- 0.110 (in 3 folds),0.954,0.865,disease.separate_past_exposures,0.940 +/- 0.041 (in 3 folds),0.829 +/- 0.119 (in 3 folds),0.021 +/- 0.000 (in 2 folds),0.993 +/- 0.000 (in 1 folds),0.993 +/- 0.000 (in 1 folds),0.997 +/- 0.000 (in 1 folds),0.997 +/- 0.000 (in 1 folds),0.94,0.831,0.014,Unknown,disease.separate_past_exposures,280,4,284,0.014085,False
lasso_cv,0.988 +/- 0.003 (in 3 folds),0.988 +/- 0.003 (in 3 folds),0.996 +/- 0.001 (in 3 folds),0.996 +/- 0.001 (in 3 folds),0.868 +/- 0.025 (in 3 folds),0.580 +/- 0.109 (in 3 folds),0.868,0.587,disease.separate_past_exposures,0.856 +/- 0.032 (in 3 folds),0.532 +/- 0.150 (in 3 folds),0.021 +/- 0.000 (in 2 folds),0.989 +/- 0.000 (in 1 folds),0.989 +/- 0.000 (in 1 folds),0.996 +/- 0.000 (in 1 folds),0.996 +/- 0.000 (in 1 folds),0.856,0.542,0.014,Unknown,disease.separate_past_exposures,280,4,284,0.014085,False
lasso_cv.decision_thresholds_tuned,0.988 +/- 0.003 (in 3 folds),0.988 +/- 0.003 (in 3 folds),0.996 +/- 0.001 (in 3 folds),0.996 +/- 0.001 (in 3 folds),0.940 +/- 0.042 (in 3 folds),0.843 +/- 0.091 (in 3 folds),0.939,0.827,disease.separate_past_exposures,0.926 +/- 0.031 (in 3 folds),0.806 +/- 0.066 (in 3 folds),0.021 +/- 0.000 (in 2 folds),0.989 +/- 0.000 (in 1 folds),0.989 +/- 0.000 (in 1 folds),0.996 +/- 0.000 (in 1 folds),0.996 +/- 0.000 (in 1 folds),0.926,0.796,0.014,Unknown,disease.separate_past_exposures,280,4,284,0.014085,False
lasso_multiclass,0.986 +/- 0.010 (in 3 folds),0.986 +/- 0.010 (in 3 folds),0.996 +/- 0.002 (in 3 folds),0.996 +/- 0.002 (in 3 folds),0.949 +/- 0.042 (in 3 folds),0.852 +/- 0.126 (in 3 folds),0.95,0.855,disease.separate_past_exposures,0.936 +/- 0.047 (in 3 folds),0.821 +/- 0.134 (in 3 folds),0.021 +/- 0.000 (in 2 folds),0.993 +/- 0.000 (in 1 folds),0.993 +/- 0.000 (in 1 folds),0.997 +/- 0.000 (in 1 folds),0.997 +/- 0.000 (in 1 folds),0.937,0.822,0.014,Unknown,disease.separate_past_exposures,280,4,284,0.014085,False
lasso_multiclass.decision_thresholds_tuned,0.986 +/- 0.010 (in 3 folds),0.986 +/- 0.010 (in 3 folds),0.996 +/- 0.002 (in 3 folds),0.996 +/- 0.002 (in 3 folds),0.924 +/- 0.040 (in 3 folds),0.797 +/- 0.101 (in 3 folds),0.925,0.793,disease.separate_past_exposures,0.912 +/- 0.050 (in 3 folds),0.771 +/- 0.124 (in 3 folds),0.021 +/- 0.000 (in 2 folds),0.993 +/- 0.000 (in 1 folds),0.993 +/- 0.000 (in 1 folds),0.997 +/- 0.000 (in 1 folds),0.997 +/- 0.000 (in 1 folds),0.912,0.764,0.014,Unknown,disease.separate_past_exposures,280,4,284,0.014085,False
elasticnet_cv,0.985 +/- 0.006 (in 3 folds),0.985 +/- 0.006 (in 3 folds),0.995 +/- 0.002 (in 3 folds),0.995 +/- 0.002 (in 3 folds),0.801 +/- 0.020 (in 3 folds),0.230 +/- 0.048 (in 3 folds),0.801,0.233,disease.separate_past_exposures,0.778 +/- 0.009 (in 3 folds),0.194 +/- 0.034 (in 3 folds),0.042 +/- 0.029 (in 2 folds),0.992 +/- 0.000 (in 1 folds),0.992 +/- 0.000 (in 1 folds),0.997 +/- 0.000 (in 1 folds),0.997 +/- 0.000 (in 1 folds),0.778,0.177,0.028,Unknown,disease.separate_past_exposures,276,8,284,0.028169,False
elasticnet_cv.decision_thresholds_tuned,0.985 +/- 0.006 (in 3 folds),0.985 +/- 0.006 (in 3 folds),0.995 +/- 0.002 (in 3 folds),0.995 +/- 0.002 (in 3 folds),0.945 +/- 0.024 (in 3 folds),0.833 +/- 0.081 (in 3 folds),0.946,0.837,disease.separate_past_exposures,0.919 +/- 0.053 (in 3 folds),0.778 +/- 0.138 (in 3 folds),0.042 +/- 0.029 (in 2 folds),0.992 +/- 0.000 (in 1 folds),0.992 +/- 0.000 (in 1 folds),0.997 +/- 0.000 (in 1 folds),0.997 +/- 0.000 (in 1 folds),0.919,0.775,0.028,Unknown,disease.separate_past_exposures,276,8,284,0.028169,False


ridge_cv,ridge_cv.decision_thresholds_tuned,linearsvm_ovr,linearsvm_ovr.decision_thresholds_tuned
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.991 +/- 0.007 (in 3 folds) ROC-AUC (macro OvO): 0.991 +/- 0.007 (in 3 folds) au-PRC (weighted OvO): 0.997 +/- 0.002 (in 3 folds) au-PRC (macro OvO): 0.997 +/- 0.002 (in 3 folds) Accuracy: 0.776 +/- 0.010 (in 3 folds) MCC: 0.000 +/- 0.000 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.776 MCC: 0.000 Global evaluation column name: disease.separate_past_exposures Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.757 +/- 0.010 (in 3 folds) MCC: -0.018 +/- 0.036 (in 3 folds) Unknown/abstention proportion: 0.025 +/- 0.007 (in 3 folds) Global scores with abstention using column name disease.separate_past_exposures: Accuracy: 0.757 MCC: -0.015 Unknown/abstention proportion: 0.025 Abstention label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support  Covid19 0.00 0.00 0.00 63 Healthy/Background 0.78 0.97 0.86 221  Unknown 0.00 0.00 0.00 0  accuracy 0.76 284  macro avg 0.26 0.32 0.29 284  weighted avg 0.60 0.76 0.67 284,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.991 +/- 0.007 (in 3 folds) ROC-AUC (macro OvO): 0.991 +/- 0.007 (in 3 folds) au-PRC (weighted OvO): 0.997 +/- 0.002 (in 3 folds) au-PRC (macro OvO): 0.997 +/- 0.002 (in 3 folds) Accuracy: 0.776 +/- 0.010 (in 3 folds) MCC: 0.000 +/- 0.000 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.776 MCC: 0.000 Global evaluation column name: disease.separate_past_exposures Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.757 +/- 0.010 (in 3 folds) MCC: -0.018 +/- 0.036 (in 3 folds) Unknown/abstention proportion: 0.025 +/- 0.007 (in 3 folds) Global scores with 
abstention using column name disease.separate_past_exposures: Accuracy: 0.757 MCC: -0.015 Unknown/abstention proportion: 0.025 Abstention label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support  Covid19 0.00 0.00 0.00 63 Healthy/Background 0.78 0.97 0.86 221  Unknown 0.00 0.00 0.00 0  accuracy 0.76 284  macro avg 0.26 0.32 0.29 284  weighted avg 0.60 0.76 0.67 284,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.988 +/- 0.005 (in 3 folds) ROC-AUC (macro OvO): 0.988 +/- 0.005 (in 3 folds) au-PRC (weighted OvO): 0.996 +/- 0.001 (in 3 folds) au-PRC (macro OvO): 0.996 +/- 0.001 (in 3 folds) Accuracy: 0.946 +/- 0.023 (in 3 folds) MCC: 0.849 +/- 0.067 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.946 MCC: 0.850 Global evaluation column name: disease.separate_past_exposures Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.933 +/- 0.033 (in 3 folds) MCC: 0.819 +/- 0.089 (in 3 folds) Unknown/abstention proportion: 0.021 +/- 0.000 (in 2 folds) ROC-AUC (weighted OvO): 0.993 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.993 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.997 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.997 +/- 0.000 (in 1 folds) Global scores with abstention using column name disease.separate_past_exposures: Accuracy: 0.933 MCC: 0.819 Unknown/abstention proportion: 0.014 Abstention label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support  Covid19 0.85 0.90 0.88 63 Healthy/Background 0.98 0.94 0.96 221  Unknown 0.00 0.00 0.00 0  accuracy 0.93 284  macro avg 0.61 0.62 0.61 284  weighted avg 0.95 0.93 0.94 284,Per-fold scores 
without abstention: ROC-AUC (weighted OvO): 0.988 +/- 0.005 (in 3 folds) ROC-AUC (macro OvO): 0.988 +/- 0.005 (in 3 folds) au-PRC (weighted OvO): 0.996 +/- 0.001 (in 3 folds) au-PRC (macro OvO): 0.996 +/- 0.001 (in 3 folds) Accuracy: 0.953 +/- 0.036 (in 3 folds) MCC: 0.862 +/- 0.110 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.954 MCC: 0.865 Global evaluation column name: disease.separate_past_exposures Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.940 +/- 0.041 (in 3 folds) MCC: 0.829 +/- 0.119 (in 3 folds) Unknown/abstention proportion: 0.021 +/- 0.000 (in 2 folds) ROC-AUC (weighted OvO): 0.993 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.993 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.997 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.997 +/- 0.000 (in 1 folds) Global scores with abstention using column name disease.separate_past_exposures: Accuracy: 0.940 MCC: 0.831 Unknown/abstention proportion: 0.014 Abstention label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support  Covid19 0.90 0.87 0.89 63 Healthy/Background 0.97 0.96 0.96 221  Unknown 0.00 0.00 0.00 0  accuracy 0.94 284  macro avg 0.62 0.61 0.62 284  weighted avg 0.95 0.94 0.95 284
,,,


lasso_cv,lasso_cv.decision_thresholds_tuned,lasso_multiclass,lasso_multiclass.decision_thresholds_tuned
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.988 +/- 0.003 (in 3 folds) ROC-AUC (macro OvO): 0.988 +/- 0.003 (in 3 folds) au-PRC (weighted OvO): 0.996 +/- 0.001 (in 3 folds) au-PRC (macro OvO): 0.996 +/- 0.001 (in 3 folds) Accuracy: 0.868 +/- 0.025 (in 3 folds) MCC: 0.580 +/- 0.109 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.868 MCC: 0.587 Global evaluation column name: disease.separate_past_exposures Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.856 +/- 0.032 (in 3 folds) MCC: 0.532 +/- 0.150 (in 3 folds) Unknown/abstention proportion: 0.021 +/- 0.000 (in 2 folds) ROC-AUC (weighted OvO): 0.989 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.989 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.996 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.996 +/- 0.000 (in 1 folds) Global scores with abstention using column name disease.separate_past_exposures: Accuracy: 0.856 MCC: 0.542 Unknown/abstention proportion: 0.014 Abstention label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support  Covid19 1.00 0.40 0.57 63 Healthy/Background 0.85 0.99 0.92 221  Unknown 0.00 0.00 0.00 0  accuracy 0.86 284  macro avg 0.62 0.46 0.49 284  weighted avg 0.89 0.86 0.84 284,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.988 +/- 0.003 (in 3 folds) ROC-AUC (macro OvO): 0.988 +/- 0.003 (in 3 folds) au-PRC (weighted OvO): 0.996 +/- 0.001 (in 3 folds) au-PRC (macro OvO): 0.996 +/- 0.001 (in 3 folds) Accuracy: 0.940 +/- 0.042 (in 3 folds) MCC: 0.843 +/- 0.091 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.939 MCC: 0.827 Global evaluation column name: disease.separate_past_exposures Per-fold scores with abstention (note that 
abstentions not included in probability-based scores): Accuracy: 0.926 +/- 0.031 (in 3 folds) MCC: 0.806 +/- 0.066 (in 3 folds) Unknown/abstention proportion: 0.021 +/- 0.000 (in 2 folds) ROC-AUC (weighted OvO): 0.989 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.989 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.996 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.996 +/- 0.000 (in 1 folds) Global scores with abstention using column name disease.separate_past_exposures: Accuracy: 0.926 MCC: 0.796 Unknown/abstention proportion: 0.014 Abstention label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support  Covid19 0.85 0.87 0.86 63 Healthy/Background 0.97 0.94 0.95 221  Unknown 0.00 0.00 0.00 0  accuracy 0.93 284  macro avg 0.60 0.60 0.60 284  weighted avg 0.94 0.93 0.93 284,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.986 +/- 0.010 (in 3 folds) ROC-AUC (macro OvO): 0.986 +/- 0.010 (in 3 folds) au-PRC (weighted OvO): 0.996 +/- 0.002 (in 3 folds) au-PRC (macro OvO): 0.996 +/- 0.002 (in 3 folds) Accuracy: 0.949 +/- 0.042 (in 3 folds) MCC: 0.852 +/- 0.126 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.950 MCC: 0.855 Global evaluation column name: disease.separate_past_exposures Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.936 +/- 0.047 (in 3 folds) MCC: 0.821 +/- 0.134 (in 3 folds) Unknown/abstention proportion: 0.021 +/- 0.000 (in 2 folds) ROC-AUC (weighted OvO): 0.993 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.993 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.997 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.997 +/- 0.000 (in 1 folds) Global scores with abstention using column name disease.separate_past_exposures: Accuracy: 0.937 MCC: 0.822 Unknown/abstention proportion: 0.014 
Abstention label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support  Covid19 0.89 0.87 0.88 63 Healthy/Background 0.97 0.95 0.96 221  Unknown 0.00 0.00 0.00 0  accuracy 0.94 284  macro avg 0.62 0.61 0.61 284  weighted avg 0.95 0.94 0.94 284,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.986 +/- 0.010 (in 3 folds) ROC-AUC (macro OvO): 0.986 +/- 0.010 (in 3 folds) au-PRC (weighted OvO): 0.996 +/- 0.002 (in 3 folds) au-PRC (macro OvO): 0.996 +/- 0.002 (in 3 folds) Accuracy: 0.924 +/- 0.040 (in 3 folds) MCC: 0.797 +/- 0.101 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.925 MCC: 0.793 Global evaluation column name: disease.separate_past_exposures Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.912 +/- 0.050 (in 3 folds) MCC: 0.771 +/- 0.124 (in 3 folds) Unknown/abstention proportion: 0.021 +/- 0.000 (in 2 folds) ROC-AUC (weighted OvO): 0.993 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.993 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.997 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.997 +/- 0.000 (in 1 folds) Global scores with abstention using column name disease.separate_past_exposures: Accuracy: 0.912 MCC: 0.764 Unknown/abstention proportion: 0.014 Abstention label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support  Covid19 0.80 0.87 0.83 63 Healthy/Background 0.97 0.92 0.94 221  Unknown 0.00 0.00 0.00 0  accuracy 0.91 284  macro avg 0.59 0.60 0.59 284  weighted avg 0.93 0.91 0.92 284
,,,


elasticnet_cv,elasticnet_cv.decision_thresholds_tuned,xgboost,xgboost.decision_thresholds_tuned
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.985 +/- 0.006 (in 3 folds) ROC-AUC (macro OvO): 0.985 +/- 0.006 (in 3 folds) au-PRC (weighted OvO): 0.995 +/- 0.002 (in 3 folds) au-PRC (macro OvO): 0.995 +/- 0.002 (in 3 folds) Accuracy: 0.801 +/- 0.020 (in 3 folds) MCC: 0.230 +/- 0.048 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.801 MCC: 0.233 Global evaluation column name: disease.separate_past_exposures Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.778 +/- 0.009 (in 3 folds) MCC: 0.194 +/- 0.034 (in 3 folds) Unknown/abstention proportion: 0.042 +/- 0.029 (in 2 folds) ROC-AUC (weighted OvO): 0.992 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.992 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.997 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.997 +/- 0.000 (in 1 folds) Global scores with abstention using column name disease.separate_past_exposures: Accuracy: 0.778 MCC: 0.177 Unknown/abstention proportion: 0.028 Abstention label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support  Covid19 1.00 0.06 0.12 63 Healthy/Background 0.80 0.98 0.88 221  Unknown 0.00 0.00 0.00 0  accuracy 0.78 284  macro avg 0.60 0.35 0.33 284  weighted avg 0.84 0.78 0.71 284,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.985 +/- 0.006 (in 3 folds) ROC-AUC (macro OvO): 0.985 +/- 0.006 (in 3 folds) au-PRC (weighted OvO): 0.995 +/- 0.002 (in 3 folds) au-PRC (macro OvO): 0.995 +/- 0.002 (in 3 folds) Accuracy: 0.945 +/- 0.024 (in 3 folds) MCC: 0.833 +/- 0.081 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.946 MCC: 0.837 Global evaluation column name: disease.separate_past_exposures Per-fold scores with abstention (note that 
abstentions not included in probability-based scores): Accuracy: 0.919 +/- 0.053 (in 3 folds) MCC: 0.778 +/- 0.138 (in 3 folds) Unknown/abstention proportion: 0.042 +/- 0.029 (in 2 folds) ROC-AUC (weighted OvO): 0.992 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.992 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.997 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.997 +/- 0.000 (in 1 folds) Global scores with abstention using column name disease.separate_past_exposures: Accuracy: 0.919 MCC: 0.775 Unknown/abstention proportion: 0.028 Abstention label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support  Covid19 0.88 0.81 0.84 63 Healthy/Background 0.96 0.95 0.96 221  Unknown 0.00 0.00 0.00 0  accuracy 0.92 284  macro avg 0.61 0.59 0.60 284  weighted avg 0.94 0.92 0.93 284,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.971 +/- 0.014 (in 3 folds) ROC-AUC (macro OvO): 0.971 +/- 0.014 (in 3 folds) au-PRC (weighted OvO): 0.989 +/- 0.006 (in 3 folds) au-PRC (macro OvO): 0.989 +/- 0.006 (in 3 folds) Accuracy: 0.948 +/- 0.034 (in 3 folds) MCC: 0.847 +/- 0.094 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.949 MCC: 0.849 Global evaluation column name: disease.separate_past_exposures Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.912 +/- 0.060 (in 3 folds) MCC: 0.771 +/- 0.150 (in 3 folds) Unknown/abstention proportion: 0.058 +/- 0.052 (in 2 folds) ROC-AUC (weighted OvO): 0.983 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.983 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.994 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.994 +/- 0.000 (in 1 folds) Global scores with abstention using column name disease.separate_past_exposures: Accuracy: 0.912 MCC: 0.766 Unknown/abstention proportion: 0.039 
Abstention label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support  Covid19 0.87 0.83 0.85 63 Healthy/Background 0.97 0.94 0.95 221  Unknown 0.00 0.00 0.00 0  accuracy 0.91 284  macro avg 0.61 0.59 0.60 284  weighted avg 0.95 0.91 0.93 284,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.971 +/- 0.014 (in 3 folds) ROC-AUC (macro OvO): 0.971 +/- 0.014 (in 3 folds) au-PRC (weighted OvO): 0.989 +/- 0.006 (in 3 folds) au-PRC (macro OvO): 0.989 +/- 0.006 (in 3 folds) Accuracy: 0.948 +/- 0.034 (in 3 folds) MCC: 0.847 +/- 0.093 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.949 MCC: 0.847 Global evaluation column name: disease.separate_past_exposures Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.912 +/- 0.060 (in 3 folds) MCC: 0.771 +/- 0.150 (in 3 folds) Unknown/abstention proportion: 0.058 +/- 0.052 (in 2 folds) ROC-AUC (weighted OvO): 0.983 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.983 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.994 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.994 +/- 0.000 (in 1 folds) Global scores with abstention using column name disease.separate_past_exposures: Accuracy: 0.912 MCC: 0.763 Unknown/abstention proportion: 0.039 Abstention label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support  Covid19 0.88 0.81 0.84 63 Healthy/Background 0.97 0.94 0.95 221  Unknown 0.00 0.00 0.00 0  accuracy 0.91 284  macro avg 0.62 0.58 0.60 284  weighted avg 0.95 0.91 0.93 284
,,,


rf_multiclass,rf_multiclass.decision_thresholds_tuned
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.962 +/- 0.010 (in 3 folds) ROC-AUC (macro OvO): 0.962 +/- 0.010 (in 3 folds) au-PRC (weighted OvO): 0.986 +/- 0.005 (in 3 folds) au-PRC (macro OvO): 0.986 +/- 0.005 (in 3 folds) Accuracy: 0.929 +/- 0.010 (in 3 folds) MCC: 0.796 +/- 0.011 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.929 MCC: 0.791 Global evaluation column name: disease.separate_past_exposures Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.915 +/- 0.001 (in 3 folds) MCC: 0.761 +/- 0.020 (in 3 folds) Unknown/abstention proportion: 0.021 +/- 0.000 (in 2 folds) ROC-AUC (weighted OvO): 0.974 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.974 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.990 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.990 +/- 0.000 (in 1 folds) Global scores with abstention using column name disease.separate_past_exposures: Accuracy: 0.915 MCC: 0.759 Unknown/abstention proportion: 0.014 Abstention label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support  Covid19 0.85 0.81 0.83 63 Healthy/Background 0.95 0.95 0.95 221  Unknown 0.00 0.00 0.00 0  accuracy 0.92 284  macro avg 0.60 0.59 0.59 284  weighted avg 0.93 0.92 0.92 284,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.962 +/- 0.010 (in 3 folds) ROC-AUC (macro OvO): 0.962 +/- 0.010 (in 3 folds) au-PRC (weighted OvO): 0.986 +/- 0.005 (in 3 folds) au-PRC (macro OvO): 0.986 +/- 0.005 (in 3 folds) Accuracy: 0.946 +/- 0.012 (in 3 folds) MCC: 0.841 +/- 0.040 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.946 MCC: 0.840 Global evaluation column name: disease.separate_past_exposures Per-fold scores with abstention (note that 
abstentions not included in probability-based scores): Accuracy: 0.933 +/- 0.023 (in 3 folds) MCC: 0.804 +/- 0.068 (in 3 folds) Unknown/abstention proportion: 0.021 +/- 0.000 (in 2 folds) ROC-AUC (weighted OvO): 0.974 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.974 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.990 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.990 +/- 0.000 (in 1 folds) Global scores with abstention using column name disease.separate_past_exposures: Accuracy: 0.933 MCC: 0.805 Unknown/abstention proportion: 0.014 Abstention label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support  Covid19 0.93 0.81 0.86 63 Healthy/Background 0.95 0.97 0.96 221  Unknown 0.00 0.00 0.00 0  accuracy 0.93 284  macro avg 0.63 0.59 0.61 284  weighted avg 0.95 0.93 0.94 284
,


---

# GeneLocus.BCR, TargetObsColumnEnum.hiv_vs_healthy trained on train_smaller set

## Specimen predictions on validation set

Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,Accuracy per fold with abstention,MCC per fold with abstention,Unknown/abstention proportion per fold with abstention,Accuracy global with abstention,MCC global with abstention,Unknown/abstention proportion global with abstention,Abstention label global with abstention,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes,ROC-AUC (weighted OvO) per fold with abstention,ROC-AUC (macro OvO) per fold with abstention,au-PRC (weighted OvO) per fold with abstention,au-PRC (macro OvO) per fold with abstention
elasticnet_cv,0.975 +/- 0.008 (in 3 folds),0.975 +/- 0.008 (in 3 folds),0.987 +/- 0.006 (in 3 folds),0.987 +/- 0.006 (in 3 folds),0.811 +/- 0.087 (in 3 folds),0.539 +/- 0.236 (in 3 folds),0.808,0.556,0.752 +/- 0.066 (in 3 folds),0.386 +/- 0.237 (in 3 folds),0.071 +/- 0.030 (in 3 folds),0.751,0.402,0.07,Unknown,198.0,15.0,213.0,0.070423,False,,,,
ridge_cv,0.973 +/- 0.005 (in 3 folds),0.973 +/- 0.005 (in 3 folds),0.988 +/- 0.003 (in 3 folds),0.988 +/- 0.003 (in 3 folds),0.701 +/- 0.006 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.701,0.0,0.695 +/- 0.014 (in 3 folds),0.012 +/- 0.021 (in 3 folds),0.028 +/- 0.000 (in 1 folds),0.695,0.021,0.009,Unknown,211.0,2.0,213.0,0.00939,True,0.972 +/- 0.007 (in 2 folds),0.972 +/- 0.007 (in 2 folds),0.988 +/- 0.004 (in 2 folds),0.988 +/- 0.004 (in 2 folds)
linearsvm_ovr,0.971 +/- 0.009 (in 3 folds),0.971 +/- 0.009 (in 3 folds),0.986 +/- 0.006 (in 3 folds),0.986 +/- 0.006 (in 3 folds),0.924 +/- 0.015 (in 3 folds),0.821 +/- 0.034 (in 3 folds),0.924,0.816,0.911 +/- 0.020 (in 3 folds),0.795 +/- 0.037 (in 3 folds),0.021 +/- 0.009 (in 2 folds),0.911,0.788,0.014,Unknown,210.0,3.0,213.0,0.014085,False,0.979 +/- 0.000 (in 1 folds),0.979 +/- 0.000 (in 1 folds),0.991 +/- 0.000 (in 1 folds),0.991 +/- 0.000 (in 1 folds)
lasso_cv,0.969 +/- 0.015 (in 3 folds),0.969 +/- 0.015 (in 3 folds),0.985 +/- 0.009 (in 3 folds),0.985 +/- 0.009 (in 3 folds),0.887 +/- 0.009 (in 3 folds),0.736 +/- 0.016 (in 3 folds),0.887,0.735,0.850 +/- 0.032 (in 3 folds),0.649 +/- 0.072 (in 3 folds),0.042 +/- 0.027 (in 3 folds),0.85,0.646,0.042,Unknown,204.0,9.0,213.0,0.042254,False,,,,
lasso_multiclass,0.969 +/- 0.006 (in 3 folds),0.969 +/- 0.006 (in 3 folds),0.985 +/- 0.005 (in 3 folds),0.985 +/- 0.005 (in 3 folds),0.933 +/- 0.016 (in 3 folds),0.839 +/- 0.041 (in 3 folds),0.933,0.839,0.911 +/- 0.020 (in 3 folds),0.793 +/- 0.049 (in 3 folds),0.023 +/- 0.008 (in 3 folds),0.911,0.792,0.023,Unknown,208.0,5.0,213.0,0.023474,False,,,,
xgboost,0.955 +/- 0.005 (in 3 folds),0.955 +/- 0.005 (in 3 folds),0.976 +/- 0.006 (in 3 folds),0.976 +/- 0.006 (in 3 folds),0.918 +/- 0.029 (in 3 folds),0.804 +/- 0.073 (in 3 folds),0.918,0.803,0.897 +/- 0.031 (in 3 folds),0.759 +/- 0.076 (in 3 folds),0.023 +/- 0.008 (in 3 folds),0.897,0.759,0.023,Unknown,208.0,5.0,213.0,0.023474,False,,,,
rf_multiclass,0.932 +/- 0.010 (in 3 folds),0.932 +/- 0.010 (in 3 folds),0.961 +/- 0.002 (in 3 folds),0.961 +/- 0.002 (in 3 folds),0.914 +/- 0.029 (in 3 folds),0.795 +/- 0.068 (in 3 folds),0.914,0.791,0.897 +/- 0.018 (in 3 folds),0.759 +/- 0.045 (in 3 folds),0.028 +/- 0.000 (in 2 folds),0.897,0.754,0.019,Unknown,209.0,4.0,213.0,0.018779,False,0.922 +/- 0.000 (in 1 folds),0.922 +/- 0.000 (in 1 folds),0.962 +/- 0.000 (in 1 folds),0.962 +/- 0.000 (in 1 folds)
dummy_most_frequent,0.500 +/- 0.000 (in 3 folds),0.500 +/- 0.000 (in 3 folds),0.701 +/- 0.006 (in 3 folds),0.701 +/- 0.006 (in 3 folds),0.701 +/- 0.006 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.701,0.0,0.695 +/- 0.014 (in 3 folds),0.012 +/- 0.021 (in 3 folds),0.028 +/- 0.000 (in 1 folds),0.695,0.021,0.009,Unknown,211.0,2.0,213.0,0.00939,True,0.500 +/- 0.000 (in 2 folds),0.500 +/- 0.000 (in 2 folds),0.702 +/- 0.009 (in 2 folds),0.702 +/- 0.009 (in 2 folds)
dummy_stratified,0.493 +/- 0.051 (in 3 folds),0.493 +/- 0.051 (in 3 folds),0.664 +/- 0.029 (in 3 folds),0.664 +/- 0.029 (in 3 folds),0.556 +/- 0.039 (in 3 folds),-0.016 +/- 0.105 (in 3 folds),0.556,-0.017,0.469 +/- 0.015 (in 3 folds),-0.038 +/- 0.091 (in 3 folds),0.154 +/- 0.046 (in 3 folds),0.469,-0.034,0.155,Unknown,180.0,33.0,213.0,0.15493,False,,,,
"All results, sorted",,,,,,,,,,,,,,,,,,,,,,,,

Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,Accuracy per fold with abstention,MCC per fold with abstention,Unknown/abstention proportion per fold with abstention,Accuracy global with abstention,MCC global with abstention,Unknown/abstention proportion global with abstention,Abstention label global with abstention,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes,ROC-AUC (weighted OvO) per fold with abstention,ROC-AUC (macro OvO) per fold with abstention,au-PRC (weighted OvO) per fold with abstention,au-PRC (macro OvO) per fold with abstention
elasticnet_cv,0.975 +/- 0.008 (in 3 folds),0.975 +/- 0.008 (in 3 folds),0.987 +/- 0.006 (in 3 folds),0.987 +/- 0.006 (in 3 folds),0.811 +/- 0.087 (in 3 folds),0.539 +/- 0.236 (in 3 folds),0.808,0.556,0.752 +/- 0.066 (in 3 folds),0.386 +/- 0.237 (in 3 folds),0.071 +/- 0.030 (in 3 folds),0.751,0.402,0.07,Unknown,198,15,213,0.070423,False,,,,
ridge_cv,0.973 +/- 0.005 (in 3 folds),0.973 +/- 0.005 (in 3 folds),0.988 +/- 0.003 (in 3 folds),0.988 +/- 0.003 (in 3 folds),0.701 +/- 0.006 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.701,0.0,0.695 +/- 0.014 (in 3 folds),0.012 +/- 0.021 (in 3 folds),0.028 +/- 0.000 (in 1 folds),0.695,0.021,0.009,Unknown,211,2,213,0.00939,True,0.972 +/- 0.007 (in 2 folds),0.972 +/- 0.007 (in 2 folds),0.988 +/- 0.004 (in 2 folds),0.988 +/- 0.004 (in 2 folds)
linearsvm_ovr,0.971 +/- 0.009 (in 3 folds),0.971 +/- 0.009 (in 3 folds),0.986 +/- 0.006 (in 3 folds),0.986 +/- 0.006 (in 3 folds),0.924 +/- 0.015 (in 3 folds),0.821 +/- 0.034 (in 3 folds),0.924,0.816,0.911 +/- 0.020 (in 3 folds),0.795 +/- 0.037 (in 3 folds),0.021 +/- 0.009 (in 2 folds),0.911,0.788,0.014,Unknown,210,3,213,0.014085,False,0.979 +/- 0.000 (in 1 folds),0.979 +/- 0.000 (in 1 folds),0.991 +/- 0.000 (in 1 folds),0.991 +/- 0.000 (in 1 folds)
lasso_cv,0.969 +/- 0.015 (in 3 folds),0.969 +/- 0.015 (in 3 folds),0.985 +/- 0.009 (in 3 folds),0.985 +/- 0.009 (in 3 folds),0.887 +/- 0.009 (in 3 folds),0.736 +/- 0.016 (in 3 folds),0.887,0.735,0.850 +/- 0.032 (in 3 folds),0.649 +/- 0.072 (in 3 folds),0.042 +/- 0.027 (in 3 folds),0.85,0.646,0.042,Unknown,204,9,213,0.042254,False,,,,
lasso_multiclass,0.969 +/- 0.006 (in 3 folds),0.969 +/- 0.006 (in 3 folds),0.985 +/- 0.005 (in 3 folds),0.985 +/- 0.005 (in 3 folds),0.933 +/- 0.016 (in 3 folds),0.839 +/- 0.041 (in 3 folds),0.933,0.839,0.911 +/- 0.020 (in 3 folds),0.793 +/- 0.049 (in 3 folds),0.023 +/- 0.008 (in 3 folds),0.911,0.792,0.023,Unknown,208,5,213,0.023474,False,,,,
xgboost,0.955 +/- 0.005 (in 3 folds),0.955 +/- 0.005 (in 3 folds),0.976 +/- 0.006 (in 3 folds),0.976 +/- 0.006 (in 3 folds),0.918 +/- 0.029 (in 3 folds),0.804 +/- 0.073 (in 3 folds),0.918,0.803,0.897 +/- 0.031 (in 3 folds),0.759 +/- 0.076 (in 3 folds),0.023 +/- 0.008 (in 3 folds),0.897,0.759,0.023,Unknown,208,5,213,0.023474,False,,,,
rf_multiclass,0.932 +/- 0.010 (in 3 folds),0.932 +/- 0.010 (in 3 folds),0.961 +/- 0.002 (in 3 folds),0.961 +/- 0.002 (in 3 folds),0.914 +/- 0.029 (in 3 folds),0.795 +/- 0.068 (in 3 folds),0.914,0.791,0.897 +/- 0.018 (in 3 folds),0.759 +/- 0.045 (in 3 folds),0.028 +/- 0.000 (in 2 folds),0.897,0.754,0.019,Unknown,209,4,213,0.018779,False,0.922 +/- 0.000 (in 1 folds),0.922 +/- 0.000 (in 1 folds),0.962 +/- 0.000 (in 1 folds),0.962 +/- 0.000 (in 1 folds)
dummy_most_frequent,0.500 +/- 0.000 (in 3 folds),0.500 +/- 0.000 (in 3 folds),0.701 +/- 0.006 (in 3 folds),0.701 +/- 0.006 (in 3 folds),0.701 +/- 0.006 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.701,0.0,0.695 +/- 0.014 (in 3 folds),0.012 +/- 0.021 (in 3 folds),0.028 +/- 0.000 (in 1 folds),0.695,0.021,0.009,Unknown,211,2,213,0.00939,True,0.500 +/- 0.000 (in 2 folds),0.500 +/- 0.000 (in 2 folds),0.702 +/- 0.009 (in 2 folds),0.702 +/- 0.009 (in 2 folds)
dummy_stratified,0.493 +/- 0.051 (in 3 folds),0.493 +/- 0.051 (in 3 folds),0.664 +/- 0.029 (in 3 folds),0.664 +/- 0.029 (in 3 folds),0.556 +/- 0.039 (in 3 folds),-0.016 +/- 0.105 (in 3 folds),0.556,-0.017,0.469 +/- 0.015 (in 3 folds),-0.038 +/- 0.091 (in 3 folds),0.154 +/- 0.046 (in 3 folds),0.469,-0.034,0.155,Unknown,180,33,213,0.15493,False,,,,


elasticnet_cv,ridge_cv,linearsvm_ovr,lasso_cv
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.975 +/- 0.008 (in 3 folds) ROC-AUC (macro OvO): 0.975 +/- 0.008 (in 3 folds) au-PRC (weighted OvO): 0.987 +/- 0.006 (in 3 folds) au-PRC (macro OvO): 0.987 +/- 0.006 (in 3 folds) Accuracy: 0.811 +/- 0.087 (in 3 folds) MCC: 0.539 +/- 0.236 (in 3 folds) Global scores without abstention: Accuracy: 0.808 MCC: 0.556 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.752 +/- 0.066 (in 3 folds) MCC: 0.386 +/- 0.237 (in 3 folds) Unknown/abstention proportion: 0.071 +/- 0.030 (in 3 folds) Global scores with abstention: Accuracy: 0.751 MCC: 0.402 Unknown/abstention proportion: 0.070 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  HIV 1.00 0.39 0.56 64 Healthy/Background 0.78 0.91 0.84 149  Unknown 0.00 0.00 0.00 0  accuracy 0.75 213  macro avg 0.59 0.43 0.47 213  weighted avg 0.85 0.75 0.76 213,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.973 +/- 0.005 (in 3 folds) ROC-AUC (macro OvO): 0.973 +/- 0.005 (in 3 folds) au-PRC (weighted OvO): 0.988 +/- 0.003 (in 3 folds) au-PRC (macro OvO): 0.988 +/- 0.003 (in 3 folds) Accuracy: 0.701 +/- 0.006 (in 3 folds) MCC: 0.000 +/- 0.000 (in 3 folds) Global scores without abstention: Accuracy: 0.701 MCC: 0.000 Per-fold scores with abstention (note that abstentions not included in probability-based scores): ROC-AUC (weighted OvO): 0.972 +/- 0.007 (in 2 folds) ROC-AUC (macro OvO): 0.972 +/- 0.007 (in 2 folds) au-PRC (weighted OvO): 0.988 +/- 0.004 (in 2 folds) au-PRC (macro OvO): 0.988 +/- 0.004 (in 2 folds) Accuracy: 0.695 +/- 0.014 (in 3 folds) MCC: 0.012 +/- 0.021 (in 3 folds) Unknown/abstention proportion: 0.028 +/- 0.000 (in 1 folds) Global scores with abstention: Accuracy: 0.695 MCC: 0.021 Unknown/abstention proportion: 0.009 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  HIV 0.00 
0.00 0.00 64 Healthy/Background 0.70 0.99 0.82 149  Unknown 0.00 0.00 0.00 0  accuracy 0.69 213  macro avg 0.23 0.33 0.27 213  weighted avg 0.49 0.69 0.58 213,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.971 +/- 0.009 (in 3 folds) ROC-AUC (macro OvO): 0.971 +/- 0.009 (in 3 folds) au-PRC (weighted OvO): 0.986 +/- 0.006 (in 3 folds) au-PRC (macro OvO): 0.986 +/- 0.006 (in 3 folds) Accuracy: 0.924 +/- 0.015 (in 3 folds) MCC: 0.821 +/- 0.034 (in 3 folds) Global scores without abstention: Accuracy: 0.924 MCC: 0.816 Per-fold scores with abstention (note that abstentions not included in probability-based scores): ROC-AUC (weighted OvO): 0.979 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.979 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.991 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.991 +/- 0.000 (in 1 folds) Accuracy: 0.911 +/- 0.020 (in 3 folds) MCC: 0.795 +/- 0.037 (in 3 folds) Unknown/abstention proportion: 0.021 +/- 0.009 (in 2 folds) Global scores with abstention: Accuracy: 0.911 MCC: 0.788 Unknown/abstention proportion: 0.014 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  HIV 0.91 0.81 0.86 64 Healthy/Background 0.93 0.95 0.94 149  Unknown 0.00 0.00 0.00 0  accuracy 0.91 213  macro avg 0.61 0.59 0.60 213  weighted avg 0.92 0.91 0.92 213,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.969 +/- 0.015 (in 3 folds) ROC-AUC (macro OvO): 0.969 +/- 0.015 (in 3 folds) au-PRC (weighted OvO): 0.985 +/- 0.009 (in 3 folds) au-PRC (macro OvO): 0.985 +/- 0.009 (in 3 folds) Accuracy: 0.887 +/- 0.009 (in 3 folds) MCC: 0.736 +/- 0.016 (in 3 folds) Global scores without abstention: Accuracy: 0.887 MCC: 0.735 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.850 +/- 0.032 (in 3 folds) MCC: 0.649 +/- 0.072 (in 3 folds) Unknown/abstention proportion: 0.042 +/- 0.027 (in 3 folds) Global scores with abstention: Accuracy: 0.850 MCC: 
0.646 Unknown/abstention proportion: 0.042 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  HIV 0.98 0.64 0.77 64 Healthy/Background 0.86 0.94 0.90 149  Unknown 0.00 0.00 0.00 0  accuracy 0.85 213  macro avg 0.61 0.53 0.56 213  weighted avg 0.90 0.85 0.86 213
,,,


lasso_multiclass,xgboost,rf_multiclass,dummy_most_frequent
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.969 +/- 0.006 (in 3 folds) ROC-AUC (macro OvO): 0.969 +/- 0.006 (in 3 folds) au-PRC (weighted OvO): 0.985 +/- 0.005 (in 3 folds) au-PRC (macro OvO): 0.985 +/- 0.005 (in 3 folds) Accuracy: 0.933 +/- 0.016 (in 3 folds) MCC: 0.839 +/- 0.041 (in 3 folds) Global scores without abstention: Accuracy: 0.933 MCC: 0.839 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.911 +/- 0.020 (in 3 folds) MCC: 0.793 +/- 0.049 (in 3 folds) Unknown/abstention proportion: 0.023 +/- 0.008 (in 3 folds) Global scores with abstention: Accuracy: 0.911 MCC: 0.792 Unknown/abstention proportion: 0.023 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  HIV 0.92 0.84 0.88 64 Healthy/Background 0.94 0.94 0.94 149  Unknown 0.00 0.00 0.00 0  accuracy 0.91 213  macro avg 0.62 0.59 0.61 213  weighted avg 0.93 0.91 0.92 213,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.955 +/- 0.005 (in 3 folds) ROC-AUC (macro OvO): 0.955 +/- 0.005 (in 3 folds) au-PRC (weighted OvO): 0.976 +/- 0.006 (in 3 folds) au-PRC (macro OvO): 0.976 +/- 0.006 (in 3 folds) Accuracy: 0.918 +/- 0.029 (in 3 folds) MCC: 0.804 +/- 0.073 (in 3 folds) Global scores without abstention: Accuracy: 0.918 MCC: 0.803 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.897 +/- 0.031 (in 3 folds) MCC: 0.759 +/- 0.076 (in 3 folds) Unknown/abstention proportion: 0.023 +/- 0.008 (in 3 folds) Global scores with abstention: Accuracy: 0.897 MCC: 0.759 Unknown/abstention proportion: 0.023 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  HIV 0.90 0.81 0.85 64 Healthy/Background 0.93 0.93 0.93 149  Unknown 0.00 0.00 0.00 0  accuracy 0.90 213  macro avg 0.61 0.58 0.59 213  weighted avg 0.92 0.90 0.91 213,Per-fold scores without abstention: ROC-AUC 
(weighted OvO): 0.932 +/- 0.010 (in 3 folds) ROC-AUC (macro OvO): 0.932 +/- 0.010 (in 3 folds) au-PRC (weighted OvO): 0.961 +/- 0.002 (in 3 folds) au-PRC (macro OvO): 0.961 +/- 0.002 (in 3 folds) Accuracy: 0.914 +/- 0.029 (in 3 folds) MCC: 0.795 +/- 0.068 (in 3 folds) Global scores without abstention: Accuracy: 0.914 MCC: 0.791 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.897 +/- 0.018 (in 3 folds) MCC: 0.759 +/- 0.045 (in 3 folds) Unknown/abstention proportion: 0.028 +/- 0.000 (in 2 folds) ROC-AUC (weighted OvO): 0.922 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.922 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.962 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.962 +/- 0.000 (in 1 folds) Global scores with abstention: Accuracy: 0.897 MCC: 0.754 Unknown/abstention proportion: 0.019 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  HIV 0.92 0.77 0.84 64 Healthy/Background 0.91 0.95 0.93 149  Unknown 0.00 0.00 0.00 0  accuracy 0.90 213  macro avg 0.61 0.57 0.59 213  weighted avg 0.91 0.90 0.90 213,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.500 +/- 0.000 (in 3 folds) ROC-AUC (macro OvO): 0.500 +/- 0.000 (in 3 folds) au-PRC (weighted OvO): 0.701 +/- 0.006 (in 3 folds) au-PRC (macro OvO): 0.701 +/- 0.006 (in 3 folds) Accuracy: 0.701 +/- 0.006 (in 3 folds) MCC: 0.000 +/- 0.000 (in 3 folds) Global scores without abstention: Accuracy: 0.701 MCC: 0.000 Per-fold scores with abstention (note that abstentions not included in probability-based scores): ROC-AUC (weighted OvO): 0.500 +/- 0.000 (in 2 folds) ROC-AUC (macro OvO): 0.500 +/- 0.000 (in 2 folds) au-PRC (weighted OvO): 0.702 +/- 0.009 (in 2 folds) au-PRC (macro OvO): 0.702 +/- 0.009 (in 2 folds) Accuracy: 0.695 +/- 0.014 (in 3 folds) MCC: 0.012 +/- 0.021 (in 3 folds) Unknown/abstention proportion: 0.028 +/- 0.000 (in 1 folds) Global scores with abstention: Accuracy: 0.695 MCC: 
0.021 Unknown/abstention proportion: 0.009 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  HIV 0.00 0.00 0.00 64 Healthy/Background 0.70 0.99 0.82 149  Unknown 0.00 0.00 0.00 0  accuracy 0.69 213  macro avg 0.23 0.33 0.27 213  weighted avg 0.49 0.69 0.58 213
,,,


dummy_stratified
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.493 +/- 0.051 (in 3 folds) ROC-AUC (macro OvO): 0.493 +/- 0.051 (in 3 folds) au-PRC (weighted OvO): 0.664 +/- 0.029 (in 3 folds) au-PRC (macro OvO): 0.664 +/- 0.029 (in 3 folds) Accuracy: 0.556 +/- 0.039 (in 3 folds) MCC: -0.016 +/- 0.105 (in 3 folds) Global scores without abstention: Accuracy: 0.556 MCC: -0.017 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.469 +/- 0.015 (in 3 folds) MCC: -0.038 +/- 0.091 (in 3 folds) Unknown/abstention proportion: 0.154 +/- 0.046 (in 3 folds) Global scores with abstention: Accuracy: 0.469 MCC: -0.034 Unknown/abstention proportion: 0.155 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  HIV 0.32 0.28 0.30 64 Healthy/Background 0.66 0.55 0.60 149  Unknown 0.00 0.00 0.00 0  accuracy 0.47 213  macro avg 0.33 0.28 0.30 213  weighted avg 0.56 0.47 0.51 213


## Apply train-smaller model -- Test set performance - With and without tuning on validation set

Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,Global evaluation column name global,Accuracy per fold with abstention,MCC per fold with abstention,Unknown/abstention proportion per fold with abstention,Accuracy global with abstention,MCC global with abstention,Unknown/abstention proportion global with abstention,Abstention label global with abstention,Global evaluation column name global with abstention,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes,ROC-AUC (weighted OvO) per fold with abstention,ROC-AUC (macro OvO) per fold with abstention,au-PRC (weighted OvO) per fold with abstention,au-PRC (macro OvO) per fold with abstention
elasticnet_cv,0.981 +/- 0.013 (in 3 folds),0.981 +/- 0.013 (in 3 folds),0.990 +/- 0.007 (in 3 folds),0.990 +/- 0.007 (in 3 folds),0.805 +/- 0.088 (in 3 folds),0.531 +/- 0.226 (in 3 folds),0.805,0.545,disease.separate_past_exposures,0.777 +/- 0.077 (in 3 folds),0.437 +/- 0.229 (in 3 folds),0.034 +/- 0.010 (in 3 folds),0.777,0.457,0.034,Unknown,disease.separate_past_exposures,308.0,11.0,319.0,0.034483,False,,,,
elasticnet_cv.decision_thresholds_tuned,0.981 +/- 0.013 (in 3 folds),0.981 +/- 0.013 (in 3 folds),0.990 +/- 0.007 (in 3 folds),0.990 +/- 0.007 (in 3 folds),0.932 +/- 0.018 (in 3 folds),0.850 +/- 0.036 (in 3 folds),0.932,0.847,disease.separate_past_exposures,0.900 +/- 0.023 (in 3 folds),0.789 +/- 0.051 (in 3 folds),0.034 +/- 0.010 (in 3 folds),0.9,0.787,0.034,Unknown,disease.separate_past_exposures,308.0,11.0,319.0,0.034483,False,,,,
ridge_cv,0.981 +/- 0.007 (in 3 folds),0.981 +/- 0.007 (in 3 folds),0.992 +/- 0.002 (in 3 folds),0.992 +/- 0.002 (in 3 folds),0.690 +/- 0.004 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.69,0.0,disease.separate_past_exposures,0.683 +/- 0.010 (in 3 folds),-0.026 +/- 0.024 (in 3 folds),0.014 +/- 0.007 (in 2 folds),0.683,-0.032,0.009,Unknown,disease.separate_past_exposures,316.0,3.0,319.0,0.009404,True,0.981 +/- 0.000 (in 1 folds),0.981 +/- 0.000 (in 1 folds),0.992 +/- 0.000 (in 1 folds),0.992 +/- 0.000 (in 1 folds)
ridge_cv.decision_thresholds_tuned,0.981 +/- 0.007 (in 3 folds),0.981 +/- 0.007 (in 3 folds),0.992 +/- 0.002 (in 3 folds),0.992 +/- 0.002 (in 3 folds),0.690 +/- 0.004 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.69,0.0,disease.separate_past_exposures,0.683 +/- 0.010 (in 3 folds),-0.026 +/- 0.024 (in 3 folds),0.014 +/- 0.007 (in 2 folds),0.683,-0.032,0.009,Unknown,disease.separate_past_exposures,316.0,3.0,319.0,0.009404,True,0.981 +/- 0.000 (in 1 folds),0.981 +/- 0.000 (in 1 folds),0.992 +/- 0.000 (in 1 folds),0.992 +/- 0.000 (in 1 folds)
lasso_cv,0.979 +/- 0.014 (in 3 folds),0.979 +/- 0.014 (in 3 folds),0.990 +/- 0.006 (in 3 folds),0.990 +/- 0.006 (in 3 folds),0.878 +/- 0.023 (in 3 folds),0.718 +/- 0.053 (in 3 folds),0.878,0.716,disease.separate_past_exposures,0.856 +/- 0.022 (in 3 folds),0.659 +/- 0.054 (in 3 folds),0.025 +/- 0.006 (in 3 folds),0.856,0.659,0.025,Unknown,disease.separate_past_exposures,311.0,8.0,319.0,0.025078,False,,,,
lasso_cv.decision_thresholds_tuned,0.979 +/- 0.014 (in 3 folds),0.979 +/- 0.014 (in 3 folds),0.990 +/- 0.006 (in 3 folds),0.990 +/- 0.006 (in 3 folds),0.907 +/- 0.026 (in 3 folds),0.790 +/- 0.071 (in 3 folds),0.907,0.786,disease.separate_past_exposures,0.884 +/- 0.020 (in 3 folds),0.746 +/- 0.063 (in 3 folds),0.025 +/- 0.006 (in 3 folds),0.884,0.743,0.025,Unknown,disease.separate_past_exposures,311.0,8.0,319.0,0.025078,False,,,,
linearsvm_ovr,0.978 +/- 0.010 (in 3 folds),0.978 +/- 0.010 (in 3 folds),0.990 +/- 0.004 (in 3 folds),0.990 +/- 0.004 (in 3 folds),0.911 +/- 0.029 (in 3 folds),0.789 +/- 0.070 (in 3 folds),0.911,0.789,disease.separate_past_exposures,0.900 +/- 0.028 (in 3 folds),0.764 +/- 0.066 (in 3 folds),0.019 +/- 0.000 (in 2 folds),0.9,0.763,0.013,Unknown,disease.separate_past_exposures,315.0,4.0,319.0,0.012539,False,0.982 +/- 0.000 (in 1 folds),0.982 +/- 0.000 (in 1 folds),0.992 +/- 0.000 (in 1 folds),0.992 +/- 0.000 (in 1 folds)
linearsvm_ovr.decision_thresholds_tuned,0.978 +/- 0.010 (in 3 folds),0.978 +/- 0.010 (in 3 folds),0.990 +/- 0.004 (in 3 folds),0.990 +/- 0.004 (in 3 folds),0.918 +/- 0.028 (in 3 folds),0.807 +/- 0.071 (in 3 folds),0.917,0.805,disease.separate_past_exposures,0.906 +/- 0.031 (in 3 folds),0.782 +/- 0.075 (in 3 folds),0.019 +/- 0.000 (in 2 folds),0.906,0.779,0.013,Unknown,disease.separate_past_exposures,315.0,4.0,319.0,0.012539,False,0.982 +/- 0.000 (in 1 folds),0.982 +/- 0.000 (in 1 folds),0.992 +/- 0.000 (in 1 folds),0.992 +/- 0.000 (in 1 folds)
lasso_multiclass,0.977 +/- 0.013 (in 3 folds),0.977 +/- 0.013 (in 3 folds),0.990 +/- 0.006 (in 3 folds),0.990 +/- 0.006 (in 3 folds),0.908 +/- 0.026 (in 3 folds),0.782 +/- 0.064 (in 3 folds),0.907,0.781,disease.separate_past_exposures,0.890 +/- 0.025 (in 3 folds),0.747 +/- 0.062 (in 3 folds),0.019 +/- 0.000 (in 3 folds),0.89,0.746,0.019,Unknown,disease.separate_past_exposures,313.0,6.0,319.0,0.018809,False,,,,
lasso_multiclass.decision_thresholds_tuned,0.977 +/- 0.013 (in 3 folds),0.977 +/- 0.013 (in 3 folds),0.990 +/- 0.006 (in 3 folds),0.990 +/- 0.006 (in 3 folds),0.917 +/- 0.035 (in 3 folds),0.810 +/- 0.088 (in 3 folds),0.917,0.805,disease.separate_past_exposures,0.900 +/- 0.034 (in 3 folds),0.774 +/- 0.085 (in 3 folds),0.019 +/- 0.000 (in 3 folds),0.9,0.769,0.019,Unknown,disease.separate_past_exposures,313.0,6.0,319.0,0.018809,False,,,,

Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,Global evaluation column name global,Accuracy per fold with abstention,MCC per fold with abstention,Unknown/abstention proportion per fold with abstention,Accuracy global with abstention,MCC global with abstention,Unknown/abstention proportion global with abstention,Abstention label global with abstention,Global evaluation column name global with abstention,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes,ROC-AUC (weighted OvO) per fold with abstention,ROC-AUC (macro OvO) per fold with abstention,au-PRC (weighted OvO) per fold with abstention,au-PRC (macro OvO) per fold with abstention
elasticnet_cv,0.981 +/- 0.013 (in 3 folds),0.981 +/- 0.013 (in 3 folds),0.990 +/- 0.007 (in 3 folds),0.990 +/- 0.007 (in 3 folds),0.805 +/- 0.088 (in 3 folds),0.531 +/- 0.226 (in 3 folds),0.805,0.545,disease.separate_past_exposures,0.777 +/- 0.077 (in 3 folds),0.437 +/- 0.229 (in 3 folds),0.034 +/- 0.010 (in 3 folds),0.777,0.457,0.034,Unknown,disease.separate_past_exposures,308,11,319,0.034483,False,,,,
elasticnet_cv.decision_thresholds_tuned,0.981 +/- 0.013 (in 3 folds),0.981 +/- 0.013 (in 3 folds),0.990 +/- 0.007 (in 3 folds),0.990 +/- 0.007 (in 3 folds),0.932 +/- 0.018 (in 3 folds),0.850 +/- 0.036 (in 3 folds),0.932,0.847,disease.separate_past_exposures,0.900 +/- 0.023 (in 3 folds),0.789 +/- 0.051 (in 3 folds),0.034 +/- 0.010 (in 3 folds),0.9,0.787,0.034,Unknown,disease.separate_past_exposures,308,11,319,0.034483,False,,,,
ridge_cv,0.981 +/- 0.007 (in 3 folds),0.981 +/- 0.007 (in 3 folds),0.992 +/- 0.002 (in 3 folds),0.992 +/- 0.002 (in 3 folds),0.690 +/- 0.004 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.69,0.0,disease.separate_past_exposures,0.683 +/- 0.010 (in 3 folds),-0.026 +/- 0.024 (in 3 folds),0.014 +/- 0.007 (in 2 folds),0.683,-0.032,0.009,Unknown,disease.separate_past_exposures,316,3,319,0.009404,True,0.981 +/- 0.000 (in 1 folds),0.981 +/- 0.000 (in 1 folds),0.992 +/- 0.000 (in 1 folds),0.992 +/- 0.000 (in 1 folds)
ridge_cv.decision_thresholds_tuned,0.981 +/- 0.007 (in 3 folds),0.981 +/- 0.007 (in 3 folds),0.992 +/- 0.002 (in 3 folds),0.992 +/- 0.002 (in 3 folds),0.690 +/- 0.004 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.69,0.0,disease.separate_past_exposures,0.683 +/- 0.010 (in 3 folds),-0.026 +/- 0.024 (in 3 folds),0.014 +/- 0.007 (in 2 folds),0.683,-0.032,0.009,Unknown,disease.separate_past_exposures,316,3,319,0.009404,True,0.981 +/- 0.000 (in 1 folds),0.981 +/- 0.000 (in 1 folds),0.992 +/- 0.000 (in 1 folds),0.992 +/- 0.000 (in 1 folds)
lasso_cv,0.979 +/- 0.014 (in 3 folds),0.979 +/- 0.014 (in 3 folds),0.990 +/- 0.006 (in 3 folds),0.990 +/- 0.006 (in 3 folds),0.878 +/- 0.023 (in 3 folds),0.718 +/- 0.053 (in 3 folds),0.878,0.716,disease.separate_past_exposures,0.856 +/- 0.022 (in 3 folds),0.659 +/- 0.054 (in 3 folds),0.025 +/- 0.006 (in 3 folds),0.856,0.659,0.025,Unknown,disease.separate_past_exposures,311,8,319,0.025078,False,,,,
lasso_cv.decision_thresholds_tuned,0.979 +/- 0.014 (in 3 folds),0.979 +/- 0.014 (in 3 folds),0.990 +/- 0.006 (in 3 folds),0.990 +/- 0.006 (in 3 folds),0.907 +/- 0.026 (in 3 folds),0.790 +/- 0.071 (in 3 folds),0.907,0.786,disease.separate_past_exposures,0.884 +/- 0.020 (in 3 folds),0.746 +/- 0.063 (in 3 folds),0.025 +/- 0.006 (in 3 folds),0.884,0.743,0.025,Unknown,disease.separate_past_exposures,311,8,319,0.025078,False,,,,
linearsvm_ovr,0.978 +/- 0.010 (in 3 folds),0.978 +/- 0.010 (in 3 folds),0.990 +/- 0.004 (in 3 folds),0.990 +/- 0.004 (in 3 folds),0.911 +/- 0.029 (in 3 folds),0.789 +/- 0.070 (in 3 folds),0.911,0.789,disease.separate_past_exposures,0.900 +/- 0.028 (in 3 folds),0.764 +/- 0.066 (in 3 folds),0.019 +/- 0.000 (in 2 folds),0.9,0.763,0.013,Unknown,disease.separate_past_exposures,315,4,319,0.012539,False,0.982 +/- 0.000 (in 1 folds),0.982 +/- 0.000 (in 1 folds),0.992 +/- 0.000 (in 1 folds),0.992 +/- 0.000 (in 1 folds)
linearsvm_ovr.decision_thresholds_tuned,0.978 +/- 0.010 (in 3 folds),0.978 +/- 0.010 (in 3 folds),0.990 +/- 0.004 (in 3 folds),0.990 +/- 0.004 (in 3 folds),0.918 +/- 0.028 (in 3 folds),0.807 +/- 0.071 (in 3 folds),0.917,0.805,disease.separate_past_exposures,0.906 +/- 0.031 (in 3 folds),0.782 +/- 0.075 (in 3 folds),0.019 +/- 0.000 (in 2 folds),0.906,0.779,0.013,Unknown,disease.separate_past_exposures,315,4,319,0.012539,False,0.982 +/- 0.000 (in 1 folds),0.982 +/- 0.000 (in 1 folds),0.992 +/- 0.000 (in 1 folds),0.992 +/- 0.000 (in 1 folds)
lasso_multiclass,0.977 +/- 0.013 (in 3 folds),0.977 +/- 0.013 (in 3 folds),0.990 +/- 0.006 (in 3 folds),0.990 +/- 0.006 (in 3 folds),0.908 +/- 0.026 (in 3 folds),0.782 +/- 0.064 (in 3 folds),0.907,0.781,disease.separate_past_exposures,0.890 +/- 0.025 (in 3 folds),0.747 +/- 0.062 (in 3 folds),0.019 +/- 0.000 (in 3 folds),0.89,0.746,0.019,Unknown,disease.separate_past_exposures,313,6,319,0.018809,False,,,,
lasso_multiclass.decision_thresholds_tuned,0.977 +/- 0.013 (in 3 folds),0.977 +/- 0.013 (in 3 folds),0.990 +/- 0.006 (in 3 folds),0.990 +/- 0.006 (in 3 folds),0.917 +/- 0.035 (in 3 folds),0.810 +/- 0.088 (in 3 folds),0.917,0.805,disease.separate_past_exposures,0.900 +/- 0.034 (in 3 folds),0.774 +/- 0.085 (in 3 folds),0.019 +/- 0.000 (in 3 folds),0.9,0.769,0.019,Unknown,disease.separate_past_exposures,313,6,319,0.018809,False,,,,


elasticnet_cv,elasticnet_cv.decision_thresholds_tuned,ridge_cv,ridge_cv.decision_thresholds_tuned
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.981 +/- 0.013 (in 3 folds) ROC-AUC (macro OvO): 0.981 +/- 0.013 (in 3 folds) au-PRC (weighted OvO): 0.990 +/- 0.007 (in 3 folds) au-PRC (macro OvO): 0.990 +/- 0.007 (in 3 folds) Accuracy: 0.805 +/- 0.088 (in 3 folds) MCC: 0.531 +/- 0.226 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.805 MCC: 0.545 Global evaluation column name: disease.separate_past_exposures Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.777 +/- 0.077 (in 3 folds) MCC: 0.437 +/- 0.229 (in 3 folds) Unknown/abstention proportion: 0.034 +/- 0.010 (in 3 folds) Global scores with abstention using column name disease.separate_past_exposures: Accuracy: 0.777 MCC: 0.457 Unknown/abstention proportion: 0.034 Abstention label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support  HIV 0.97 0.40 0.57 98 Healthy/Background 0.78 0.95 0.85 221  Unknown 0.00 0.00 0.00 0  accuracy 0.78 319  macro avg 0.58 0.45 0.47 319  weighted avg 0.84 0.78 0.77 319,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.981 +/- 0.013 (in 3 folds) ROC-AUC (macro OvO): 0.981 +/- 0.013 (in 3 folds) au-PRC (weighted OvO): 0.990 +/- 0.007 (in 3 folds) au-PRC (macro OvO): 0.990 +/- 0.007 (in 3 folds) Accuracy: 0.932 +/- 0.018 (in 3 folds) MCC: 0.850 +/- 0.036 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.932 MCC: 0.847 Global evaluation column name: disease.separate_past_exposures Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.900 +/- 0.023 (in 3 folds) MCC: 0.789 +/- 0.051 (in 3 folds) Unknown/abstention proportion: 0.034 +/- 0.010 (in 3 folds) Global scores with abstention 
using column name disease.separate_past_exposures: Accuracy: 0.900 MCC: 0.787 Unknown/abstention proportion: 0.034 Abstention label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support  HIV 0.87 0.93 0.90 98 Healthy/Background 0.97 0.89 0.92 221  Unknown 0.00 0.00 0.00 0  accuracy 0.90 319  macro avg 0.61 0.61 0.61 319  weighted avg 0.94 0.90 0.92 319,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.981 +/- 0.007 (in 3 folds) ROC-AUC (macro OvO): 0.981 +/- 0.007 (in 3 folds) au-PRC (weighted OvO): 0.992 +/- 0.002 (in 3 folds) au-PRC (macro OvO): 0.992 +/- 0.002 (in 3 folds) Accuracy: 0.690 +/- 0.004 (in 3 folds) MCC: 0.000 +/- 0.000 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.690 MCC: 0.000 Global evaluation column name: disease.separate_past_exposures Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.683 +/- 0.010 (in 3 folds) MCC: -0.026 +/- 0.024 (in 3 folds) Unknown/abstention proportion: 0.014 +/- 0.007 (in 2 folds) ROC-AUC (weighted OvO): 0.981 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.981 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.992 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.992 +/- 0.000 (in 1 folds) Global scores with abstention using column name disease.separate_past_exposures: Accuracy: 0.683 MCC: -0.032 Unknown/abstention proportion: 0.009 Abstention label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support  HIV 0.00 0.00 0.00 98 Healthy/Background 0.69 0.99 0.81 221  Unknown 0.00 0.00 0.00 0  accuracy 0.68 319  macro avg 0.23 0.33 0.27 319  weighted avg 0.48 0.68 0.56 319,Per-fold scores without abstention: 
ROC-AUC (weighted OvO): 0.981 +/- 0.007 (in 3 folds) ROC-AUC (macro OvO): 0.981 +/- 0.007 (in 3 folds) au-PRC (weighted OvO): 0.992 +/- 0.002 (in 3 folds) au-PRC (macro OvO): 0.992 +/- 0.002 (in 3 folds) Accuracy: 0.690 +/- 0.004 (in 3 folds) MCC: 0.000 +/- 0.000 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.690 MCC: 0.000 Global evaluation column name: disease.separate_past_exposures Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.683 +/- 0.010 (in 3 folds) MCC: -0.026 +/- 0.024 (in 3 folds) Unknown/abstention proportion: 0.014 +/- 0.007 (in 2 folds) ROC-AUC (weighted OvO): 0.981 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.981 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.992 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.992 +/- 0.000 (in 1 folds) Global scores with abstention using column name disease.separate_past_exposures: Accuracy: 0.683 MCC: -0.032 Unknown/abstention proportion: 0.009 Abstention label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support  HIV 0.00 0.00 0.00 98 Healthy/Background 0.69 0.99 0.81 221  Unknown 0.00 0.00 0.00 0  accuracy 0.68 319  macro avg 0.23 0.33 0.27 319  weighted avg 0.48 0.68 0.56 319
,,,


lasso_cv,lasso_cv.decision_thresholds_tuned,linearsvm_ovr,linearsvm_ovr.decision_thresholds_tuned
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.979 +/- 0.014 (in 3 folds) ROC-AUC (macro OvO): 0.979 +/- 0.014 (in 3 folds) au-PRC (weighted OvO): 0.990 +/- 0.006 (in 3 folds) au-PRC (macro OvO): 0.990 +/- 0.006 (in 3 folds) Accuracy: 0.878 +/- 0.023 (in 3 folds) MCC: 0.718 +/- 0.053 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.878 MCC: 0.716 Global evaluation column name: disease.separate_past_exposures Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.856 +/- 0.022 (in 3 folds) MCC: 0.659 +/- 0.054 (in 3 folds) Unknown/abstention proportion: 0.025 +/- 0.006 (in 3 folds) Global scores with abstention using column name disease.separate_past_exposures: Accuracy: 0.856 MCC: 0.659 Unknown/abstention proportion: 0.025 Abstention label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support  HIV 0.97 0.63 0.77 98 Healthy/Background 0.85 0.95 0.90 221  Unknown 0.00 0.00 0.00 0  accuracy 0.86 319  macro avg 0.61 0.53 0.56 319  weighted avg 0.89 0.86 0.86 319,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.979 +/- 0.014 (in 3 folds) ROC-AUC (macro OvO): 0.979 +/- 0.014 (in 3 folds) au-PRC (weighted OvO): 0.990 +/- 0.006 (in 3 folds) au-PRC (macro OvO): 0.990 +/- 0.006 (in 3 folds) Accuracy: 0.907 +/- 0.026 (in 3 folds) MCC: 0.790 +/- 0.071 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.907 MCC: 0.786 Global evaluation column name: disease.separate_past_exposures Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.884 +/- 0.020 (in 3 folds) MCC: 0.746 +/- 0.063 (in 3 folds) Unknown/abstention proportion: 0.025 +/- 0.006 (in 3 folds) Global scores with abstention 
using column name disease.separate_past_exposures: Accuracy: 0.884 MCC: 0.743 Unknown/abstention proportion: 0.025 Abstention label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support  HIV 0.84 0.87 0.85 98 Healthy/Background 0.94 0.89 0.91 221  Unknown 0.00 0.00 0.00 0  accuracy 0.88 319  macro avg 0.59 0.59 0.59 319  weighted avg 0.91 0.88 0.90 319,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.978 +/- 0.010 (in 3 folds) ROC-AUC (macro OvO): 0.978 +/- 0.010 (in 3 folds) au-PRC (weighted OvO): 0.990 +/- 0.004 (in 3 folds) au-PRC (macro OvO): 0.990 +/- 0.004 (in 3 folds) Accuracy: 0.911 +/- 0.029 (in 3 folds) MCC: 0.789 +/- 0.070 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.911 MCC: 0.789 Global evaluation column name: disease.separate_past_exposures Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.900 +/- 0.028 (in 3 folds) MCC: 0.764 +/- 0.066 (in 3 folds) Unknown/abstention proportion: 0.019 +/- 0.000 (in 2 folds) ROC-AUC (weighted OvO): 0.982 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.982 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.992 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.992 +/- 0.000 (in 1 folds) Global scores with abstention using column name disease.separate_past_exposures: Accuracy: 0.900 MCC: 0.763 Unknown/abstention proportion: 0.013 Abstention label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support  HIV 0.92 0.79 0.85 98 Healthy/Background 0.91 0.95 0.93 221  Unknown 0.00 0.00 0.00 0  accuracy 0.90 319  macro avg 0.61 0.58 0.59 319  weighted avg 0.91 0.90 0.90 319,Per-fold scores without abstention: 
ROC-AUC (weighted OvO): 0.978 +/- 0.010 (in 3 folds) ROC-AUC (macro OvO): 0.978 +/- 0.010 (in 3 folds) au-PRC (weighted OvO): 0.990 +/- 0.004 (in 3 folds) au-PRC (macro OvO): 0.990 +/- 0.004 (in 3 folds) Accuracy: 0.918 +/- 0.028 (in 3 folds) MCC: 0.807 +/- 0.071 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.917 MCC: 0.805 Global evaluation column name: disease.separate_past_exposures Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.906 +/- 0.031 (in 3 folds) MCC: 0.782 +/- 0.075 (in 3 folds) Unknown/abstention proportion: 0.019 +/- 0.000 (in 2 folds) ROC-AUC (weighted OvO): 0.982 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.982 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.992 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.992 +/- 0.000 (in 1 folds) Global scores with abstention using column name disease.separate_past_exposures: Accuracy: 0.906 MCC: 0.779 Unknown/abstention proportion: 0.013 Abstention label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support  HIV 0.90 0.83 0.86 98 Healthy/Background 0.92 0.94 0.93 221  Unknown 0.00 0.00 0.00 0  accuracy 0.91 319  macro avg 0.61 0.59 0.60 319  weighted avg 0.92 0.91 0.91 319
,,,


lasso_multiclass,lasso_multiclass.decision_thresholds_tuned,rf_multiclass,rf_multiclass.decision_thresholds_tuned
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.977 +/- 0.013 (in 3 folds) ROC-AUC (macro OvO): 0.977 +/- 0.013 (in 3 folds) au-PRC (weighted OvO): 0.990 +/- 0.006 (in 3 folds) au-PRC (macro OvO): 0.990 +/- 0.006 (in 3 folds) Accuracy: 0.908 +/- 0.026 (in 3 folds) MCC: 0.782 +/- 0.064 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.907 MCC: 0.781 Global evaluation column name: disease.separate_past_exposures Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.890 +/- 0.025 (in 3 folds) MCC: 0.747 +/- 0.062 (in 3 folds) Unknown/abstention proportion: 0.019 +/- 0.000 (in 3 folds) Global scores with abstention using column name disease.separate_past_exposures: Accuracy: 0.890 MCC: 0.746 Unknown/abstention proportion: 0.019 Abstention label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support  HIV 0.88 0.82 0.85 98 Healthy/Background 0.92 0.92 0.92 221  Unknown 0.00 0.00 0.00 0  accuracy 0.89 319  macro avg 0.60 0.58 0.59 319  weighted avg 0.91 0.89 0.90 319,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.977 +/- 0.013 (in 3 folds) ROC-AUC (macro OvO): 0.977 +/- 0.013 (in 3 folds) au-PRC (weighted OvO): 0.990 +/- 0.006 (in 3 folds) au-PRC (macro OvO): 0.990 +/- 0.006 (in 3 folds) Accuracy: 0.917 +/- 0.035 (in 3 folds) MCC: 0.810 +/- 0.088 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.917 MCC: 0.805 Global evaluation column name: disease.separate_past_exposures Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.900 +/- 0.034 (in 3 folds) MCC: 0.774 +/- 0.085 (in 3 folds) Unknown/abstention proportion: 0.019 +/- 0.000 (in 3 folds) Global scores with abstention 
using column name disease.separate_past_exposures: Accuracy: 0.900 MCC: 0.769 Unknown/abstention proportion: 0.019 Abstention label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support  HIV 0.88 0.85 0.86 98 Healthy/Background 0.93 0.92 0.93 221  Unknown 0.00 0.00 0.00 0  accuracy 0.90 319  macro avg 0.60 0.59 0.60 319  weighted avg 0.92 0.90 0.91 319,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.956 +/- 0.025 (in 3 folds) ROC-AUC (macro OvO): 0.956 +/- 0.025 (in 3 folds) au-PRC (weighted OvO): 0.977 +/- 0.012 (in 3 folds) au-PRC (macro OvO): 0.977 +/- 0.012 (in 3 folds) Accuracy: 0.896 +/- 0.056 (in 3 folds) MCC: 0.752 +/- 0.136 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.895 MCC: 0.751 Global evaluation column name: disease.separate_past_exposures Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.881 +/- 0.050 (in 3 folds) MCC: 0.718 +/- 0.127 (in 3 folds) Unknown/abstention proportion: 0.016 +/- 0.006 (in 3 folds) Global scores with abstention using column name disease.separate_past_exposures: Accuracy: 0.881 MCC: 0.717 Unknown/abstention proportion: 0.016 Abstention label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support  HIV 0.93 0.71 0.81 98 Healthy/Background 0.88 0.95 0.92 221  Unknown 0.00 0.00 0.00 0  accuracy 0.88 319  macro avg 0.61 0.56 0.58 319  weighted avg 0.90 0.88 0.88 319,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.956 +/- 0.025 (in 3 folds) ROC-AUC (macro OvO): 0.956 +/- 0.025 (in 3 folds) au-PRC (weighted OvO): 0.977 +/- 0.012 (in 3 folds) au-PRC (macro OvO): 0.977 +/- 0.012 (in 3 folds) 
Accuracy: 0.902 +/- 0.036 (in 3 folds) MCC: 0.773 +/- 0.096 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.901 MCC: 0.766 Global evaluation column name: disease.separate_past_exposures Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.887 +/- 0.031 (in 3 folds) MCC: 0.741 +/- 0.088 (in 3 folds) Unknown/abstention proportion: 0.016 +/- 0.006 (in 3 folds) Global scores with abstention using column name disease.separate_past_exposures: Accuracy: 0.887 MCC: 0.735 Unknown/abstention proportion: 0.016 Abstention label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support  HIV 0.89 0.79 0.83 98 Healthy/Background 0.91 0.93 0.92 221  Unknown 0.00 0.00 0.00 0  accuracy 0.89 319  macro avg 0.60 0.57 0.58 319  weighted avg 0.90 0.89 0.89 319
,,,


xgboost,xgboost.decision_thresholds_tuned
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.953 +/- 0.036 (in 3 folds) ROC-AUC (macro OvO): 0.953 +/- 0.036 (in 3 folds) au-PRC (weighted OvO): 0.976 +/- 0.017 (in 3 folds) au-PRC (macro OvO): 0.976 +/- 0.017 (in 3 folds) Accuracy: 0.901 +/- 0.033 (in 3 folds) MCC: 0.766 +/- 0.081 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.901 MCC: 0.765 Global evaluation column name: disease.separate_past_exposures Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.884 +/- 0.032 (in 3 folds) MCC: 0.730 +/- 0.078 (in 3 folds) Unknown/abstention proportion: 0.019 +/- 0.000 (in 3 folds) Global scores with abstention using column name disease.separate_past_exposures: Accuracy: 0.884 MCC: 0.729 Unknown/abstention proportion: 0.019 Abstention label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support  HIV 0.89 0.79 0.83 98 Healthy/Background 0.91 0.93 0.92 221  Unknown 0.00 0.00 0.00 0  accuracy 0.88 319  macro avg 0.60 0.57 0.58 319  weighted avg 0.90 0.88 0.89 319,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.953 +/- 0.036 (in 3 folds) ROC-AUC (macro OvO): 0.953 +/- 0.036 (in 3 folds) au-PRC (weighted OvO): 0.976 +/- 0.017 (in 3 folds) au-PRC (macro OvO): 0.976 +/- 0.017 (in 3 folds) Accuracy: 0.901 +/- 0.039 (in 3 folds) MCC: 0.773 +/- 0.094 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.901 MCC: 0.769 Global evaluation column name: disease.separate_past_exposures Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.884 +/- 0.038 (in 3 folds) MCC: 0.739 +/- 0.089 (in 3 folds) Unknown/abstention proportion: 0.019 +/- 0.000 (in 3 folds) Global scores with abstention 
using column name disease.separate_past_exposures: Accuracy: 0.884 MCC: 0.736 Unknown/abstention proportion: 0.019 Abstention label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support  HIV 0.85 0.84 0.84 98 Healthy/Background 0.93 0.90 0.92 221  Unknown 0.00 0.00 0.00 0  accuracy 0.88 319  macro avg 0.59 0.58 0.59 319  weighted avg 0.90 0.88 0.89 319
,


---

# GeneLocus.BCR, TargetObsColumnEnum.lupus_vs_healthy trained on train_smaller set

## Specimen predictions on validation set

Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,Accuracy per fold with abstention,MCC per fold with abstention,Unknown/abstention proportion per fold with abstention,Accuracy global with abstention,MCC global with abstention,Unknown/abstention proportion global with abstention,Abstention label global with abstention,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes,ROC-AUC (weighted OvO) per fold with abstention,ROC-AUC (macro OvO) per fold with abstention,au-PRC (weighted OvO) per fold with abstention,au-PRC (macro OvO) per fold with abstention
elasticnet_cv,0.863 +/- 0.029 (in 3 folds),0.863 +/- 0.029 (in 3 folds),0.739 +/- 0.118 (in 3 folds),0.739 +/- 0.118 (in 3 folds),0.747 +/- 0.046 (in 3 folds),0.389 +/- 0.152 (in 3 folds),0.747,0.387,0.541 +/- 0.136 (in 3 folds),0.206 +/- 0.136 (in 3 folds),0.275 +/- 0.183 (in 3 folds),0.544,0.206,0.272,Unknown,158.0,59.0,217.0,0.271889,False,,,,
linearsvm_ovr,0.863 +/- 0.016 (in 3 folds),0.863 +/- 0.016 (in 3 folds),0.780 +/- 0.027 (in 3 folds),0.780 +/- 0.027 (in 3 folds),0.821 +/- 0.060 (in 3 folds),0.581 +/- 0.141 (in 3 folds),0.821,0.576,0.802 +/- 0.035 (in 3 folds),0.547 +/- 0.098 (in 3 folds),0.034 +/- 0.028 (in 2 folds),0.802,0.545,0.023,Unknown,212.0,5.0,217.0,0.023041,False,0.853 +/- 0.000 (in 1 folds),0.853 +/- 0.000 (in 1 folds),0.787 +/- 0.000 (in 1 folds),0.787 +/- 0.000 (in 1 folds)
lasso_cv,0.862 +/- 0.035 (in 3 folds),0.862 +/- 0.035 (in 3 folds),0.766 +/- 0.075 (in 3 folds),0.766 +/- 0.075 (in 3 folds),0.764 +/- 0.031 (in 3 folds),0.436 +/- 0.111 (in 3 folds),0.762,0.424,0.650 +/- 0.043 (in 3 folds),0.259 +/- 0.090 (in 3 folds),0.147 +/- 0.087 (in 3 folds),0.65,0.271,0.147,Unknown,185.0,32.0,217.0,0.147465,False,,,,
lasso_multiclass,0.859 +/- 0.022 (in 3 folds),0.859 +/- 0.022 (in 3 folds),0.771 +/- 0.036 (in 3 folds),0.771 +/- 0.036 (in 3 folds),0.821 +/- 0.060 (in 3 folds),0.581 +/- 0.141 (in 3 folds),0.821,0.576,0.802 +/- 0.035 (in 3 folds),0.547 +/- 0.098 (in 3 folds),0.034 +/- 0.028 (in 2 folds),0.802,0.545,0.023,Unknown,212.0,5.0,217.0,0.023041,False,0.849 +/- 0.000 (in 1 folds),0.849 +/- 0.000 (in 1 folds),0.773 +/- 0.000 (in 1 folds),0.773 +/- 0.000 (in 1 folds)
rf_multiclass,0.829 +/- 0.034 (in 3 folds),0.829 +/- 0.034 (in 3 folds),0.759 +/- 0.071 (in 3 folds),0.759 +/- 0.071 (in 3 folds),0.808 +/- 0.059 (in 3 folds),0.557 +/- 0.143 (in 3 folds),0.809,0.549,0.723 +/- 0.112 (in 3 folds),0.452 +/- 0.128 (in 3 folds),0.105 +/- 0.124 (in 3 folds),0.724,0.436,0.106,Unknown,194.0,23.0,217.0,0.105991,False,,,,
xgboost,0.818 +/- 0.037 (in 3 folds),0.818 +/- 0.037 (in 3 folds),0.735 +/- 0.103 (in 3 folds),0.735 +/- 0.103 (in 3 folds),0.828 +/- 0.038 (in 3 folds),0.604 +/- 0.080 (in 3 folds),0.831,0.602,0.723 +/- 0.112 (in 3 folds),0.469 +/- 0.120 (in 3 folds),0.129 +/- 0.103 (in 3 folds),0.724,0.453,0.129,Unknown,189.0,28.0,217.0,0.129032,False,,,,
ridge_cv,0.746 +/- 0.219 (in 3 folds),0.746 +/- 0.219 (in 3 folds),0.538 +/- 0.244 (in 3 folds),0.538 +/- 0.244 (in 3 folds),0.709 +/- 0.019 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.707,0.0,0.323 +/- 0.057 (in 3 folds),0.016 +/- 0.037 (in 3 folds),0.543 +/- 0.090 (in 3 folds),0.323,0.02,0.544,Unknown,99.0,118.0,217.0,0.543779,True,,,,
dummy_stratified,0.541 +/- 0.093 (in 3 folds),0.541 +/- 0.093 (in 3 folds),0.348 +/- 0.045 (in 3 folds),0.348 +/- 0.045 (in 3 folds),0.550 +/- 0.075 (in 3 folds),0.072 +/- 0.167 (in 3 folds),0.536,0.046,0.272 +/- 0.046 (in 3 folds),0.019 +/- 0.060 (in 3 folds),0.493 +/- 0.141 (in 3 folds),0.272,0.019,0.493,Unknown,110.0,107.0,217.0,0.493088,False,,,,
dummy_most_frequent,0.500 +/- 0.000 (in 3 folds),0.500 +/- 0.000 (in 3 folds),0.291 +/- 0.019 (in 3 folds),0.291 +/- 0.019 (in 3 folds),0.709 +/- 0.019 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.707,0.0,0.323 +/- 0.057 (in 3 folds),0.016 +/- 0.037 (in 3 folds),0.543 +/- 0.090 (in 3 folds),0.323,0.02,0.544,Unknown,99.0,118.0,217.0,0.543779,True,,,,
"All results, sorted",,,,,,,,,,,,,,,,,,,,,,,,

Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,Accuracy per fold with abstention,MCC per fold with abstention,Unknown/abstention proportion per fold with abstention,Accuracy global with abstention,MCC global with abstention,Unknown/abstention proportion global with abstention,Abstention label global with abstention,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes,ROC-AUC (weighted OvO) per fold with abstention,ROC-AUC (macro OvO) per fold with abstention,au-PRC (weighted OvO) per fold with abstention,au-PRC (macro OvO) per fold with abstention
elasticnet_cv,0.863 +/- 0.029 (in 3 folds),0.863 +/- 0.029 (in 3 folds),0.739 +/- 0.118 (in 3 folds),0.739 +/- 0.118 (in 3 folds),0.747 +/- 0.046 (in 3 folds),0.389 +/- 0.152 (in 3 folds),0.747,0.387,0.541 +/- 0.136 (in 3 folds),0.206 +/- 0.136 (in 3 folds),0.275 +/- 0.183 (in 3 folds),0.544,0.206,0.272,Unknown,158,59,217,0.271889,False,,,,
linearsvm_ovr,0.863 +/- 0.016 (in 3 folds),0.863 +/- 0.016 (in 3 folds),0.780 +/- 0.027 (in 3 folds),0.780 +/- 0.027 (in 3 folds),0.821 +/- 0.060 (in 3 folds),0.581 +/- 0.141 (in 3 folds),0.821,0.576,0.802 +/- 0.035 (in 3 folds),0.547 +/- 0.098 (in 3 folds),0.034 +/- 0.028 (in 2 folds),0.802,0.545,0.023,Unknown,212,5,217,0.023041,False,0.853 +/- 0.000 (in 1 folds),0.853 +/- 0.000 (in 1 folds),0.787 +/- 0.000 (in 1 folds),0.787 +/- 0.000 (in 1 folds)
lasso_cv,0.862 +/- 0.035 (in 3 folds),0.862 +/- 0.035 (in 3 folds),0.766 +/- 0.075 (in 3 folds),0.766 +/- 0.075 (in 3 folds),0.764 +/- 0.031 (in 3 folds),0.436 +/- 0.111 (in 3 folds),0.762,0.424,0.650 +/- 0.043 (in 3 folds),0.259 +/- 0.090 (in 3 folds),0.147 +/- 0.087 (in 3 folds),0.65,0.271,0.147,Unknown,185,32,217,0.147465,False,,,,
lasso_multiclass,0.859 +/- 0.022 (in 3 folds),0.859 +/- 0.022 (in 3 folds),0.771 +/- 0.036 (in 3 folds),0.771 +/- 0.036 (in 3 folds),0.821 +/- 0.060 (in 3 folds),0.581 +/- 0.141 (in 3 folds),0.821,0.576,0.802 +/- 0.035 (in 3 folds),0.547 +/- 0.098 (in 3 folds),0.034 +/- 0.028 (in 2 folds),0.802,0.545,0.023,Unknown,212,5,217,0.023041,False,0.849 +/- 0.000 (in 1 folds),0.849 +/- 0.000 (in 1 folds),0.773 +/- 0.000 (in 1 folds),0.773 +/- 0.000 (in 1 folds)
rf_multiclass,0.829 +/- 0.034 (in 3 folds),0.829 +/- 0.034 (in 3 folds),0.759 +/- 0.071 (in 3 folds),0.759 +/- 0.071 (in 3 folds),0.808 +/- 0.059 (in 3 folds),0.557 +/- 0.143 (in 3 folds),0.809,0.549,0.723 +/- 0.112 (in 3 folds),0.452 +/- 0.128 (in 3 folds),0.105 +/- 0.124 (in 3 folds),0.724,0.436,0.106,Unknown,194,23,217,0.105991,False,,,,
xgboost,0.818 +/- 0.037 (in 3 folds),0.818 +/- 0.037 (in 3 folds),0.735 +/- 0.103 (in 3 folds),0.735 +/- 0.103 (in 3 folds),0.828 +/- 0.038 (in 3 folds),0.604 +/- 0.080 (in 3 folds),0.831,0.602,0.723 +/- 0.112 (in 3 folds),0.469 +/- 0.120 (in 3 folds),0.129 +/- 0.103 (in 3 folds),0.724,0.453,0.129,Unknown,189,28,217,0.129032,False,,,,
ridge_cv,0.746 +/- 0.219 (in 3 folds),0.746 +/- 0.219 (in 3 folds),0.538 +/- 0.244 (in 3 folds),0.538 +/- 0.244 (in 3 folds),0.709 +/- 0.019 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.707,0.0,0.323 +/- 0.057 (in 3 folds),0.016 +/- 0.037 (in 3 folds),0.543 +/- 0.090 (in 3 folds),0.323,0.02,0.544,Unknown,99,118,217,0.543779,True,,,,
dummy_stratified,0.541 +/- 0.093 (in 3 folds),0.541 +/- 0.093 (in 3 folds),0.348 +/- 0.045 (in 3 folds),0.348 +/- 0.045 (in 3 folds),0.550 +/- 0.075 (in 3 folds),0.072 +/- 0.167 (in 3 folds),0.536,0.046,0.272 +/- 0.046 (in 3 folds),0.019 +/- 0.060 (in 3 folds),0.493 +/- 0.141 (in 3 folds),0.272,0.019,0.493,Unknown,110,107,217,0.493088,False,,,,
dummy_most_frequent,0.500 +/- 0.000 (in 3 folds),0.500 +/- 0.000 (in 3 folds),0.291 +/- 0.019 (in 3 folds),0.291 +/- 0.019 (in 3 folds),0.709 +/- 0.019 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.707,0.0,0.323 +/- 0.057 (in 3 folds),0.016 +/- 0.037 (in 3 folds),0.543 +/- 0.090 (in 3 folds),0.323,0.02,0.544,Unknown,99,118,217,0.543779,True,,,,


elasticnet_cv,linearsvm_ovr,lasso_cv,lasso_multiclass
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.863 +/- 0.029 (in 3 folds) ROC-AUC (macro OvO): 0.863 +/- 0.029 (in 3 folds) au-PRC (weighted OvO): 0.739 +/- 0.118 (in 3 folds) au-PRC (macro OvO): 0.739 +/- 0.118 (in 3 folds) Accuracy: 0.747 +/- 0.046 (in 3 folds) MCC: 0.389 +/- 0.152 (in 3 folds) Global scores without abstention: Accuracy: 0.747 MCC: 0.387 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.541 +/- 0.136 (in 3 folds) MCC: 0.206 +/- 0.136 (in 3 folds) Unknown/abstention proportion: 0.275 +/- 0.183 (in 3 folds) Global scores with abstention: Accuracy: 0.544 MCC: 0.206 Unknown/abstention proportion: 0.272 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support Healthy/Background 0.77 0.64 0.70 149  Lupus 0.68 0.34 0.45 68  Unknown 0.00 0.00 0.00 0  accuracy 0.54 217  macro avg 0.48 0.33 0.38 217  weighted avg 0.74 0.54 0.62 217,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.863 +/- 0.016 (in 3 folds) ROC-AUC (macro OvO): 0.863 +/- 0.016 (in 3 folds) au-PRC (weighted OvO): 0.780 +/- 0.027 (in 3 folds) au-PRC (macro OvO): 0.780 +/- 0.027 (in 3 folds) Accuracy: 0.821 +/- 0.060 (in 3 folds) MCC: 0.581 +/- 0.141 (in 3 folds) Global scores without abstention: Accuracy: 0.821 MCC: 0.576 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.802 +/- 0.035 (in 3 folds) MCC: 0.547 +/- 0.098 (in 3 folds) Unknown/abstention proportion: 0.034 +/- 0.028 (in 2 folds) ROC-AUC (weighted OvO): 0.853 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.853 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.787 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.787 +/- 0.000 (in 1 folds) Global scores with abstention: Accuracy: 0.802 MCC: 0.545 Unknown/abstention proportion: 0.023 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support 
Healthy/Background 0.85 0.87 0.86 149  Lupus 0.74 0.66 0.70 68  Unknown 0.00 0.00 0.00 0  accuracy 0.80 217  macro avg 0.53 0.51 0.52 217  weighted avg 0.82 0.80 0.81 217,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.862 +/- 0.035 (in 3 folds) ROC-AUC (macro OvO): 0.862 +/- 0.035 (in 3 folds) au-PRC (weighted OvO): 0.766 +/- 0.075 (in 3 folds) au-PRC (macro OvO): 0.766 +/- 0.075 (in 3 folds) Accuracy: 0.764 +/- 0.031 (in 3 folds) MCC: 0.436 +/- 0.111 (in 3 folds) Global scores without abstention: Accuracy: 0.762 MCC: 0.424 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.650 +/- 0.043 (in 3 folds) MCC: 0.259 +/- 0.090 (in 3 folds) Unknown/abstention proportion: 0.147 +/- 0.087 (in 3 folds) Global scores with abstention: Accuracy: 0.650 MCC: 0.271 Unknown/abstention proportion: 0.147 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support Healthy/Background 0.76 0.78 0.77 149  Lupus 0.76 0.37 0.50 68  Unknown 0.00 0.00 0.00 0  accuracy 0.65 217  macro avg 0.51 0.38 0.42 217  weighted avg 0.76 0.65 0.68 217,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.859 +/- 0.022 (in 3 folds) ROC-AUC (macro OvO): 0.859 +/- 0.022 (in 3 folds) au-PRC (weighted OvO): 0.771 +/- 0.036 (in 3 folds) au-PRC (macro OvO): 0.771 +/- 0.036 (in 3 folds) Accuracy: 0.821 +/- 0.060 (in 3 folds) MCC: 0.581 +/- 0.141 (in 3 folds) Global scores without abstention: Accuracy: 0.821 MCC: 0.576 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.802 +/- 0.035 (in 3 folds) MCC: 0.547 +/- 0.098 (in 3 folds) Unknown/abstention proportion: 0.034 +/- 0.028 (in 2 folds) ROC-AUC (weighted OvO): 0.849 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.849 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.773 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.773 +/- 0.000 (in 1 folds) Global scores with abstention: Accuracy: 
0.802 MCC: 0.545 Unknown/abstention proportion: 0.023 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support Healthy/Background 0.85 0.87 0.86 149  Lupus 0.74 0.66 0.70 68  Unknown 0.00 0.00 0.00 0  accuracy 0.80 217  macro avg 0.53 0.51 0.52 217  weighted avg 0.82 0.80 0.81 217
,,,


rf_multiclass,xgboost,ridge_cv,dummy_stratified
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.829 +/- 0.034 (in 3 folds) ROC-AUC (macro OvO): 0.829 +/- 0.034 (in 3 folds) au-PRC (weighted OvO): 0.759 +/- 0.071 (in 3 folds) au-PRC (macro OvO): 0.759 +/- 0.071 (in 3 folds) Accuracy: 0.808 +/- 0.059 (in 3 folds) MCC: 0.557 +/- 0.143 (in 3 folds) Global scores without abstention: Accuracy: 0.809 MCC: 0.549 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.723 +/- 0.112 (in 3 folds) MCC: 0.452 +/- 0.128 (in 3 folds) Unknown/abstention proportion: 0.105 +/- 0.124 (in 3 folds) Global scores with abstention: Accuracy: 0.724 MCC: 0.436 Unknown/abstention proportion: 0.106 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support Healthy/Background 0.85 0.79 0.82 149  Lupus 0.71 0.59 0.65 68  Unknown 0.00 0.00 0.00 0  accuracy 0.72 217  macro avg 0.52 0.46 0.49 217  weighted avg 0.81 0.72 0.76 217,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.818 +/- 0.037 (in 3 folds) ROC-AUC (macro OvO): 0.818 +/- 0.037 (in 3 folds) au-PRC (weighted OvO): 0.735 +/- 0.103 (in 3 folds) au-PRC (macro OvO): 0.735 +/- 0.103 (in 3 folds) Accuracy: 0.828 +/- 0.038 (in 3 folds) MCC: 0.604 +/- 0.080 (in 3 folds) Global scores without abstention: Accuracy: 0.831 MCC: 0.602 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.723 +/- 0.112 (in 3 folds) MCC: 0.469 +/- 0.120 (in 3 folds) Unknown/abstention proportion: 0.129 +/- 0.103 (in 3 folds) Global scores with abstention: Accuracy: 0.724 MCC: 0.453 Unknown/abstention proportion: 0.129 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support Healthy/Background 0.85 0.78 0.81 149  Lupus 0.77 0.60 0.68 68  Unknown 0.00 0.00 0.00 0  accuracy 0.72 217  macro avg 0.54 0.46 0.50 217  weighted avg 0.83 0.72 0.77 217,Per-fold scores without abstention: ROC-AUC 
(weighted OvO): 0.746 +/- 0.219 (in 3 folds) ROC-AUC (macro OvO): 0.746 +/- 0.219 (in 3 folds) au-PRC (weighted OvO): 0.538 +/- 0.244 (in 3 folds) au-PRC (macro OvO): 0.538 +/- 0.244 (in 3 folds) Accuracy: 0.709 +/- 0.019 (in 3 folds) MCC: 0.000 +/- 0.000 (in 3 folds) Global scores without abstention: Accuracy: 0.707 MCC: 0.000 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.323 +/- 0.057 (in 3 folds) MCC: 0.016 +/- 0.037 (in 3 folds) Unknown/abstention proportion: 0.543 +/- 0.090 (in 3 folds) Global scores with abstention: Accuracy: 0.323 MCC: 0.020 Unknown/abstention proportion: 0.544 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support Healthy/Background 0.71 0.47 0.56 149  Lupus 0.00 0.00 0.00 68  Unknown 0.00 0.00 0.00 0  accuracy 0.32 217  macro avg 0.24 0.16 0.19 217  weighted avg 0.49 0.32 0.39 217,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.541 +/- 0.093 (in 3 folds) ROC-AUC (macro OvO): 0.541 +/- 0.093 (in 3 folds) au-PRC (weighted OvO): 0.348 +/- 0.045 (in 3 folds) au-PRC (macro OvO): 0.348 +/- 0.045 (in 3 folds) Accuracy: 0.550 +/- 0.075 (in 3 folds) MCC: 0.072 +/- 0.167 (in 3 folds) Global scores without abstention: Accuracy: 0.536 MCC: 0.046 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.272 +/- 0.046 (in 3 folds) MCC: 0.019 +/- 0.060 (in 3 folds) Unknown/abstention proportion: 0.493 +/- 0.141 (in 3 folds) Global scores with abstention: Accuracy: 0.272 MCC: 0.019 Unknown/abstention proportion: 0.493 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support Healthy/Background 0.68 0.28 0.39 149  Lupus 0.36 0.26 0.31 68  Unknown 0.00 0.00 0.00 0  accuracy 0.27 217  macro avg 0.35 0.18 0.23 217  weighted avg 0.58 0.27 0.37 217
,,,


dummy_most_frequent
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.500 +/- 0.000 (in 3 folds) ROC-AUC (macro OvO): 0.500 +/- 0.000 (in 3 folds) au-PRC (weighted OvO): 0.291 +/- 0.019 (in 3 folds) au-PRC (macro OvO): 0.291 +/- 0.019 (in 3 folds) Accuracy: 0.709 +/- 0.019 (in 3 folds) MCC: 0.000 +/- 0.000 (in 3 folds) Global scores without abstention: Accuracy: 0.707 MCC: 0.000 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.323 +/- 0.057 (in 3 folds) MCC: 0.016 +/- 0.037 (in 3 folds) Unknown/abstention proportion: 0.543 +/- 0.090 (in 3 folds) Global scores with abstention: Accuracy: 0.323 MCC: 0.020 Unknown/abstention proportion: 0.544 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support Healthy/Background 0.71 0.47 0.56 149  Lupus 0.00 0.00 0.00 68  Unknown 0.00 0.00 0.00 0  accuracy 0.32 217  macro avg 0.24 0.16 0.19 217  weighted avg 0.49 0.32 0.39 217


## Apply train-smaller model -- Test set performance - With and without tuning on validation set

Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,Global evaluation column name global,Accuracy per fold with abstention,MCC per fold with abstention,Unknown/abstention proportion per fold with abstention,ROC-AUC (weighted OvO) per fold with abstention,ROC-AUC (macro OvO) per fold with abstention,au-PRC (weighted OvO) per fold with abstention,au-PRC (macro OvO) per fold with abstention,Accuracy global with abstention,MCC global with abstention,Unknown/abstention proportion global with abstention,Abstention label global with abstention,Global evaluation column name global with abstention,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
elasticnet_cv,0.863 +/- 0.042 (in 3 folds),0.863 +/- 0.042 (in 3 folds),0.745 +/- 0.066 (in 3 folds),0.745 +/- 0.066 (in 3 folds),0.769 +/- 0.010 (in 3 folds),0.442 +/- 0.066 (in 3 folds),0.769,0.424,disease.separate_past_exposures,0.575 +/- 0.123 (in 3 folds),0.245 +/- 0.074 (in 3 folds),0.251 +/- 0.160 (in 3 folds),,,,,0.574,0.232,0.254,Unknown,disease.separate_past_exposures,238.0,81.0,319.0,0.253918,False
elasticnet_cv.decision_thresholds_tuned,0.863 +/- 0.042 (in 3 folds),0.863 +/- 0.042 (in 3 folds),0.745 +/- 0.066 (in 3 folds),0.745 +/- 0.066 (in 3 folds),0.804 +/- 0.046 (in 3 folds),0.563 +/- 0.089 (in 3 folds),0.807,0.549,disease.separate_past_exposures,0.604 +/- 0.142 (in 3 folds),0.355 +/- 0.050 (in 3 folds),0.251 +/- 0.160 (in 3 folds),,,,,0.602,0.338,0.254,Unknown,disease.separate_past_exposures,238.0,81.0,319.0,0.253918,False
lasso_cv,0.847 +/- 0.048 (in 3 folds),0.847 +/- 0.048 (in 3 folds),0.746 +/- 0.066 (in 3 folds),0.746 +/- 0.066 (in 3 folds),0.774 +/- 0.026 (in 3 folds),0.457 +/- 0.062 (in 3 folds),0.772,0.421,disease.separate_past_exposures,0.681 +/- 0.077 (in 3 folds),0.325 +/- 0.005 (in 3 folds),0.119 +/- 0.113 (in 3 folds),,,,,0.68,0.292,0.119,Unknown,disease.separate_past_exposures,281.0,38.0,319.0,0.119122,False
lasso_cv.decision_thresholds_tuned,0.847 +/- 0.048 (in 3 folds),0.847 +/- 0.048 (in 3 folds),0.746 +/- 0.066 (in 3 folds),0.746 +/- 0.066 (in 3 folds),0.811 +/- 0.038 (in 3 folds),0.536 +/- 0.099 (in 3 folds),0.808,0.53,disease.separate_past_exposures,0.712 +/- 0.060 (in 3 folds),0.409 +/- 0.044 (in 3 folds),0.119 +/- 0.113 (in 3 folds),,,,,0.712,0.401,0.119,Unknown,disease.separate_past_exposures,281.0,38.0,319.0,0.119122,False
linearsvm_ovr,0.837 +/- 0.002 (in 3 folds),0.837 +/- 0.002 (in 3 folds),0.727 +/- 0.019 (in 3 folds),0.727 +/- 0.019 (in 3 folds),0.776 +/- 0.023 (in 3 folds),0.457 +/- 0.058 (in 3 folds),0.776,0.455,disease.separate_past_exposures,0.758 +/- 0.017 (in 3 folds),0.436 +/- 0.044 (in 3 folds),0.034 +/- 0.021 (in 2 folds),0.836 +/- 0.000 (in 1 folds),0.836 +/- 0.000 (in 1 folds),0.734 +/- 0.000 (in 1 folds),0.734 +/- 0.000 (in 1 folds),0.759,0.435,0.022,Unknown,disease.separate_past_exposures,312.0,7.0,319.0,0.021944,False
linearsvm_ovr.decision_thresholds_tuned,0.837 +/- 0.002 (in 3 folds),0.837 +/- 0.002 (in 3 folds),0.727 +/- 0.019 (in 3 folds),0.727 +/- 0.019 (in 3 folds),0.776 +/- 0.023 (in 3 folds),0.449 +/- 0.050 (in 3 folds),0.776,0.444,disease.separate_past_exposures,0.758 +/- 0.017 (in 3 folds),0.427 +/- 0.032 (in 3 folds),0.034 +/- 0.021 (in 2 folds),0.836 +/- 0.000 (in 1 folds),0.836 +/- 0.000 (in 1 folds),0.734 +/- 0.000 (in 1 folds),0.734 +/- 0.000 (in 1 folds),0.759,0.424,0.022,Unknown,disease.separate_past_exposures,312.0,7.0,319.0,0.021944,False
lasso_multiclass,0.832 +/- 0.008 (in 3 folds),0.832 +/- 0.008 (in 3 folds),0.715 +/- 0.009 (in 3 folds),0.715 +/- 0.009 (in 3 folds),0.776 +/- 0.015 (in 3 folds),0.457 +/- 0.034 (in 3 folds),0.776,0.455,disease.separate_past_exposures,0.758 +/- 0.010 (in 3 folds),0.436 +/- 0.018 (in 3 folds),0.034 +/- 0.021 (in 2 folds),0.828 +/- 0.000 (in 1 folds),0.828 +/- 0.000 (in 1 folds),0.711 +/- 0.000 (in 1 folds),0.711 +/- 0.000 (in 1 folds),0.759,0.435,0.022,Unknown,disease.separate_past_exposures,312.0,7.0,319.0,0.021944,False
lasso_multiclass.decision_thresholds_tuned,0.832 +/- 0.008 (in 3 folds),0.832 +/- 0.008 (in 3 folds),0.715 +/- 0.009 (in 3 folds),0.715 +/- 0.009 (in 3 folds),0.741 +/- 0.070 (in 3 folds),0.461 +/- 0.017 (in 3 folds),0.74,0.429,disease.separate_past_exposures,0.724 +/- 0.068 (in 3 folds),0.440 +/- 0.012 (in 3 folds),0.034 +/- 0.021 (in 2 folds),0.828 +/- 0.000 (in 1 folds),0.828 +/- 0.000 (in 1 folds),0.711 +/- 0.000 (in 1 folds),0.711 +/- 0.000 (in 1 folds),0.724,0.411,0.022,Unknown,disease.separate_past_exposures,312.0,7.0,319.0,0.021944,False
xgboost,0.825 +/- 0.057 (in 3 folds),0.825 +/- 0.057 (in 3 folds),0.721 +/- 0.078 (in 3 folds),0.721 +/- 0.078 (in 3 folds),0.764 +/- 0.018 (in 3 folds),0.437 +/- 0.059 (in 3 folds),0.762,0.435,disease.separate_past_exposures,0.684 +/- 0.079 (in 3 folds),0.359 +/- 0.034 (in 3 folds),0.103 +/- 0.121 (in 3 folds),,,,,0.683,0.348,0.103,Unknown,disease.separate_past_exposures,286.0,33.0,319.0,0.103448,False
xgboost.decision_thresholds_tuned,0.825 +/- 0.057 (in 3 folds),0.825 +/- 0.057 (in 3 folds),0.721 +/- 0.078 (in 3 folds),0.721 +/- 0.078 (in 3 folds),0.788 +/- 0.058 (in 3 folds),0.486 +/- 0.143 (in 3 folds),0.783,0.474,disease.separate_past_exposures,0.703 +/- 0.047 (in 3 folds),0.381 +/- 0.016 (in 3 folds),0.103 +/- 0.121 (in 3 folds),,,,,0.702,0.375,0.103,Unknown,disease.separate_past_exposures,286.0,33.0,319.0,0.103448,False

Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,Global evaluation column name global,Accuracy per fold with abstention,MCC per fold with abstention,Unknown/abstention proportion per fold with abstention,ROC-AUC (weighted OvO) per fold with abstention,ROC-AUC (macro OvO) per fold with abstention,au-PRC (weighted OvO) per fold with abstention,au-PRC (macro OvO) per fold with abstention,Accuracy global with abstention,MCC global with abstention,Unknown/abstention proportion global with abstention,Abstention label global with abstention,Global evaluation column name global with abstention,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
elasticnet_cv,0.863 +/- 0.042 (in 3 folds),0.863 +/- 0.042 (in 3 folds),0.745 +/- 0.066 (in 3 folds),0.745 +/- 0.066 (in 3 folds),0.769 +/- 0.010 (in 3 folds),0.442 +/- 0.066 (in 3 folds),0.769,0.424,disease.separate_past_exposures,0.575 +/- 0.123 (in 3 folds),0.245 +/- 0.074 (in 3 folds),0.251 +/- 0.160 (in 3 folds),,,,,0.574,0.232,0.254,Unknown,disease.separate_past_exposures,238,81,319,0.253918,False
elasticnet_cv.decision_thresholds_tuned,0.863 +/- 0.042 (in 3 folds),0.863 +/- 0.042 (in 3 folds),0.745 +/- 0.066 (in 3 folds),0.745 +/- 0.066 (in 3 folds),0.804 +/- 0.046 (in 3 folds),0.563 +/- 0.089 (in 3 folds),0.807,0.549,disease.separate_past_exposures,0.604 +/- 0.142 (in 3 folds),0.355 +/- 0.050 (in 3 folds),0.251 +/- 0.160 (in 3 folds),,,,,0.602,0.338,0.254,Unknown,disease.separate_past_exposures,238,81,319,0.253918,False
lasso_cv,0.847 +/- 0.048 (in 3 folds),0.847 +/- 0.048 (in 3 folds),0.746 +/- 0.066 (in 3 folds),0.746 +/- 0.066 (in 3 folds),0.774 +/- 0.026 (in 3 folds),0.457 +/- 0.062 (in 3 folds),0.772,0.421,disease.separate_past_exposures,0.681 +/- 0.077 (in 3 folds),0.325 +/- 0.005 (in 3 folds),0.119 +/- 0.113 (in 3 folds),,,,,0.68,0.292,0.119,Unknown,disease.separate_past_exposures,281,38,319,0.119122,False
lasso_cv.decision_thresholds_tuned,0.847 +/- 0.048 (in 3 folds),0.847 +/- 0.048 (in 3 folds),0.746 +/- 0.066 (in 3 folds),0.746 +/- 0.066 (in 3 folds),0.811 +/- 0.038 (in 3 folds),0.536 +/- 0.099 (in 3 folds),0.808,0.53,disease.separate_past_exposures,0.712 +/- 0.060 (in 3 folds),0.409 +/- 0.044 (in 3 folds),0.119 +/- 0.113 (in 3 folds),,,,,0.712,0.401,0.119,Unknown,disease.separate_past_exposures,281,38,319,0.119122,False
linearsvm_ovr,0.837 +/- 0.002 (in 3 folds),0.837 +/- 0.002 (in 3 folds),0.727 +/- 0.019 (in 3 folds),0.727 +/- 0.019 (in 3 folds),0.776 +/- 0.023 (in 3 folds),0.457 +/- 0.058 (in 3 folds),0.776,0.455,disease.separate_past_exposures,0.758 +/- 0.017 (in 3 folds),0.436 +/- 0.044 (in 3 folds),0.034 +/- 0.021 (in 2 folds),0.836 +/- 0.000 (in 1 folds),0.836 +/- 0.000 (in 1 folds),0.734 +/- 0.000 (in 1 folds),0.734 +/- 0.000 (in 1 folds),0.759,0.435,0.022,Unknown,disease.separate_past_exposures,312,7,319,0.021944,False
linearsvm_ovr.decision_thresholds_tuned,0.837 +/- 0.002 (in 3 folds),0.837 +/- 0.002 (in 3 folds),0.727 +/- 0.019 (in 3 folds),0.727 +/- 0.019 (in 3 folds),0.776 +/- 0.023 (in 3 folds),0.449 +/- 0.050 (in 3 folds),0.776,0.444,disease.separate_past_exposures,0.758 +/- 0.017 (in 3 folds),0.427 +/- 0.032 (in 3 folds),0.034 +/- 0.021 (in 2 folds),0.836 +/- 0.000 (in 1 folds),0.836 +/- 0.000 (in 1 folds),0.734 +/- 0.000 (in 1 folds),0.734 +/- 0.000 (in 1 folds),0.759,0.424,0.022,Unknown,disease.separate_past_exposures,312,7,319,0.021944,False
lasso_multiclass,0.832 +/- 0.008 (in 3 folds),0.832 +/- 0.008 (in 3 folds),0.715 +/- 0.009 (in 3 folds),0.715 +/- 0.009 (in 3 folds),0.776 +/- 0.015 (in 3 folds),0.457 +/- 0.034 (in 3 folds),0.776,0.455,disease.separate_past_exposures,0.758 +/- 0.010 (in 3 folds),0.436 +/- 0.018 (in 3 folds),0.034 +/- 0.021 (in 2 folds),0.828 +/- 0.000 (in 1 folds),0.828 +/- 0.000 (in 1 folds),0.711 +/- 0.000 (in 1 folds),0.711 +/- 0.000 (in 1 folds),0.759,0.435,0.022,Unknown,disease.separate_past_exposures,312,7,319,0.021944,False
lasso_multiclass.decision_thresholds_tuned,0.832 +/- 0.008 (in 3 folds),0.832 +/- 0.008 (in 3 folds),0.715 +/- 0.009 (in 3 folds),0.715 +/- 0.009 (in 3 folds),0.741 +/- 0.070 (in 3 folds),0.461 +/- 0.017 (in 3 folds),0.74,0.429,disease.separate_past_exposures,0.724 +/- 0.068 (in 3 folds),0.440 +/- 0.012 (in 3 folds),0.034 +/- 0.021 (in 2 folds),0.828 +/- 0.000 (in 1 folds),0.828 +/- 0.000 (in 1 folds),0.711 +/- 0.000 (in 1 folds),0.711 +/- 0.000 (in 1 folds),0.724,0.411,0.022,Unknown,disease.separate_past_exposures,312,7,319,0.021944,False
xgboost,0.825 +/- 0.057 (in 3 folds),0.825 +/- 0.057 (in 3 folds),0.721 +/- 0.078 (in 3 folds),0.721 +/- 0.078 (in 3 folds),0.764 +/- 0.018 (in 3 folds),0.437 +/- 0.059 (in 3 folds),0.762,0.435,disease.separate_past_exposures,0.684 +/- 0.079 (in 3 folds),0.359 +/- 0.034 (in 3 folds),0.103 +/- 0.121 (in 3 folds),,,,,0.683,0.348,0.103,Unknown,disease.separate_past_exposures,286,33,319,0.103448,False
xgboost.decision_thresholds_tuned,0.825 +/- 0.057 (in 3 folds),0.825 +/- 0.057 (in 3 folds),0.721 +/- 0.078 (in 3 folds),0.721 +/- 0.078 (in 3 folds),0.788 +/- 0.058 (in 3 folds),0.486 +/- 0.143 (in 3 folds),0.783,0.474,disease.separate_past_exposures,0.703 +/- 0.047 (in 3 folds),0.381 +/- 0.016 (in 3 folds),0.103 +/- 0.121 (in 3 folds),,,,,0.702,0.375,0.103,Unknown,disease.separate_past_exposures,286,33,319,0.103448,False


elasticnet_cv,elasticnet_cv.decision_thresholds_tuned,lasso_cv,lasso_cv.decision_thresholds_tuned
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.863 +/- 0.042 (in 3 folds) ROC-AUC (macro OvO): 0.863 +/- 0.042 (in 3 folds) au-PRC (weighted OvO): 0.745 +/- 0.066 (in 3 folds) au-PRC (macro OvO): 0.745 +/- 0.066 (in 3 folds) Accuracy: 0.769 +/- 0.010 (in 3 folds) MCC: 0.442 +/- 0.066 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.769 MCC: 0.424 Global evaluation column name: disease.separate_past_exposures Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.575 +/- 0.123 (in 3 folds) MCC: 0.245 +/- 0.074 (in 3 folds) Unknown/abstention proportion: 0.251 +/- 0.160 (in 3 folds) Global scores with abstention using column name disease.separate_past_exposures: Accuracy: 0.574 MCC: 0.232 Unknown/abstention proportion: 0.254 Abstention label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support Healthy/Background 0.78 0.68 0.73 221  Lupus 0.72 0.34 0.46 98  Unknown 0.00 0.00 0.00 0  accuracy 0.57 319  macro avg 0.50 0.34 0.39 319  weighted avg 0.76 0.57 0.64 319,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.863 +/- 0.042 (in 3 folds) ROC-AUC (macro OvO): 0.863 +/- 0.042 (in 3 folds) au-PRC (weighted OvO): 0.745 +/- 0.066 (in 3 folds) au-PRC (macro OvO): 0.745 +/- 0.066 (in 3 folds) Accuracy: 0.804 +/- 0.046 (in 3 folds) MCC: 0.563 +/- 0.089 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.807 MCC: 0.549 Global evaluation column name: disease.separate_past_exposures Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.604 +/- 0.142 (in 3 folds) MCC: 0.355 +/- 0.050 (in 3 folds) Unknown/abstention proportion: 0.251 +/- 0.160 (in 3 folds) Global scores with 
abstention using column name disease.separate_past_exposures: Accuracy: 0.602 MCC: 0.338 Unknown/abstention proportion: 0.254 Abstention label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support Healthy/Background 0.85 0.64 0.73 221  Lupus 0.70 0.52 0.60 98  Unknown 0.00 0.00 0.00 0  accuracy 0.60 319  macro avg 0.52 0.39 0.44 319  weighted avg 0.81 0.60 0.69 319,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.847 +/- 0.048 (in 3 folds) ROC-AUC (macro OvO): 0.847 +/- 0.048 (in 3 folds) au-PRC (weighted OvO): 0.746 +/- 0.066 (in 3 folds) au-PRC (macro OvO): 0.746 +/- 0.066 (in 3 folds) Accuracy: 0.774 +/- 0.026 (in 3 folds) MCC: 0.457 +/- 0.062 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.772 MCC: 0.421 Global evaluation column name: disease.separate_past_exposures Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.681 +/- 0.077 (in 3 folds) MCC: 0.325 +/- 0.005 (in 3 folds) Unknown/abstention proportion: 0.119 +/- 0.113 (in 3 folds) Global scores with abstention using column name disease.separate_past_exposures: Accuracy: 0.680 MCC: 0.292 Unknown/abstention proportion: 0.119 Abstention label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support Healthy/Background 0.77 0.83 0.80 221  Lupus 0.77 0.34 0.47 98  Unknown 0.00 0.00 0.00 0  accuracy 0.68 319  macro avg 0.51 0.39 0.42 319  weighted avg 0.77 0.68 0.70 319,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.847 +/- 0.048 (in 3 folds) ROC-AUC (macro OvO): 0.847 +/- 0.048 (in 3 folds) au-PRC (weighted OvO): 0.746 +/- 0.066 (in 3 folds) au-PRC (macro OvO): 0.746 +/- 0.066 
(in 3 folds) Accuracy: 0.811 +/- 0.038 (in 3 folds) MCC: 0.536 +/- 0.099 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.808 MCC: 0.530 Global evaluation column name: disease.separate_past_exposures Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.712 +/- 0.060 (in 3 folds) MCC: 0.409 +/- 0.044 (in 3 folds) Unknown/abstention proportion: 0.119 +/- 0.113 (in 3 folds) Global scores with abstention using column name disease.separate_past_exposures: Accuracy: 0.712 MCC: 0.401 Unknown/abstention proportion: 0.119 Abstention label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support Healthy/Background 0.83 0.80 0.81 221  Lupus 0.74 0.52 0.61 98  Unknown 0.00 0.00 0.00 0  accuracy 0.71 319  macro avg 0.52 0.44 0.47 319  weighted avg 0.80 0.71 0.75 319
,,,


linearsvm_ovr,linearsvm_ovr.decision_thresholds_tuned,lasso_multiclass,lasso_multiclass.decision_thresholds_tuned
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.837 +/- 0.002 (in 3 folds) ROC-AUC (macro OvO): 0.837 +/- 0.002 (in 3 folds) au-PRC (weighted OvO): 0.727 +/- 0.019 (in 3 folds) au-PRC (macro OvO): 0.727 +/- 0.019 (in 3 folds) Accuracy: 0.776 +/- 0.023 (in 3 folds) MCC: 0.457 +/- 0.058 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.776 MCC: 0.455 Global evaluation column name: disease.separate_past_exposures Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.758 +/- 0.017 (in 3 folds) MCC: 0.436 +/- 0.044 (in 3 folds) Unknown/abstention proportion: 0.034 +/- 0.021 (in 2 folds) ROC-AUC (weighted OvO): 0.836 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.836 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.734 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.734 +/- 0.000 (in 1 folds) Global scores with abstention using column name disease.separate_past_exposures: Accuracy: 0.759 MCC: 0.435 Unknown/abstention proportion: 0.022 Abstention label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support Healthy/Background 0.83 0.85 0.84 221  Lupus 0.64 0.56 0.60 98  Unknown 0.00 0.00 0.00 0  accuracy 0.76 319  macro avg 0.49 0.47 0.48 319  weighted avg 0.77 0.76 0.76 319,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.837 +/- 0.002 (in 3 folds) ROC-AUC (macro OvO): 0.837 +/- 0.002 (in 3 folds) au-PRC (weighted OvO): 0.727 +/- 0.019 (in 3 folds) au-PRC (macro OvO): 0.727 +/- 0.019 (in 3 folds) Accuracy: 0.776 +/- 0.023 (in 3 folds) MCC: 0.449 +/- 0.050 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.776 MCC: 0.444 Global evaluation column name: disease.separate_past_exposures Per-fold scores with abstention (note that abstentions 
not included in probability-based scores): Accuracy: 0.758 +/- 0.017 (in 3 folds) MCC: 0.427 +/- 0.032 (in 3 folds) Unknown/abstention proportion: 0.034 +/- 0.021 (in 2 folds) ROC-AUC (weighted OvO): 0.836 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.836 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.734 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.734 +/- 0.000 (in 1 folds) Global scores with abstention using column name disease.separate_past_exposures: Accuracy: 0.759 MCC: 0.424 Unknown/abstention proportion: 0.022 Abstention label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support Healthy/Background 0.82 0.86 0.84 221  Lupus 0.65 0.52 0.58 98  Unknown 0.00 0.00 0.00 0  accuracy 0.76 319  macro avg 0.49 0.46 0.47 319  weighted avg 0.77 0.76 0.76 319,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.832 +/- 0.008 (in 3 folds) ROC-AUC (macro OvO): 0.832 +/- 0.008 (in 3 folds) au-PRC (weighted OvO): 0.715 +/- 0.009 (in 3 folds) au-PRC (macro OvO): 0.715 +/- 0.009 (in 3 folds) Accuracy: 0.776 +/- 0.015 (in 3 folds) MCC: 0.457 +/- 0.034 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.776 MCC: 0.455 Global evaluation column name: disease.separate_past_exposures Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.758 +/- 0.010 (in 3 folds) MCC: 0.436 +/- 0.018 (in 3 folds) Unknown/abstention proportion: 0.034 +/- 0.021 (in 2 folds) ROC-AUC (weighted OvO): 0.828 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.828 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.711 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.711 +/- 0.000 (in 1 folds) Global scores with abstention using column name disease.separate_past_exposures: Accuracy: 0.759 MCC: 0.435 Unknown/abstention proportion: 0.022 Abstention 
label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support Healthy/Background 0.83 0.85 0.84 221  Lupus 0.64 0.56 0.60 98  Unknown 0.00 0.00 0.00 0  accuracy 0.76 319  macro avg 0.49 0.47 0.48 319  weighted avg 0.77 0.76 0.76 319,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.832 +/- 0.008 (in 3 folds) ROC-AUC (macro OvO): 0.832 +/- 0.008 (in 3 folds) au-PRC (weighted OvO): 0.715 +/- 0.009 (in 3 folds) au-PRC (macro OvO): 0.715 +/- 0.009 (in 3 folds) Accuracy: 0.741 +/- 0.070 (in 3 folds) MCC: 0.461 +/- 0.017 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.740 MCC: 0.429 Global evaluation column name: disease.separate_past_exposures Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.724 +/- 0.068 (in 3 folds) MCC: 0.440 +/- 0.012 (in 3 folds) Unknown/abstention proportion: 0.034 +/- 0.021 (in 2 folds) ROC-AUC (weighted OvO): 0.828 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.828 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.711 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.711 +/- 0.000 (in 1 folds) Global scores with abstention using column name disease.separate_past_exposures: Accuracy: 0.724 MCC: 0.411 Unknown/abstention proportion: 0.022 Abstention label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support Healthy/Background 0.85 0.75 0.80 221  Lupus 0.56 0.66 0.60 98  Unknown 0.00 0.00 0.00 0  accuracy 0.72 319  macro avg 0.47 0.47 0.47 319  weighted avg 0.76 0.72 0.74 319
,,,


xgboost,xgboost.decision_thresholds_tuned,rf_multiclass,rf_multiclass.decision_thresholds_tuned
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.825 +/- 0.057 (in 3 folds) ROC-AUC (macro OvO): 0.825 +/- 0.057 (in 3 folds) au-PRC (weighted OvO): 0.721 +/- 0.078 (in 3 folds) au-PRC (macro OvO): 0.721 +/- 0.078 (in 3 folds) Accuracy: 0.764 +/- 0.018 (in 3 folds) MCC: 0.437 +/- 0.059 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.762 MCC: 0.435 Global evaluation column name: disease.separate_past_exposures Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.684 +/- 0.079 (in 3 folds) MCC: 0.359 +/- 0.034 (in 3 folds) Unknown/abstention proportion: 0.103 +/- 0.121 (in 3 folds) Global scores with abstention using column name disease.separate_past_exposures: Accuracy: 0.683 MCC: 0.348 Unknown/abstention proportion: 0.103 Abstention label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support Healthy/Background 0.82 0.75 0.78 221  Lupus 0.62 0.53 0.57 98  Unknown 0.00 0.00 0.00 0  accuracy 0.68 319  macro avg 0.48 0.43 0.45 319  weighted avg 0.76 0.68 0.72 319,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.825 +/- 0.057 (in 3 folds) ROC-AUC (macro OvO): 0.825 +/- 0.057 (in 3 folds) au-PRC (weighted OvO): 0.721 +/- 0.078 (in 3 folds) au-PRC (macro OvO): 0.721 +/- 0.078 (in 3 folds) Accuracy: 0.788 +/- 0.058 (in 3 folds) MCC: 0.486 +/- 0.143 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.783 MCC: 0.474 Global evaluation column name: disease.separate_past_exposures Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.703 +/- 0.047 (in 3 folds) MCC: 0.381 +/- 0.016 (in 3 folds) Unknown/abstention proportion: 0.103 +/- 0.121 (in 3 folds) Global scores with 
abstention using column name disease.separate_past_exposures: Accuracy: 0.702 MCC: 0.375 Unknown/abstention proportion: 0.103 Abstention label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support Healthy/Background 0.82 0.78 0.80 221  Lupus 0.67 0.52 0.59 98  Unknown 0.00 0.00 0.00 0  accuracy 0.70 319  macro avg 0.50 0.43 0.46 319  weighted avg 0.78 0.70 0.74 319,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.812 +/- 0.074 (in 3 folds) ROC-AUC (macro OvO): 0.812 +/- 0.074 (in 3 folds) au-PRC (weighted OvO): 0.674 +/- 0.113 (in 3 folds) au-PRC (macro OvO): 0.674 +/- 0.113 (in 3 folds) Accuracy: 0.759 +/- 0.025 (in 3 folds) MCC: 0.415 +/- 0.081 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.757 MCC: 0.410 Global evaluation column name: disease.separate_past_exposures Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.684 +/- 0.079 (in 3 folds) MCC: 0.343 +/- 0.020 (in 3 folds) Unknown/abstention proportion: 0.145 +/- 0.136 (in 2 folds) ROC-AUC (weighted OvO): 0.771 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.771 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.591 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.591 +/- 0.000 (in 1 folds) Global scores with abstention using column name disease.separate_past_exposures: Accuracy: 0.683 MCC: 0.331 Unknown/abstention proportion: 0.097 Abstention label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support Healthy/Background 0.81 0.77 0.79 221  Lupus 0.62 0.49 0.55 98  Unknown 0.00 0.00 0.00 0  accuracy 0.68 319  macro avg 0.47 0.42 0.44 319  weighted avg 0.75 0.68 0.71 319,Per-fold scores without 
abstention: ROC-AUC (weighted OvO): 0.812 +/- 0.074 (in 3 folds) ROC-AUC (macro OvO): 0.812 +/- 0.074 (in 3 folds) au-PRC (weighted OvO): 0.674 +/- 0.113 (in 3 folds) au-PRC (macro OvO): 0.674 +/- 0.113 (in 3 folds) Accuracy: 0.763 +/- 0.067 (in 3 folds) MCC: 0.376 +/- 0.224 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.757 MCC: 0.367 Global evaluation column name: disease.separate_past_exposures Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.684 +/- 0.050 (in 3 folds) MCC: 0.282 +/- 0.121 (in 3 folds) Unknown/abstention proportion: 0.145 +/- 0.136 (in 2 folds) ROC-AUC (weighted OvO): 0.771 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.771 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.591 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.591 +/- 0.000 (in 1 folds) Global scores with abstention using column name disease.separate_past_exposures: Accuracy: 0.683 MCC: 0.271 Unknown/abstention proportion: 0.097 Abstention label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support Healthy/Background 0.76 0.85 0.81 221  Lupus 0.71 0.31 0.43 98  Unknown 0.00 0.00 0.00 0  accuracy 0.68 319  macro avg 0.49 0.39 0.41 319  weighted avg 0.75 0.68 0.69 319
,,,


ridge_cv,ridge_cv.decision_thresholds_tuned
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.753 +/- 0.225 (in 3 folds) ROC-AUC (macro OvO): 0.753 +/- 0.225 (in 3 folds) au-PRC (weighted OvO): 0.591 +/- 0.281 (in 3 folds) au-PRC (macro OvO): 0.591 +/- 0.281 (in 3 folds) Accuracy: 0.696 +/- 0.041 (in 3 folds) MCC: 0.000 +/- 0.000 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.692 MCC: 0.000 Global evaluation column name: disease.separate_past_exposures Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.345 +/- 0.030 (in 3 folds) MCC: -0.000 +/- 0.040 (in 3 folds) Unknown/abstention proportion: 0.502 +/- 0.075 (in 3 folds) Global scores with abstention using column name disease.separate_past_exposures: Accuracy: 0.345 MCC: -0.001 Unknown/abstention proportion: 0.502 Abstention label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support Healthy/Background 0.69 0.50 0.58 221  Lupus 0.00 0.00 0.00 98  Unknown 0.00 0.00 0.00 0  accuracy 0.34 319  macro avg 0.23 0.17 0.19 319  weighted avg 0.48 0.34 0.40 319,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.753 +/- 0.225 (in 3 folds) ROC-AUC (macro OvO): 0.753 +/- 0.225 (in 3 folds) au-PRC (weighted OvO): 0.591 +/- 0.281 (in 3 folds) au-PRC (macro OvO): 0.591 +/- 0.281 (in 3 folds) Accuracy: 0.557 +/- 0.233 (in 3 folds) MCC: 0.000 +/- 0.000 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.566 MCC: -0.024 Global evaluation column name: disease.separate_past_exposures Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.280 +/- 0.128 (in 3 folds) MCC: -0.007 +/- 0.039 (in 3 folds) Unknown/abstention proportion: 0.502 +/- 0.075 (in 3 folds) Global scores with 
abstention using column name disease.separate_past_exposures: Accuracy: 0.282 MCC: -0.010 Unknown/abstention proportion: 0.502 Abstention label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support Healthy/Background 0.68 0.34 0.46 221  Lupus 0.29 0.14 0.19 98  Unknown 0.00 0.00 0.00 0  accuracy 0.28 319  macro avg 0.33 0.16 0.22 319  weighted avg 0.56 0.28 0.38 319
,


---

{<TargetObsColumnEnum.disease: TargetObsColumn(obs_column_name='disease', is_target_binary_for_repertoire_composition_classifier=False, limited_to_disease=None, require_metadata_columns_present=None, confusion_matrix_expanded_column_name='disease.separate_past_exposures', blended_evaluation_column_name='disease.rollup')>: PosixPath('/users/maximz/code/boyd-immune-repertoire-classification/out/convergent_clusters/TCR/disease/train_smaller_model'), <TargetObsColumnEnum.disease_all_demographics_present: TargetObsColumn(obs_column_name='disease', is_target_binary_for_repertoire_composition_classifier=False, limited_to_disease=None, require_metadata_columns_present=['age', 'sex', 'ethnicity_condensed', 'age_group'], confusion_matrix_expanded_column_name='disease.separate_past_exposures', blended_evaluation_column_name='disease.rollup')>: PosixPath('/users/maximz/code/boyd-immune-repertoire-classification/out/convergent_clusters/TCR/disease_all_demographics_present/train_smaller_model'), <Ta

# GeneLocus.TCR, TargetObsColumnEnum.disease trained on train_smaller set

## Specimen predictions on validation set

Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
linearsvm_ovr,0.923 +/- 0.009 (in 3 folds),0.926 +/- 0.007 (in 3 folds),0.920 +/- 0.013 (in 3 folds),0.927 +/- 0.010 (in 3 folds),0.755 +/- 0.028 (in 3 folds),0.637 +/- 0.048 (in 3 folds),0.755,0.635,274.0,0.0,274.0,0.0,False
lasso_multiclass,0.903 +/- 0.017 (in 3 folds),0.903 +/- 0.024 (in 3 folds),0.901 +/- 0.016 (in 3 folds),0.905 +/- 0.022 (in 3 folds),0.766 +/- 0.031 (in 3 folds),0.665 +/- 0.040 (in 3 folds),0.766,0.662,274.0,0.0,274.0,0.0,False
ridge_cv,0.894 +/- 0.018 (in 3 folds),0.902 +/- 0.018 (in 3 folds),0.879 +/- 0.017 (in 3 folds),0.891 +/- 0.017 (in 3 folds),0.536 +/- 0.069 (in 3 folds),0.209 +/- 0.195 (in 3 folds),0.536,0.253,274.0,0.0,274.0,0.0,False
xgboost,0.891 +/- 0.011 (in 3 folds),0.886 +/- 0.013 (in 3 folds),0.889 +/- 0.011 (in 3 folds),0.890 +/- 0.012 (in 3 folds),0.730 +/- 0.034 (in 3 folds),0.607 +/- 0.050 (in 3 folds),0.73,0.597,274.0,0.0,274.0,0.0,False
lasso_cv,0.881 +/- 0.019 (in 3 folds),0.887 +/- 0.012 (in 3 folds),0.874 +/- 0.017 (in 3 folds),0.884 +/- 0.015 (in 3 folds),0.632 +/- 0.063 (in 3 folds),0.432 +/- 0.105 (in 3 folds),0.631,0.433,274.0,0.0,274.0,0.0,False
rf_multiclass,0.880 +/- 0.018 (in 3 folds),0.882 +/- 0.021 (in 3 folds),0.880 +/- 0.019 (in 3 folds),0.886 +/- 0.020 (in 3 folds),0.715 +/- 0.034 (in 3 folds),0.583 +/- 0.059 (in 3 folds),0.715,0.57,274.0,0.0,274.0,0.0,False
elasticnet_cv,0.863 +/- 0.057 (in 3 folds),0.863 +/- 0.064 (in 3 folds),0.851 +/- 0.054 (in 3 folds),0.856 +/- 0.060 (in 3 folds),0.598 +/- 0.058 (in 3 folds),0.370 +/- 0.106 (in 3 folds),0.599,0.37,274.0,0.0,274.0,0.0,False
dummy_stratified,0.502 +/- 0.017 (in 3 folds),0.509 +/- 0.012 (in 3 folds),0.512 +/- 0.006 (in 3 folds),0.516 +/- 0.005 (in 3 folds),0.336 +/- 0.029 (in 3 folds),-0.003 +/- 0.046 (in 3 folds),0.336,-0.003,274.0,0.0,274.0,0.0,False
dummy_most_frequent,0.500 +/- 0.000 (in 3 folds),0.500 +/- 0.000 (in 3 folds),0.500 +/- 0.000 (in 3 folds),0.500 +/- 0.000 (in 3 folds),0.474 +/- 0.003 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.474,0.0,274.0,0.0,274.0,0.0,True
"All results, sorted",,,,,,,,,,,,,

Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
linearsvm_ovr,0.923 +/- 0.009 (in 3 folds),0.926 +/- 0.007 (in 3 folds),0.920 +/- 0.013 (in 3 folds),0.927 +/- 0.010 (in 3 folds),0.755 +/- 0.028 (in 3 folds),0.637 +/- 0.048 (in 3 folds),0.755,0.635,274,0,274,0.0,False
lasso_multiclass,0.903 +/- 0.017 (in 3 folds),0.903 +/- 0.024 (in 3 folds),0.901 +/- 0.016 (in 3 folds),0.905 +/- 0.022 (in 3 folds),0.766 +/- 0.031 (in 3 folds),0.665 +/- 0.040 (in 3 folds),0.766,0.662,274,0,274,0.0,False
ridge_cv,0.894 +/- 0.018 (in 3 folds),0.902 +/- 0.018 (in 3 folds),0.879 +/- 0.017 (in 3 folds),0.891 +/- 0.017 (in 3 folds),0.536 +/- 0.069 (in 3 folds),0.209 +/- 0.195 (in 3 folds),0.536,0.253,274,0,274,0.0,False
xgboost,0.891 +/- 0.011 (in 3 folds),0.886 +/- 0.013 (in 3 folds),0.889 +/- 0.011 (in 3 folds),0.890 +/- 0.012 (in 3 folds),0.730 +/- 0.034 (in 3 folds),0.607 +/- 0.050 (in 3 folds),0.73,0.597,274,0,274,0.0,False
lasso_cv,0.881 +/- 0.019 (in 3 folds),0.887 +/- 0.012 (in 3 folds),0.874 +/- 0.017 (in 3 folds),0.884 +/- 0.015 (in 3 folds),0.632 +/- 0.063 (in 3 folds),0.432 +/- 0.105 (in 3 folds),0.631,0.433,274,0,274,0.0,False
rf_multiclass,0.880 +/- 0.018 (in 3 folds),0.882 +/- 0.021 (in 3 folds),0.880 +/- 0.019 (in 3 folds),0.886 +/- 0.020 (in 3 folds),0.715 +/- 0.034 (in 3 folds),0.583 +/- 0.059 (in 3 folds),0.715,0.57,274,0,274,0.0,False
elasticnet_cv,0.863 +/- 0.057 (in 3 folds),0.863 +/- 0.064 (in 3 folds),0.851 +/- 0.054 (in 3 folds),0.856 +/- 0.060 (in 3 folds),0.598 +/- 0.058 (in 3 folds),0.370 +/- 0.106 (in 3 folds),0.599,0.37,274,0,274,0.0,False
dummy_stratified,0.502 +/- 0.017 (in 3 folds),0.509 +/- 0.012 (in 3 folds),0.512 +/- 0.006 (in 3 folds),0.516 +/- 0.005 (in 3 folds),0.336 +/- 0.029 (in 3 folds),-0.003 +/- 0.046 (in 3 folds),0.336,-0.003,274,0,274,0.0,False
dummy_most_frequent,0.500 +/- 0.000 (in 3 folds),0.500 +/- 0.000 (in 3 folds),0.500 +/- 0.000 (in 3 folds),0.500 +/- 0.000 (in 3 folds),0.474 +/- 0.003 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.474,0.0,274,0,274,0.0,True


linearsvm_ovr,lasso_multiclass,ridge_cv,xgboost
Per-fold scores: ROC-AUC (weighted OvO): 0.923 +/- 0.009 (in 3 folds) ROC-AUC (macro OvO): 0.926 +/- 0.007 (in 3 folds) au-PRC (weighted OvO): 0.920 +/- 0.013 (in 3 folds) au-PRC (macro OvO): 0.927 +/- 0.010 (in 3 folds) Accuracy: 0.755 +/- 0.028 (in 3 folds) MCC: 0.637 +/- 0.048 (in 3 folds) Global scores: Accuracy: 0.755 MCC: 0.635 Global classification report:  precision recall f1-score support  Covid19 0.64 0.76 0.70 38  HIV 0.73 0.69 0.71 64 Healthy/Background 0.76 0.84 0.80 130  Lupus 0.96 0.60 0.74 42  accuracy 0.76 274  macro avg 0.78 0.72 0.74 274  weighted avg 0.77 0.76 0.75 274,Per-fold scores: ROC-AUC (weighted OvO): 0.903 +/- 0.017 (in 3 folds) ROC-AUC (macro OvO): 0.903 +/- 0.024 (in 3 folds) au-PRC (weighted OvO): 0.901 +/- 0.016 (in 3 folds) au-PRC (macro OvO): 0.905 +/- 0.022 (in 3 folds) Accuracy: 0.766 +/- 0.031 (in 3 folds) MCC: 0.665 +/- 0.040 (in 3 folds) Global scores: Accuracy: 0.766 MCC: 0.662 Global classification report:  precision recall f1-score support  Covid19 0.61 0.92 0.74 38  HIV 0.70 0.69 0.69 64 Healthy/Background 0.83 0.81 0.82 130  Lupus 0.93 0.62 0.74 42  accuracy 0.77 274  macro avg 0.77 0.76 0.75 274  weighted avg 0.79 0.77 0.77 274,Per-fold scores: ROC-AUC (weighted OvO): 0.894 +/- 0.018 (in 3 folds) ROC-AUC (macro OvO): 0.902 +/- 0.018 (in 3 folds) au-PRC (weighted OvO): 0.879 +/- 0.017 (in 3 folds) au-PRC (macro OvO): 0.891 +/- 0.017 (in 3 folds) Accuracy: 0.536 +/- 0.069 (in 3 folds) MCC: 0.209 +/- 0.195 (in 3 folds) Global scores: Accuracy: 0.536 MCC: 0.253 Global classification report:  precision recall f1-score support  Covid19 0.67 0.11 0.18 38  HIV 0.71 0.19 0.30 64 Healthy/Background 0.51 0.98 0.67 130  Lupus 1.00 0.10 0.17 42  accuracy 0.54 274  macro avg 0.72 0.34 0.33 274  weighted avg 0.65 0.54 0.44 274,Per-fold scores: ROC-AUC (weighted OvO): 0.891 +/- 0.011 (in 3 folds) ROC-AUC (macro OvO): 0.886 +/- 0.013 (in 3 folds) au-PRC (weighted OvO): 0.889 +/- 0.011 (in 3 folds) au-PRC (macro OvO): 0.890 +/- 0.012 (in 
3 folds) Accuracy: 0.730 +/- 0.034 (in 3 folds) MCC: 0.607 +/- 0.050 (in 3 folds) Global scores: Accuracy: 0.730 MCC: 0.597 Global classification report:  precision recall f1-score support  Covid19 0.66 0.71 0.68 38  HIV 0.63 0.59 0.61 64 Healthy/Background 0.77 0.83 0.80 130  Lupus 0.82 0.64 0.72 42  accuracy 0.73 274  macro avg 0.72 0.69 0.70 274  weighted avg 0.73 0.73 0.73 274
,,,


lasso_cv,rf_multiclass,elasticnet_cv,dummy_stratified
Per-fold scores: ROC-AUC (weighted OvO): 0.881 +/- 0.019 (in 3 folds) ROC-AUC (macro OvO): 0.887 +/- 0.012 (in 3 folds) au-PRC (weighted OvO): 0.874 +/- 0.017 (in 3 folds) au-PRC (macro OvO): 0.884 +/- 0.015 (in 3 folds) Accuracy: 0.632 +/- 0.063 (in 3 folds) MCC: 0.432 +/- 0.105 (in 3 folds) Global scores: Accuracy: 0.631 MCC: 0.433 Global classification report:  precision recall f1-score support  Covid19 0.80 0.21 0.33 38  HIV 0.76 0.50 0.60 64 Healthy/Background 0.58 0.95 0.72 130  Lupus 1.00 0.21 0.35 42  accuracy 0.63 274  macro avg 0.79 0.47 0.50 274  weighted avg 0.72 0.63 0.58 274,Per-fold scores: ROC-AUC (weighted OvO): 0.880 +/- 0.018 (in 3 folds) ROC-AUC (macro OvO): 0.882 +/- 0.021 (in 3 folds) au-PRC (weighted OvO): 0.880 +/- 0.019 (in 3 folds) au-PRC (macro OvO): 0.886 +/- 0.020 (in 3 folds) Accuracy: 0.715 +/- 0.034 (in 3 folds) MCC: 0.583 +/- 0.059 (in 3 folds) Global scores: Accuracy: 0.715 MCC: 0.570 Global classification report:  precision recall f1-score support  Covid19 0.68 0.61 0.64 38  HIV 0.65 0.58 0.61 64 Healthy/Background 0.74 0.85 0.79 130  Lupus 0.76 0.62 0.68 42  accuracy 0.72 274  macro avg 0.71 0.66 0.68 274  weighted avg 0.71 0.72 0.71 274,Per-fold scores: ROC-AUC (weighted OvO): 0.863 +/- 0.057 (in 3 folds) ROC-AUC (macro OvO): 0.863 +/- 0.064 (in 3 folds) au-PRC (weighted OvO): 0.851 +/- 0.054 (in 3 folds) au-PRC (macro OvO): 0.856 +/- 0.060 (in 3 folds) Accuracy: 0.598 +/- 0.058 (in 3 folds) MCC: 0.370 +/- 0.106 (in 3 folds) Global scores: Accuracy: 0.599 MCC: 0.370 Global classification report:  precision recall f1-score support  Covid19 0.62 0.26 0.37 38  HIV 0.71 0.39 0.51 64 Healthy/Background 0.56 0.92 0.70 130  Lupus 1.00 0.21 0.35 42  accuracy 0.60 274  macro avg 0.73 0.45 0.48 274  weighted avg 0.67 0.60 0.55 274,Per-fold scores: ROC-AUC (weighted OvO): 0.502 +/- 0.017 (in 3 folds) ROC-AUC (macro OvO): 0.509 +/- 0.012 (in 3 folds) au-PRC (weighted OvO): 0.512 +/- 0.006 (in 3 folds) au-PRC (macro OvO): 0.516 +/- 0.005 (in 
3 folds) Accuracy: 0.336 +/- 0.029 (in 3 folds) MCC: -0.003 +/- 0.046 (in 3 folds) Global scores: Accuracy: 0.336 MCC: -0.003 Global classification report:  precision recall f1-score support  Covid19 0.24 0.21 0.22 38  HIV 0.30 0.30 0.30 64 Healthy/Background 0.43 0.48 0.45 130  Lupus 0.09 0.07 0.08 42  accuracy 0.34 274  macro avg 0.26 0.26 0.26 274  weighted avg 0.32 0.34 0.33 274
,,,


dummy_most_frequent
Per-fold scores: ROC-AUC (weighted OvO): 0.500 +/- 0.000 (in 3 folds) ROC-AUC (macro OvO): 0.500 +/- 0.000 (in 3 folds) au-PRC (weighted OvO): 0.500 +/- 0.000 (in 3 folds) au-PRC (macro OvO): 0.500 +/- 0.000 (in 3 folds) Accuracy: 0.474 +/- 0.003 (in 3 folds) MCC: 0.000 +/- 0.000 (in 3 folds) Global scores: Accuracy: 0.474 MCC: 0.000 Global classification report:  precision recall f1-score support  Covid19 0.00 0.00 0.00 38  HIV 0.00 0.00 0.00 64 Healthy/Background 0.47 1.00 0.64 130  Lupus 0.00 0.00 0.00 42  accuracy 0.47 274  macro avg 0.12 0.25 0.16 274  weighted avg 0.23 0.47 0.31 274


## Apply train-smaller model -- Test set performance - With and without tuning on validation set

Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,Global evaluation column name global,Accuracy per fold with abstention,MCC per fold with abstention,Unknown/abstention proportion per fold with abstention,ROC-AUC (weighted OvO) per fold with abstention,ROC-AUC (macro OvO) per fold with abstention,au-PRC (weighted OvO) per fold with abstention,au-PRC (macro OvO) per fold with abstention,Accuracy global with abstention,MCC global with abstention,Unknown/abstention proportion global with abstention,Abstention label global with abstention,Global evaluation column name global with abstention,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
ridge_cv,0.894 +/- 0.019 (in 3 folds),0.905 +/- 0.018 (in 3 folds),0.871 +/- 0.026 (in 3 folds),0.889 +/- 0.024 (in 3 folds),0.534 +/- 0.081 (in 3 folds),0.214 +/- 0.215 (in 3 folds),0.534,0.264,disease.separate_past_exposures,,,,,,,,,,,,,414.0,0.0,414.0,0.0,False
ridge_cv.decision_thresholds_tuned,0.894 +/- 0.019 (in 3 folds),0.905 +/- 0.018 (in 3 folds),0.871 +/- 0.026 (in 3 folds),0.889 +/- 0.024 (in 3 folds),0.688 +/- 0.058 (in 3 folds),0.578 +/- 0.075 (in 3 folds),0.688,0.575,disease.separate_past_exposures,,,,,,,,,,,,,414.0,0.0,414.0,0.0,False
linearsvm_ovr,0.893 +/- 0.012 (in 3 folds),0.896 +/- 0.014 (in 3 folds),0.894 +/- 0.015 (in 3 folds),0.902 +/- 0.015 (in 3 folds),0.713 +/- 0.022 (in 3 folds),0.577 +/- 0.028 (in 3 folds),0.713,0.574,disease.separate_past_exposures,,,,,,,,,,,,,414.0,0.0,414.0,0.0,False
linearsvm_ovr.decision_thresholds_tuned,0.893 +/- 0.012 (in 3 folds),0.896 +/- 0.014 (in 3 folds),0.894 +/- 0.015 (in 3 folds),0.902 +/- 0.015 (in 3 folds),0.725 +/- 0.030 (in 3 folds),0.617 +/- 0.037 (in 3 folds),0.725,0.612,disease.separate_past_exposures,,,,,,,,,,,,,414.0,0.0,414.0,0.0,False
lasso_multiclass,0.885 +/- 0.005 (in 3 folds),0.886 +/- 0.004 (in 3 folds),0.879 +/- 0.011 (in 3 folds),0.884 +/- 0.011 (in 3 folds),0.702 +/- 0.016 (in 3 folds),0.575 +/- 0.023 (in 3 folds),0.702,0.569,disease.separate_past_exposures,0.701 +/- 0.017 (in 3 folds),0.573 +/- 0.021 (in 3 folds),0.007 +/- 0.000 (in 1 folds),0.887 +/- 0.002 (in 2 folds),0.889 +/- 0.002 (in 2 folds),0.885 +/- 0.007 (in 2 folds),0.890 +/- 0.003 (in 2 folds),0.7,0.567,0.002,Unknown,disease.separate_past_exposures,413.0,1.0,414.0,0.002415,False
lasso_multiclass.decision_thresholds_tuned,0.885 +/- 0.005 (in 3 folds),0.886 +/- 0.004 (in 3 folds),0.879 +/- 0.011 (in 3 folds),0.884 +/- 0.011 (in 3 folds),0.717 +/- 0.042 (in 3 folds),0.600 +/- 0.055 (in 3 folds),0.717,0.598,disease.separate_past_exposures,0.715 +/- 0.043 (in 3 folds),0.598 +/- 0.056 (in 3 folds),0.007 +/- 0.000 (in 1 folds),0.887 +/- 0.002 (in 2 folds),0.889 +/- 0.002 (in 2 folds),0.885 +/- 0.007 (in 2 folds),0.890 +/- 0.003 (in 2 folds),0.715,0.596,0.002,Unknown,disease.separate_past_exposures,413.0,1.0,414.0,0.002415,False
xgboost,0.883 +/- 0.003 (in 3 folds),0.882 +/- 0.005 (in 3 folds),0.876 +/- 0.008 (in 3 folds),0.880 +/- 0.006 (in 3 folds),0.714 +/- 0.011 (in 3 folds),0.572 +/- 0.015 (in 3 folds),0.714,0.571,disease.separate_past_exposures,0.713 +/- 0.012 (in 3 folds),0.570 +/- 0.016 (in 3 folds),0.007 +/- 0.000 (in 1 folds),0.883 +/- 0.004 (in 2 folds),0.881 +/- 0.006 (in 2 folds),0.881 +/- 0.004 (in 2 folds),0.883 +/- 0.004 (in 2 folds),0.713,0.569,0.002,Unknown,disease.separate_past_exposures,413.0,1.0,414.0,0.002415,False
xgboost.decision_thresholds_tuned,0.883 +/- 0.003 (in 3 folds),0.882 +/- 0.005 (in 3 folds),0.876 +/- 0.008 (in 3 folds),0.880 +/- 0.006 (in 3 folds),0.710 +/- 0.029 (in 3 folds),0.571 +/- 0.049 (in 3 folds),0.709,0.57,disease.separate_past_exposures,0.708 +/- 0.031 (in 3 folds),0.570 +/- 0.051 (in 3 folds),0.007 +/- 0.000 (in 1 folds),0.883 +/- 0.004 (in 2 folds),0.881 +/- 0.006 (in 2 folds),0.881 +/- 0.004 (in 2 folds),0.883 +/- 0.004 (in 2 folds),0.708,0.568,0.002,Unknown,disease.separate_past_exposures,413.0,1.0,414.0,0.002415,False
rf_multiclass,0.881 +/- 0.011 (in 3 folds),0.882 +/- 0.010 (in 3 folds),0.873 +/- 0.012 (in 3 folds),0.877 +/- 0.010 (in 3 folds),0.705 +/- 0.048 (in 3 folds),0.558 +/- 0.077 (in 3 folds),0.705,0.554,disease.separate_past_exposures,0.703 +/- 0.048 (in 3 folds),0.556 +/- 0.077 (in 3 folds),0.007 +/- 0.000 (in 1 folds),0.887 +/- 0.004 (in 2 folds),0.888 +/- 0.004 (in 2 folds),0.880 +/- 0.001 (in 2 folds),0.883 +/- 0.003 (in 2 folds),0.703,0.552,0.002,Unknown,disease.separate_past_exposures,413.0,1.0,414.0,0.002415,False
rf_multiclass.decision_thresholds_tuned,0.881 +/- 0.011 (in 3 folds),0.882 +/- 0.010 (in 3 folds),0.873 +/- 0.012 (in 3 folds),0.877 +/- 0.010 (in 3 folds),0.719 +/- 0.027 (in 3 folds),0.593 +/- 0.041 (in 3 folds),0.719,0.592,disease.separate_past_exposures,0.718 +/- 0.028 (in 3 folds),0.591 +/- 0.041 (in 3 folds),0.007 +/- 0.000 (in 1 folds),0.887 +/- 0.004 (in 2 folds),0.888 +/- 0.004 (in 2 folds),0.880 +/- 0.001 (in 2 folds),0.883 +/- 0.003 (in 2 folds),0.717,0.589,0.002,Unknown,disease.separate_past_exposures,413.0,1.0,414.0,0.002415,False

Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,Global evaluation column name global,Accuracy per fold with abstention,MCC per fold with abstention,Unknown/abstention proportion per fold with abstention,ROC-AUC (weighted OvO) per fold with abstention,ROC-AUC (macro OvO) per fold with abstention,au-PRC (weighted OvO) per fold with abstention,au-PRC (macro OvO) per fold with abstention,Accuracy global with abstention,MCC global with abstention,Unknown/abstention proportion global with abstention,Abstention label global with abstention,Global evaluation column name global with abstention,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
ridge_cv,0.894 +/- 0.019 (in 3 folds),0.905 +/- 0.018 (in 3 folds),0.871 +/- 0.026 (in 3 folds),0.889 +/- 0.024 (in 3 folds),0.534 +/- 0.081 (in 3 folds),0.214 +/- 0.215 (in 3 folds),0.534,0.264,disease.separate_past_exposures,,,,,,,,,,,,,414,0,414,0.0,False
ridge_cv.decision_thresholds_tuned,0.894 +/- 0.019 (in 3 folds),0.905 +/- 0.018 (in 3 folds),0.871 +/- 0.026 (in 3 folds),0.889 +/- 0.024 (in 3 folds),0.688 +/- 0.058 (in 3 folds),0.578 +/- 0.075 (in 3 folds),0.688,0.575,disease.separate_past_exposures,,,,,,,,,,,,,414,0,414,0.0,False
linearsvm_ovr,0.893 +/- 0.012 (in 3 folds),0.896 +/- 0.014 (in 3 folds),0.894 +/- 0.015 (in 3 folds),0.902 +/- 0.015 (in 3 folds),0.713 +/- 0.022 (in 3 folds),0.577 +/- 0.028 (in 3 folds),0.713,0.574,disease.separate_past_exposures,,,,,,,,,,,,,414,0,414,0.0,False
linearsvm_ovr.decision_thresholds_tuned,0.893 +/- 0.012 (in 3 folds),0.896 +/- 0.014 (in 3 folds),0.894 +/- 0.015 (in 3 folds),0.902 +/- 0.015 (in 3 folds),0.725 +/- 0.030 (in 3 folds),0.617 +/- 0.037 (in 3 folds),0.725,0.612,disease.separate_past_exposures,,,,,,,,,,,,,414,0,414,0.0,False
lasso_multiclass,0.885 +/- 0.005 (in 3 folds),0.886 +/- 0.004 (in 3 folds),0.879 +/- 0.011 (in 3 folds),0.884 +/- 0.011 (in 3 folds),0.702 +/- 0.016 (in 3 folds),0.575 +/- 0.023 (in 3 folds),0.702,0.569,disease.separate_past_exposures,0.701 +/- 0.017 (in 3 folds),0.573 +/- 0.021 (in 3 folds),0.007 +/- 0.000 (in 1 folds),0.887 +/- 0.002 (in 2 folds),0.889 +/- 0.002 (in 2 folds),0.885 +/- 0.007 (in 2 folds),0.890 +/- 0.003 (in 2 folds),0.7,0.567,0.002,Unknown,disease.separate_past_exposures,413,1,414,0.002415,False
lasso_multiclass.decision_thresholds_tuned,0.885 +/- 0.005 (in 3 folds),0.886 +/- 0.004 (in 3 folds),0.879 +/- 0.011 (in 3 folds),0.884 +/- 0.011 (in 3 folds),0.717 +/- 0.042 (in 3 folds),0.600 +/- 0.055 (in 3 folds),0.717,0.598,disease.separate_past_exposures,0.715 +/- 0.043 (in 3 folds),0.598 +/- 0.056 (in 3 folds),0.007 +/- 0.000 (in 1 folds),0.887 +/- 0.002 (in 2 folds),0.889 +/- 0.002 (in 2 folds),0.885 +/- 0.007 (in 2 folds),0.890 +/- 0.003 (in 2 folds),0.715,0.596,0.002,Unknown,disease.separate_past_exposures,413,1,414,0.002415,False
xgboost,0.883 +/- 0.003 (in 3 folds),0.882 +/- 0.005 (in 3 folds),0.876 +/- 0.008 (in 3 folds),0.880 +/- 0.006 (in 3 folds),0.714 +/- 0.011 (in 3 folds),0.572 +/- 0.015 (in 3 folds),0.714,0.571,disease.separate_past_exposures,0.713 +/- 0.012 (in 3 folds),0.570 +/- 0.016 (in 3 folds),0.007 +/- 0.000 (in 1 folds),0.883 +/- 0.004 (in 2 folds),0.881 +/- 0.006 (in 2 folds),0.881 +/- 0.004 (in 2 folds),0.883 +/- 0.004 (in 2 folds),0.713,0.569,0.002,Unknown,disease.separate_past_exposures,413,1,414,0.002415,False
xgboost.decision_thresholds_tuned,0.883 +/- 0.003 (in 3 folds),0.882 +/- 0.005 (in 3 folds),0.876 +/- 0.008 (in 3 folds),0.880 +/- 0.006 (in 3 folds),0.710 +/- 0.029 (in 3 folds),0.571 +/- 0.049 (in 3 folds),0.709,0.57,disease.separate_past_exposures,0.708 +/- 0.031 (in 3 folds),0.570 +/- 0.051 (in 3 folds),0.007 +/- 0.000 (in 1 folds),0.883 +/- 0.004 (in 2 folds),0.881 +/- 0.006 (in 2 folds),0.881 +/- 0.004 (in 2 folds),0.883 +/- 0.004 (in 2 folds),0.708,0.568,0.002,Unknown,disease.separate_past_exposures,413,1,414,0.002415,False
rf_multiclass,0.881 +/- 0.011 (in 3 folds),0.882 +/- 0.010 (in 3 folds),0.873 +/- 0.012 (in 3 folds),0.877 +/- 0.010 (in 3 folds),0.705 +/- 0.048 (in 3 folds),0.558 +/- 0.077 (in 3 folds),0.705,0.554,disease.separate_past_exposures,0.703 +/- 0.048 (in 3 folds),0.556 +/- 0.077 (in 3 folds),0.007 +/- 0.000 (in 1 folds),0.887 +/- 0.004 (in 2 folds),0.888 +/- 0.004 (in 2 folds),0.880 +/- 0.001 (in 2 folds),0.883 +/- 0.003 (in 2 folds),0.703,0.552,0.002,Unknown,disease.separate_past_exposures,413,1,414,0.002415,False
rf_multiclass.decision_thresholds_tuned,0.881 +/- 0.011 (in 3 folds),0.882 +/- 0.010 (in 3 folds),0.873 +/- 0.012 (in 3 folds),0.877 +/- 0.010 (in 3 folds),0.719 +/- 0.027 (in 3 folds),0.593 +/- 0.041 (in 3 folds),0.719,0.592,disease.separate_past_exposures,0.718 +/- 0.028 (in 3 folds),0.591 +/- 0.041 (in 3 folds),0.007 +/- 0.000 (in 1 folds),0.887 +/- 0.004 (in 2 folds),0.888 +/- 0.004 (in 2 folds),0.880 +/- 0.001 (in 2 folds),0.883 +/- 0.003 (in 2 folds),0.717,0.589,0.002,Unknown,disease.separate_past_exposures,413,1,414,0.002415,False


ridge_cv,ridge_cv.decision_thresholds_tuned,linearsvm_ovr,linearsvm_ovr.decision_thresholds_tuned
Per-fold scores: ROC-AUC (weighted OvO): 0.894 +/- 0.019 (in 3 folds) ROC-AUC (macro OvO): 0.905 +/- 0.018 (in 3 folds) au-PRC (weighted OvO): 0.871 +/- 0.026 (in 3 folds) au-PRC (macro OvO): 0.889 +/- 0.024 (in 3 folds) Accuracy: 0.534 +/- 0.081 (in 3 folds) MCC: 0.214 +/- 0.215 (in 3 folds) Global scores using column name disease.separate_past_exposures: Accuracy: 0.534 MCC: 0.264 Global evaluation column name: disease.separate_past_exposures Global classification report using column name disease.separate_past_exposures:  precision recall f1-score support  Covid19 0.90 0.16 0.26 58  HIV 0.83 0.19 0.31 98 Healthy/Background 0.50 0.97 0.66 194  Lupus 1.00 0.06 0.12 64  accuracy 0.53 414  macro avg 0.81 0.35 0.34 414  weighted avg 0.71 0.53 0.44 414,Per-fold scores: ROC-AUC (weighted OvO): 0.894 +/- 0.019 (in 3 folds) ROC-AUC (macro OvO): 0.905 +/- 0.018 (in 3 folds) au-PRC (weighted OvO): 0.871 +/- 0.026 (in 3 folds) au-PRC (macro OvO): 0.889 +/- 0.024 (in 3 folds) Accuracy: 0.688 +/- 0.058 (in 3 folds) MCC: 0.578 +/- 0.075 (in 3 folds) Global scores using column name disease.separate_past_exposures: Accuracy: 0.688 MCC: 0.575 Global evaluation column name: disease.separate_past_exposures Global classification report using column name disease.separate_past_exposures:  precision recall f1-score support  Covid19 0.54 0.97 0.69 58  HIV 0.69 0.71 0.70 98 Healthy/Background 0.82 0.63 0.71 194  Lupus 0.62 0.58 0.60 64  accuracy 0.69 414  macro avg 0.67 0.72 0.68 414  weighted avg 0.72 0.69 0.69 414,Per-fold scores: ROC-AUC (weighted OvO): 0.893 +/- 0.012 (in 3 folds) ROC-AUC (macro OvO): 0.896 +/- 0.014 (in 3 folds) au-PRC (weighted OvO): 0.894 +/- 0.015 (in 3 folds) au-PRC (macro OvO): 0.902 +/- 0.015 (in 3 folds) Accuracy: 0.713 +/- 0.022 (in 3 folds) MCC: 0.577 +/- 0.028 (in 3 folds) Global scores using column name disease.separate_past_exposures: Accuracy: 0.713 MCC: 0.574 Global evaluation column name: disease.separate_past_exposures Global classification report 
using column name disease.separate_past_exposures:  precision recall f1-score support  Covid19 0.67 0.84 0.75 58  HIV 0.69 0.65 0.67 98 Healthy/Background 0.71 0.77 0.74 194  Lupus 0.89 0.52 0.65 64  accuracy 0.71 414  macro avg 0.74 0.70 0.70 414  weighted avg 0.73 0.71 0.71 414,Per-fold scores: ROC-AUC (weighted OvO): 0.893 +/- 0.012 (in 3 folds) ROC-AUC (macro OvO): 0.896 +/- 0.014 (in 3 folds) au-PRC (weighted OvO): 0.894 +/- 0.015 (in 3 folds) au-PRC (macro OvO): 0.902 +/- 0.015 (in 3 folds) Accuracy: 0.725 +/- 0.030 (in 3 folds) MCC: 0.617 +/- 0.037 (in 3 folds) Global scores using column name disease.separate_past_exposures: Accuracy: 0.725 MCC: 0.612 Global evaluation column name: disease.separate_past_exposures Global classification report using column name disease.separate_past_exposures:  precision recall f1-score support  Covid19 0.62 0.97 0.75 58  HIV 0.65 0.71 0.68 98 Healthy/Background 0.82 0.71 0.76 194  Lupus 0.77 0.56 0.65 64  accuracy 0.72 414  macro avg 0.71 0.74 0.71 414  weighted avg 0.74 0.72 0.72 414
,,,


lasso_multiclass,lasso_multiclass.decision_thresholds_tuned,xgboost,xgboost.decision_thresholds_tuned
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.885 +/- 0.005 (in 3 folds) ROC-AUC (macro OvO): 0.886 +/- 0.004 (in 3 folds) au-PRC (weighted OvO): 0.879 +/- 0.011 (in 3 folds) au-PRC (macro OvO): 0.884 +/- 0.011 (in 3 folds) Accuracy: 0.702 +/- 0.016 (in 3 folds) MCC: 0.575 +/- 0.023 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.702 MCC: 0.569 Global evaluation column name: disease.separate_past_exposures Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.701 +/- 0.017 (in 3 folds) MCC: 0.573 +/- 0.021 (in 3 folds) Unknown/abstention proportion: 0.007 +/- 0.000 (in 1 folds) ROC-AUC (weighted OvO): 0.887 +/- 0.002 (in 2 folds) ROC-AUC (macro OvO): 0.889 +/- 0.002 (in 2 folds) au-PRC (weighted OvO): 0.885 +/- 0.007 (in 2 folds) au-PRC (macro OvO): 0.890 +/- 0.003 (in 2 folds) Global scores with abstention using column name disease.separate_past_exposures: Accuracy: 0.700 MCC: 0.567 Unknown/abstention proportion: 0.002 Abstention label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support  Covid19 0.57 0.86 0.69 58  HIV 0.68 0.68 0.68 98 Healthy/Background 0.76 0.74 0.75 194  Lupus 0.79 0.47 0.59 64  Unknown 0.00 0.00 0.00 0  accuracy 0.70 414  macro avg 0.56 0.55 0.54 414  weighted avg 0.72 0.70 0.70 414,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.885 +/- 0.005 (in 3 folds) ROC-AUC (macro OvO): 0.886 +/- 0.004 (in 3 folds) au-PRC (weighted OvO): 0.879 +/- 0.011 (in 3 folds) au-PRC (macro OvO): 0.884 +/- 0.011 (in 3 folds) Accuracy: 0.717 +/- 0.042 (in 3 folds) MCC: 0.600 +/- 0.055 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.717 MCC: 0.598 Global evaluation column name: disease.separate_past_exposures 
Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.715 +/- 0.043 (in 3 folds) MCC: 0.598 +/- 0.056 (in 3 folds) Unknown/abstention proportion: 0.007 +/- 0.000 (in 1 folds) ROC-AUC (weighted OvO): 0.887 +/- 0.002 (in 2 folds) ROC-AUC (macro OvO): 0.889 +/- 0.002 (in 2 folds) au-PRC (weighted OvO): 0.885 +/- 0.007 (in 2 folds) au-PRC (macro OvO): 0.890 +/- 0.003 (in 2 folds) Global scores with abstention using column name disease.separate_past_exposures: Accuracy: 0.715 MCC: 0.596 Unknown/abstention proportion: 0.002 Abstention label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support  Covid19 0.57 0.86 0.68 58  HIV 0.68 0.73 0.71 98 Healthy/Background 0.81 0.71 0.76 194  Lupus 0.75 0.56 0.64 64  Unknown 0.00 0.00 0.00 0  accuracy 0.71 414  macro avg 0.56 0.57 0.56 414  weighted avg 0.73 0.71 0.72 414,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.883 +/- 0.003 (in 3 folds) ROC-AUC (macro OvO): 0.882 +/- 0.005 (in 3 folds) au-PRC (weighted OvO): 0.876 +/- 0.008 (in 3 folds) au-PRC (macro OvO): 0.880 +/- 0.006 (in 3 folds) Accuracy: 0.714 +/- 0.011 (in 3 folds) MCC: 0.572 +/- 0.015 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.714 MCC: 0.571 Global evaluation column name: disease.separate_past_exposures Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.713 +/- 0.012 (in 3 folds) MCC: 0.570 +/- 0.016 (in 3 folds) Unknown/abstention proportion: 0.007 +/- 0.000 (in 1 folds) ROC-AUC (weighted OvO): 0.883 +/- 0.004 (in 2 folds) ROC-AUC (macro OvO): 0.881 +/- 0.006 (in 2 folds) au-PRC (weighted OvO): 0.881 +/- 0.004 (in 2 folds) au-PRC (macro OvO): 0.883 +/- 0.004 (in 2 folds) Global scores with abstention using column name 
disease.separate_past_exposures: Accuracy: 0.713 MCC: 0.569 Unknown/abstention proportion: 0.002 Abstention label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support  Covid19 0.65 0.57 0.61 58  HIV 0.71 0.61 0.66 98 Healthy/Background 0.73 0.83 0.77 194  Lupus 0.73 0.64 0.68 64  Unknown 0.00 0.00 0.00 0  accuracy 0.71 414  macro avg 0.56 0.53 0.54 414  weighted avg 0.71 0.71 0.71 414,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.883 +/- 0.003 (in 3 folds) ROC-AUC (macro OvO): 0.882 +/- 0.005 (in 3 folds) au-PRC (weighted OvO): 0.876 +/- 0.008 (in 3 folds) au-PRC (macro OvO): 0.880 +/- 0.006 (in 3 folds) Accuracy: 0.710 +/- 0.029 (in 3 folds) MCC: 0.571 +/- 0.049 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.709 MCC: 0.570 Global evaluation column name: disease.separate_past_exposures Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.708 +/- 0.031 (in 3 folds) MCC: 0.570 +/- 0.051 (in 3 folds) Unknown/abstention proportion: 0.007 +/- 0.000 (in 1 folds) ROC-AUC (weighted OvO): 0.883 +/- 0.004 (in 2 folds) ROC-AUC (macro OvO): 0.881 +/- 0.006 (in 2 folds) au-PRC (weighted OvO): 0.881 +/- 0.004 (in 2 folds) au-PRC (macro OvO): 0.883 +/- 0.004 (in 2 folds) Global scores with abstention using column name disease.separate_past_exposures: Accuracy: 0.708 MCC: 0.568 Unknown/abstention proportion: 0.002 Abstention label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support  Covid19 0.57 0.62 0.60 58  HIV 0.67 0.67 0.67 98 Healthy/Background 0.76 0.79 0.77 194  Lupus 0.76 0.59 0.67 64  Unknown 0.00 0.00 0.00 0  accuracy 0.71 414  macro avg 0.55 
0.54 0.54 414  weighted avg 0.71 0.71 0.71 414
,,,


rf_multiclass,rf_multiclass.decision_thresholds_tuned,elasticnet_cv,elasticnet_cv.decision_thresholds_tuned
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.881 +/- 0.011 (in 3 folds) ROC-AUC (macro OvO): 0.882 +/- 0.010 (in 3 folds) au-PRC (weighted OvO): 0.873 +/- 0.012 (in 3 folds) au-PRC (macro OvO): 0.877 +/- 0.010 (in 3 folds) Accuracy: 0.705 +/- 0.048 (in 3 folds) MCC: 0.558 +/- 0.077 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.705 MCC: 0.554 Global evaluation column name: disease.separate_past_exposures Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.703 +/- 0.048 (in 3 folds) MCC: 0.556 +/- 0.077 (in 3 folds) Unknown/abstention proportion: 0.007 +/- 0.000 (in 1 folds) ROC-AUC (weighted OvO): 0.887 +/- 0.004 (in 2 folds) ROC-AUC (macro OvO): 0.888 +/- 0.004 (in 2 folds) au-PRC (weighted OvO): 0.880 +/- 0.001 (in 2 folds) au-PRC (macro OvO): 0.883 +/- 0.003 (in 2 folds) Global scores with abstention using column name disease.separate_past_exposures: Accuracy: 0.703 MCC: 0.552 Unknown/abstention proportion: 0.002 Abstention label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support  Covid19 0.64 0.55 0.59 58  HIV 0.67 0.57 0.62 98 Healthy/Background 0.71 0.85 0.77 194  Lupus 0.78 0.61 0.68 64  Unknown 0.00 0.00 0.00 0  accuracy 0.70 414  macro avg 0.56 0.52 0.53 414  weighted avg 0.70 0.70 0.70 414,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.881 +/- 0.011 (in 3 folds) ROC-AUC (macro OvO): 0.882 +/- 0.010 (in 3 folds) au-PRC (weighted OvO): 0.873 +/- 0.012 (in 3 folds) au-PRC (macro OvO): 0.877 +/- 0.010 (in 3 folds) Accuracy: 0.719 +/- 0.027 (in 3 folds) MCC: 0.593 +/- 0.041 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.719 MCC: 0.592 Global evaluation column name: disease.separate_past_exposures 
Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.718 +/- 0.028 (in 3 folds) MCC: 0.591 +/- 0.041 (in 3 folds) Unknown/abstention proportion: 0.007 +/- 0.000 (in 1 folds) ROC-AUC (weighted OvO): 0.887 +/- 0.004 (in 2 folds) ROC-AUC (macro OvO): 0.888 +/- 0.004 (in 2 folds) au-PRC (weighted OvO): 0.880 +/- 0.001 (in 2 folds) au-PRC (macro OvO): 0.883 +/- 0.003 (in 2 folds) Global scores with abstention using column name disease.separate_past_exposures: Accuracy: 0.717 MCC: 0.589 Unknown/abstention proportion: 0.002 Abstention label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support  Covid19 0.57 0.81 0.67 58  HIV 0.66 0.61 0.63 98 Healthy/Background 0.79 0.78 0.79 194  Lupus 0.83 0.59 0.69 64  Unknown 0.00 0.00 0.00 0  accuracy 0.72 414  macro avg 0.57 0.56 0.56 414  weighted avg 0.73 0.72 0.72 414,Per-fold scores: ROC-AUC (weighted OvO): 0.866 +/- 0.056 (in 3 folds) ROC-AUC (macro OvO): 0.869 +/- 0.063 (in 3 folds) au-PRC (weighted OvO): 0.858 +/- 0.046 (in 3 folds) au-PRC (macro OvO): 0.867 +/- 0.055 (in 3 folds) Accuracy: 0.602 +/- 0.084 (in 3 folds) MCC: 0.374 +/- 0.151 (in 3 folds) Global scores using column name disease.separate_past_exposures: Accuracy: 0.601 MCC: 0.381 Global evaluation column name: disease.separate_past_exposures Global classification report using column name disease.separate_past_exposures:  precision recall f1-score support  Covid19 0.77 0.29 0.42 58  HIV 0.74 0.46 0.57 98 Healthy/Background 0.55 0.92 0.69 194  Lupus 1.00 0.12 0.22 64  accuracy 0.60 414  macro avg 0.77 0.45 0.48 414  weighted avg 0.70 0.60 0.55 414,Per-fold scores: ROC-AUC (weighted OvO): 0.866 +/- 0.056 (in 3 folds) ROC-AUC (macro OvO): 0.869 +/- 0.063 (in 3 folds) au-PRC (weighted OvO): 0.858 +/- 0.046 (in 3 folds) au-PRC (macro OvO): 0.867 +/- 0.055 (in 3 
folds) Accuracy: 0.625 +/- 0.022 (in 3 folds) MCC: 0.474 +/- 0.041 (in 3 folds) Global scores using column name disease.separate_past_exposures: Accuracy: 0.626 MCC: 0.471 Global evaluation column name: disease.separate_past_exposures Global classification report using column name disease.separate_past_exposures:  precision recall f1-score support  Covid19 0.47 0.98 0.63 58  HIV 0.61 0.32 0.42 98 Healthy/Background 0.71 0.72 0.72 194  Lupus 0.69 0.48 0.57 64  accuracy 0.63 414  macro avg 0.62 0.63 0.58 414  weighted avg 0.65 0.63 0.61 414
,,,


lasso_cv,lasso_cv.decision_thresholds_tuned
Per-fold scores: ROC-AUC (weighted OvO): 0.860 +/- 0.032 (in 3 folds) ROC-AUC (macro OvO): 0.865 +/- 0.032 (in 3 folds) au-PRC (weighted OvO): 0.858 +/- 0.029 (in 3 folds) au-PRC (macro OvO): 0.868 +/- 0.030 (in 3 folds) Accuracy: 0.584 +/- 0.070 (in 3 folds) MCC: 0.343 +/- 0.128 (in 3 folds) Global scores using column name disease.separate_past_exposures: Accuracy: 0.585 MCC: 0.349 Global evaluation column name: disease.separate_past_exposures Global classification report using column name disease.separate_past_exposures:  precision recall f1-score support  Covid19 0.65 0.19 0.29 58  HIV 0.73 0.44 0.55 98 Healthy/Background 0.54 0.92 0.68 194  Lupus 1.00 0.14 0.25 64  accuracy 0.58 414  macro avg 0.73 0.42 0.44 414  weighted avg 0.67 0.58 0.53 414,Per-fold scores: ROC-AUC (weighted OvO): 0.860 +/- 0.032 (in 3 folds) ROC-AUC (macro OvO): 0.865 +/- 0.032 (in 3 folds) au-PRC (weighted OvO): 0.858 +/- 0.029 (in 3 folds) au-PRC (macro OvO): 0.868 +/- 0.030 (in 3 folds) Accuracy: 0.681 +/- 0.042 (in 3 folds) MCC: 0.569 +/- 0.053 (in 3 folds) Global scores using column name disease.separate_past_exposures: Accuracy: 0.681 MCC: 0.556 Global evaluation column name: disease.separate_past_exposures Global classification report using column name disease.separate_past_exposures:  precision recall f1-score support  Covid19 0.59 0.95 0.73 58  HIV 0.63 0.70 0.67 98 Healthy/Background 0.79 0.64 0.71 194  Lupus 0.62 0.53 0.57 64  accuracy 0.68 414  macro avg 0.66 0.71 0.67 414  weighted avg 0.70 0.68 0.68 414
,


---

# GeneLocus.TCR, TargetObsColumnEnum.disease_all_demographics_present trained on train_smaller set

## Specimen predictions on validation set

Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,ROC-AUC (weighted OvO) per fold with abstention,ROC-AUC (macro OvO) per fold with abstention,au-PRC (weighted OvO) per fold with abstention,au-PRC (macro OvO) per fold with abstention,Accuracy per fold with abstention,MCC per fold with abstention,Unknown/abstention proportion per fold with abstention,Accuracy global with abstention,MCC global with abstention,Unknown/abstention proportion global with abstention,Abstention label global with abstention,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
linearsvm_ovr,0.907 +/- 0.009 (in 3 folds),0.906 +/- 0.016 (in 3 folds),0.889 +/- 0.006 (in 3 folds),0.892 +/- 0.002 (in 3 folds),0.749 +/- 0.028 (in 3 folds),0.639 +/- 0.055 (in 3 folds),0.749,0.636,0.912 +/- 0.003 (in 2 folds),0.915 +/- 0.002 (in 2 folds),0.886 +/- 0.000 (in 2 folds),0.893 +/- 0.001 (in 2 folds),0.746 +/- 0.029 (in 3 folds),0.636 +/- 0.056 (in 3 folds),0.013 +/- 0.000 (in 1 folds),0.746,0.633,0.004,Unknown,239.0,1.0,240.0,0.004167,False
lasso_multiclass,0.906 +/- 0.012 (in 3 folds),0.905 +/- 0.017 (in 3 folds),0.897 +/- 0.011 (in 3 folds),0.899 +/- 0.010 (in 3 folds),0.761 +/- 0.016 (in 3 folds),0.671 +/- 0.033 (in 3 folds),0.762,0.668,0.912 +/- 0.010 (in 2 folds),0.914 +/- 0.007 (in 2 folds),0.898 +/- 0.015 (in 2 folds),0.903 +/- 0.011 (in 2 folds),0.758 +/- 0.017 (in 3 folds),0.668 +/- 0.036 (in 3 folds),0.013 +/- 0.000 (in 1 folds),0.758,0.664,0.004,Unknown,239.0,1.0,240.0,0.004167,False
ridge_cv,0.889 +/- 0.008 (in 3 folds),0.892 +/- 0.013 (in 3 folds),0.874 +/- 0.010 (in 3 folds),0.881 +/- 0.016 (in 3 folds),0.547 +/- 0.115 (in 3 folds),0.174 +/- 0.301 (in 3 folds),0.548,0.286,0.893 +/- 0.003 (in 2 folds),0.899 +/- 0.000 (in 2 folds),0.880 +/- 0.002 (in 2 folds),0.889 +/- 0.006 (in 2 folds),0.545 +/- 0.117 (in 3 folds),0.189 +/- 0.289 (in 3 folds),0.013 +/- 0.000 (in 1 folds),0.546,0.284,0.004,Unknown,239.0,1.0,240.0,0.004167,False
xgboost,0.885 +/- 0.024 (in 3 folds),0.884 +/- 0.024 (in 3 folds),0.878 +/- 0.033 (in 3 folds),0.882 +/- 0.032 (in 3 folds),0.758 +/- 0.031 (in 3 folds),0.643 +/- 0.046 (in 3 folds),0.758,0.638,,,,,,,,,,,,240.0,0.0,240.0,0.0,False
rf_multiclass,0.885 +/- 0.014 (in 3 folds),0.882 +/- 0.008 (in 3 folds),0.881 +/- 0.016 (in 3 folds),0.879 +/- 0.009 (in 3 folds),0.716 +/- 0.022 (in 3 folds),0.573 +/- 0.032 (in 3 folds),0.715,0.571,0.886 +/- 0.019 (in 2 folds),0.884 +/- 0.011 (in 2 folds),0.878 +/- 0.022 (in 2 folds),0.879 +/- 0.013 (in 2 folds),0.713 +/- 0.019 (in 3 folds),0.569 +/- 0.027 (in 3 folds),0.013 +/- 0.000 (in 1 folds),0.713,0.568,0.004,Unknown,239.0,1.0,240.0,0.004167,False
elasticnet_cv,0.882 +/- 0.016 (in 3 folds),0.879 +/- 0.021 (in 3 folds),0.853 +/- 0.029 (in 3 folds),0.856 +/- 0.028 (in 3 folds),0.603 +/- 0.102 (in 3 folds),0.371 +/- 0.180 (in 3 folds),0.603,0.374,0.886 +/- 0.020 (in 2 folds),0.887 +/- 0.021 (in 2 folds),0.851 +/- 0.041 (in 2 folds),0.859 +/- 0.039 (in 2 folds),0.600 +/- 0.105 (in 3 folds),0.371 +/- 0.179 (in 3 folds),0.013 +/- 0.000 (in 1 folds),0.6,0.372,0.004,Unknown,239.0,1.0,240.0,0.004167,False
lasso_cv,0.876 +/- 0.027 (in 3 folds),0.876 +/- 0.035 (in 3 folds),0.864 +/- 0.030 (in 3 folds),0.870 +/- 0.033 (in 3 folds),0.615 +/- 0.049 (in 3 folds),0.388 +/- 0.104 (in 3 folds),0.615,0.392,0.892 +/- 0.004 (in 2 folds),0.896 +/- 0.003 (in 2 folds),0.881 +/- 0.002 (in 2 folds),0.889 +/- 0.001 (in 2 folds),0.612 +/- 0.050 (in 3 folds),0.387 +/- 0.104 (in 3 folds),0.013 +/- 0.000 (in 1 folds),0.613,0.39,0.004,Unknown,239.0,1.0,240.0,0.004167,False
dummy_stratified,0.531 +/- 0.035 (in 3 folds),0.523 +/- 0.032 (in 3 folds),0.529 +/- 0.023 (in 3 folds),0.526 +/- 0.020 (in 3 folds),0.405 +/- 0.062 (in 3 folds),0.088 +/- 0.087 (in 3 folds),0.404,0.086,,,,,,,,,,,,240.0,0.0,240.0,0.0,False
dummy_most_frequent,0.500 +/- 0.000 (in 3 folds),0.500 +/- 0.000 (in 3 folds),0.500 +/- 0.000 (in 3 folds),0.500 +/- 0.000 (in 3 folds),0.481 +/- 0.013 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.481,0.0,0.500 +/- 0.000 (in 2 folds),0.500 +/- 0.000 (in 2 folds),0.500 +/- 0.000 (in 2 folds),0.500 +/- 0.000 (in 2 folds),0.479 +/- 0.016 (in 3 folds),0.015 +/- 0.026 (in 3 folds),0.013 +/- 0.000 (in 1 folds),0.479,0.027,0.004,Unknown,239.0,1.0,240.0,0.004167,True
"All results, sorted",,,,,,,,,,,,,,,,,,,,,,,,

Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,ROC-AUC (weighted OvO) per fold with abstention,ROC-AUC (macro OvO) per fold with abstention,au-PRC (weighted OvO) per fold with abstention,au-PRC (macro OvO) per fold with abstention,Accuracy per fold with abstention,MCC per fold with abstention,Unknown/abstention proportion per fold with abstention,Accuracy global with abstention,MCC global with abstention,Unknown/abstention proportion global with abstention,Abstention label global with abstention,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
linearsvm_ovr,0.907 +/- 0.009 (in 3 folds),0.906 +/- 0.016 (in 3 folds),0.889 +/- 0.006 (in 3 folds),0.892 +/- 0.002 (in 3 folds),0.749 +/- 0.028 (in 3 folds),0.639 +/- 0.055 (in 3 folds),0.749,0.636,0.912 +/- 0.003 (in 2 folds),0.915 +/- 0.002 (in 2 folds),0.886 +/- 0.000 (in 2 folds),0.893 +/- 0.001 (in 2 folds),0.746 +/- 0.029 (in 3 folds),0.636 +/- 0.056 (in 3 folds),0.013 +/- 0.000 (in 1 folds),0.746,0.633,0.004,Unknown,239,1,240,0.004167,False
lasso_multiclass,0.906 +/- 0.012 (in 3 folds),0.905 +/- 0.017 (in 3 folds),0.897 +/- 0.011 (in 3 folds),0.899 +/- 0.010 (in 3 folds),0.761 +/- 0.016 (in 3 folds),0.671 +/- 0.033 (in 3 folds),0.762,0.668,0.912 +/- 0.010 (in 2 folds),0.914 +/- 0.007 (in 2 folds),0.898 +/- 0.015 (in 2 folds),0.903 +/- 0.011 (in 2 folds),0.758 +/- 0.017 (in 3 folds),0.668 +/- 0.036 (in 3 folds),0.013 +/- 0.000 (in 1 folds),0.758,0.664,0.004,Unknown,239,1,240,0.004167,False
ridge_cv,0.889 +/- 0.008 (in 3 folds),0.892 +/- 0.013 (in 3 folds),0.874 +/- 0.010 (in 3 folds),0.881 +/- 0.016 (in 3 folds),0.547 +/- 0.115 (in 3 folds),0.174 +/- 0.301 (in 3 folds),0.548,0.286,0.893 +/- 0.003 (in 2 folds),0.899 +/- 0.000 (in 2 folds),0.880 +/- 0.002 (in 2 folds),0.889 +/- 0.006 (in 2 folds),0.545 +/- 0.117 (in 3 folds),0.189 +/- 0.289 (in 3 folds),0.013 +/- 0.000 (in 1 folds),0.546,0.284,0.004,Unknown,239,1,240,0.004167,False
xgboost,0.885 +/- 0.024 (in 3 folds),0.884 +/- 0.024 (in 3 folds),0.878 +/- 0.033 (in 3 folds),0.882 +/- 0.032 (in 3 folds),0.758 +/- 0.031 (in 3 folds),0.643 +/- 0.046 (in 3 folds),0.758,0.638,,,,,,,,,,,,240,0,240,0.0,False
rf_multiclass,0.885 +/- 0.014 (in 3 folds),0.882 +/- 0.008 (in 3 folds),0.881 +/- 0.016 (in 3 folds),0.879 +/- 0.009 (in 3 folds),0.716 +/- 0.022 (in 3 folds),0.573 +/- 0.032 (in 3 folds),0.715,0.571,0.886 +/- 0.019 (in 2 folds),0.884 +/- 0.011 (in 2 folds),0.878 +/- 0.022 (in 2 folds),0.879 +/- 0.013 (in 2 folds),0.713 +/- 0.019 (in 3 folds),0.569 +/- 0.027 (in 3 folds),0.013 +/- 0.000 (in 1 folds),0.713,0.568,0.004,Unknown,239,1,240,0.004167,False
elasticnet_cv,0.882 +/- 0.016 (in 3 folds),0.879 +/- 0.021 (in 3 folds),0.853 +/- 0.029 (in 3 folds),0.856 +/- 0.028 (in 3 folds),0.603 +/- 0.102 (in 3 folds),0.371 +/- 0.180 (in 3 folds),0.603,0.374,0.886 +/- 0.020 (in 2 folds),0.887 +/- 0.021 (in 2 folds),0.851 +/- 0.041 (in 2 folds),0.859 +/- 0.039 (in 2 folds),0.600 +/- 0.105 (in 3 folds),0.371 +/- 0.179 (in 3 folds),0.013 +/- 0.000 (in 1 folds),0.6,0.372,0.004,Unknown,239,1,240,0.004167,False
lasso_cv,0.876 +/- 0.027 (in 3 folds),0.876 +/- 0.035 (in 3 folds),0.864 +/- 0.030 (in 3 folds),0.870 +/- 0.033 (in 3 folds),0.615 +/- 0.049 (in 3 folds),0.388 +/- 0.104 (in 3 folds),0.615,0.392,0.892 +/- 0.004 (in 2 folds),0.896 +/- 0.003 (in 2 folds),0.881 +/- 0.002 (in 2 folds),0.889 +/- 0.001 (in 2 folds),0.612 +/- 0.050 (in 3 folds),0.387 +/- 0.104 (in 3 folds),0.013 +/- 0.000 (in 1 folds),0.613,0.39,0.004,Unknown,239,1,240,0.004167,False
dummy_stratified,0.531 +/- 0.035 (in 3 folds),0.523 +/- 0.032 (in 3 folds),0.529 +/- 0.023 (in 3 folds),0.526 +/- 0.020 (in 3 folds),0.405 +/- 0.062 (in 3 folds),0.088 +/- 0.087 (in 3 folds),0.404,0.086,,,,,,,,,,,,240,0,240,0.0,False
dummy_most_frequent,0.500 +/- 0.000 (in 3 folds),0.500 +/- 0.000 (in 3 folds),0.500 +/- 0.000 (in 3 folds),0.500 +/- 0.000 (in 3 folds),0.481 +/- 0.013 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.481,0.0,0.500 +/- 0.000 (in 2 folds),0.500 +/- 0.000 (in 2 folds),0.500 +/- 0.000 (in 2 folds),0.500 +/- 0.000 (in 2 folds),0.479 +/- 0.016 (in 3 folds),0.015 +/- 0.026 (in 3 folds),0.013 +/- 0.000 (in 1 folds),0.479,0.027,0.004,Unknown,239,1,240,0.004167,True


linearsvm_ovr,lasso_multiclass,ridge_cv,xgboost
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.907 +/- 0.009 (in 3 folds) ROC-AUC (macro OvO): 0.906 +/- 0.016 (in 3 folds) au-PRC (weighted OvO): 0.889 +/- 0.006 (in 3 folds) au-PRC (macro OvO): 0.892 +/- 0.002 (in 3 folds) Accuracy: 0.749 +/- 0.028 (in 3 folds) MCC: 0.639 +/- 0.055 (in 3 folds) Global scores without abstention: Accuracy: 0.749 MCC: 0.636 Per-fold scores with abstention (note that abstentions not included in probability-based scores): ROC-AUC (weighted OvO): 0.912 +/- 0.003 (in 2 folds) ROC-AUC (macro OvO): 0.915 +/- 0.002 (in 2 folds) au-PRC (weighted OvO): 0.886 +/- 0.000 (in 2 folds) au-PRC (macro OvO): 0.893 +/- 0.001 (in 2 folds) Accuracy: 0.746 +/- 0.029 (in 3 folds) MCC: 0.636 +/- 0.056 (in 3 folds) Unknown/abstention proportion: 0.013 +/- 0.000 (in 1 folds) Global scores with abstention: Accuracy: 0.746 MCC: 0.633 Unknown/abstention proportion: 0.004 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  Covid19 0.52 0.80 0.63 30  HIV 0.74 0.64 0.69 55 Healthy/Background 0.84 0.80 0.82 115  Lupus 0.78 0.70 0.74 40  Unknown 0.00 0.00 0.00 0  accuracy 0.75 240  macro avg 0.58 0.59 0.57 240  weighted avg 0.77 0.75 0.75 240,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.906 +/- 0.012 (in 3 folds) ROC-AUC (macro OvO): 0.905 +/- 0.017 (in 3 folds) au-PRC (weighted OvO): 0.897 +/- 0.011 (in 3 folds) au-PRC (macro OvO): 0.899 +/- 0.010 (in 3 folds) Accuracy: 0.761 +/- 0.016 (in 3 folds) MCC: 0.671 +/- 0.033 (in 3 folds) Global scores without abstention: Accuracy: 0.762 MCC: 0.668 Per-fold scores with abstention (note that abstentions not included in probability-based scores): ROC-AUC (weighted OvO): 0.912 +/- 0.010 (in 2 folds) ROC-AUC (macro OvO): 0.914 +/- 0.007 (in 2 folds) au-PRC (weighted OvO): 0.898 +/- 0.015 (in 2 folds) au-PRC (macro OvO): 0.903 +/- 0.011 (in 2 folds) Accuracy: 0.758 +/- 0.017 (in 3 folds) MCC: 0.668 +/- 0.036 (in 3 folds) Unknown/abstention 
proportion: 0.013 +/- 0.000 (in 1 folds) Global scores with abstention: Accuracy: 0.758 MCC: 0.664 Unknown/abstention proportion: 0.004 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  Covid19 0.54 0.90 0.68 30  HIV 0.72 0.71 0.72 55 Healthy/Background 0.92 0.76 0.83 115  Lupus 0.72 0.72 0.73 40  Unknown 0.00 0.00 0.00 0  accuracy 0.76 240  macro avg 0.58 0.62 0.59 240  weighted avg 0.79 0.76 0.77 240,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.889 +/- 0.008 (in 3 folds) ROC-AUC (macro OvO): 0.892 +/- 0.013 (in 3 folds) au-PRC (weighted OvO): 0.874 +/- 0.010 (in 3 folds) au-PRC (macro OvO): 0.881 +/- 0.016 (in 3 folds) Accuracy: 0.547 +/- 0.115 (in 3 folds) MCC: 0.174 +/- 0.301 (in 3 folds) Global scores without abstention: Accuracy: 0.548 MCC: 0.286 Per-fold scores with abstention (note that abstentions not included in probability-based scores): ROC-AUC (weighted OvO): 0.893 +/- 0.003 (in 2 folds) ROC-AUC (macro OvO): 0.899 +/- 0.000 (in 2 folds) au-PRC (weighted OvO): 0.880 +/- 0.002 (in 2 folds) au-PRC (macro OvO): 0.889 +/- 0.006 (in 2 folds) Accuracy: 0.545 +/- 0.117 (in 3 folds) MCC: 0.189 +/- 0.289 (in 3 folds) Unknown/abstention proportion: 0.013 +/- 0.000 (in 1 folds) Global scores with abstention: Accuracy: 0.546 MCC: 0.284 Unknown/abstention proportion: 0.004 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  Covid19 0.75 0.10 0.18 30  HIV 0.90 0.16 0.28 55 Healthy/Background 0.52 1.00 0.68 115  Lupus 1.00 0.10 0.18 40  Unknown 0.00 0.00 0.00 0  accuracy 0.55 240  macro avg 0.63 0.27 0.26 240  weighted avg 0.72 0.55 0.44 240,Per-fold scores: ROC-AUC (weighted OvO): 0.885 +/- 0.024 (in 3 folds) ROC-AUC (macro OvO): 0.884 +/- 0.024 (in 3 folds) au-PRC (weighted OvO): 0.878 +/- 0.033 (in 3 folds) au-PRC (macro OvO): 0.882 +/- 0.032 (in 3 folds) Accuracy: 0.758 +/- 0.031 (in 3 folds) MCC: 0.643 +/- 0.046 (in 3 folds) Global 
scores: Accuracy: 0.758 MCC: 0.638 Global classification report:  precision recall f1-score support  Covid19 0.59 0.57 0.58 30  HIV 0.71 0.64 0.67 55 Healthy/Background 0.79 0.84 0.82 115  Lupus 0.85 0.82 0.84 40  accuracy 0.76 240  macro avg 0.73 0.72 0.72 240  weighted avg 0.76 0.76 0.76 240
,,,


rf_multiclass,elasticnet_cv,lasso_cv,dummy_stratified
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.885 +/- 0.014 (in 3 folds) ROC-AUC (macro OvO): 0.882 +/- 0.008 (in 3 folds) au-PRC (weighted OvO): 0.881 +/- 0.016 (in 3 folds) au-PRC (macro OvO): 0.879 +/- 0.009 (in 3 folds) Accuracy: 0.716 +/- 0.022 (in 3 folds) MCC: 0.573 +/- 0.032 (in 3 folds) Global scores without abstention: Accuracy: 0.715 MCC: 0.571 Per-fold scores with abstention (note that abstentions not included in probability-based scores): ROC-AUC (weighted OvO): 0.886 +/- 0.019 (in 2 folds) ROC-AUC (macro OvO): 0.884 +/- 0.011 (in 2 folds) au-PRC (weighted OvO): 0.878 +/- 0.022 (in 2 folds) au-PRC (macro OvO): 0.879 +/- 0.013 (in 2 folds) Accuracy: 0.713 +/- 0.019 (in 3 folds) MCC: 0.569 +/- 0.027 (in 3 folds) Unknown/abstention proportion: 0.013 +/- 0.000 (in 1 folds) Global scores with abstention: Accuracy: 0.713 MCC: 0.568 Unknown/abstention proportion: 0.004 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  Covid19 0.41 0.40 0.41 30  HIV 0.73 0.67 0.70 55 Healthy/Background 0.78 0.85 0.82 115  Lupus 0.71 0.60 0.65 40  Unknown 0.00 0.00 0.00 0  accuracy 0.71 240  macro avg 0.53 0.50 0.51 240  weighted avg 0.71 0.71 0.71 240,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.882 +/- 0.016 (in 3 folds) ROC-AUC (macro OvO): 0.879 +/- 0.021 (in 3 folds) au-PRC (weighted OvO): 0.853 +/- 0.029 (in 3 folds) au-PRC (macro OvO): 0.856 +/- 0.028 (in 3 folds) Accuracy: 0.603 +/- 0.102 (in 3 folds) MCC: 0.371 +/- 0.180 (in 3 folds) Global scores without abstention: Accuracy: 0.603 MCC: 0.374 Per-fold scores with abstention (note that abstentions not included in probability-based scores): ROC-AUC (weighted OvO): 0.886 +/- 0.020 (in 2 folds) ROC-AUC (macro OvO): 0.887 +/- 0.021 (in 2 folds) au-PRC (weighted OvO): 0.851 +/- 0.041 (in 2 folds) au-PRC (macro OvO): 0.859 +/- 0.039 (in 2 folds) Accuracy: 0.600 +/- 0.105 (in 3 folds) MCC: 0.371 +/- 0.179 (in 3 folds) Unknown/abstention 
proportion: 0.013 +/- 0.000 (in 1 folds) Global scores with abstention: Accuracy: 0.600 MCC: 0.372 Unknown/abstention proportion: 0.004 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  Covid19 1.00 0.03 0.06 30  HIV 0.74 0.42 0.53 55 Healthy/Background 0.57 0.97 0.72 115  Lupus 0.80 0.20 0.32 40  Unknown 0.00 0.00 0.00 0  accuracy 0.60 240  macro avg 0.62 0.33 0.33 240  weighted avg 0.70 0.60 0.53 240,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.876 +/- 0.027 (in 3 folds) ROC-AUC (macro OvO): 0.876 +/- 0.035 (in 3 folds) au-PRC (weighted OvO): 0.864 +/- 0.030 (in 3 folds) au-PRC (macro OvO): 0.870 +/- 0.033 (in 3 folds) Accuracy: 0.615 +/- 0.049 (in 3 folds) MCC: 0.388 +/- 0.104 (in 3 folds) Global scores without abstention: Accuracy: 0.615 MCC: 0.392 Per-fold scores with abstention (note that abstentions not included in probability-based scores): ROC-AUC (weighted OvO): 0.892 +/- 0.004 (in 2 folds) ROC-AUC (macro OvO): 0.896 +/- 0.003 (in 2 folds) au-PRC (weighted OvO): 0.881 +/- 0.002 (in 2 folds) au-PRC (macro OvO): 0.889 +/- 0.001 (in 2 folds) Accuracy: 0.612 +/- 0.050 (in 3 folds) MCC: 0.387 +/- 0.104 (in 3 folds) Unknown/abstention proportion: 0.013 +/- 0.000 (in 1 folds) Global scores with abstention: Accuracy: 0.613 MCC: 0.390 Unknown/abstention proportion: 0.004 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  Covid19 0.67 0.13 0.22 30  HIV 0.71 0.49 0.58 55 Healthy/Background 0.58 0.93 0.71 115  Lupus 1.00 0.23 0.37 40  Unknown 0.00 0.00 0.00 0  accuracy 0.61 240  macro avg 0.59 0.36 0.38 240  weighted avg 0.69 0.61 0.56 240,Per-fold scores: ROC-AUC (weighted OvO): 0.531 +/- 0.035 (in 3 folds) ROC-AUC (macro OvO): 0.523 +/- 0.032 (in 3 folds) au-PRC (weighted OvO): 0.529 +/- 0.023 (in 3 folds) au-PRC (macro OvO): 0.526 +/- 0.020 (in 3 folds) Accuracy: 0.405 +/- 0.062 (in 3 folds) MCC: 0.088 +/- 0.087 (in 3 folds) Global 
scores: Accuracy: 0.404 MCC: 0.086 Global classification report:  precision recall f1-score support  Covid19 0.06 0.03 0.04 30  HIV 0.39 0.45 0.42 55 Healthy/Background 0.53 0.60 0.57 115  Lupus 0.07 0.05 0.06 40  accuracy 0.40 240  macro avg 0.26 0.28 0.27 240  weighted avg 0.36 0.40 0.38 240
,,,


dummy_most_frequent
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.500 +/- 0.000 (in 3 folds) ROC-AUC (macro OvO): 0.500 +/- 0.000 (in 3 folds) au-PRC (weighted OvO): 0.500 +/- 0.000 (in 3 folds) au-PRC (macro OvO): 0.500 +/- 0.000 (in 3 folds) Accuracy: 0.481 +/- 0.013 (in 3 folds) MCC: 0.000 +/- 0.000 (in 3 folds) Global scores without abstention: Accuracy: 0.481 MCC: 0.000 Per-fold scores with abstention (note that abstentions not included in probability-based scores): ROC-AUC (weighted OvO): 0.500 +/- 0.000 (in 2 folds) ROC-AUC (macro OvO): 0.500 +/- 0.000 (in 2 folds) au-PRC (weighted OvO): 0.500 +/- 0.000 (in 2 folds) au-PRC (macro OvO): 0.500 +/- 0.000 (in 2 folds) Accuracy: 0.479 +/- 0.016 (in 3 folds) MCC: 0.015 +/- 0.026 (in 3 folds) Unknown/abstention proportion: 0.013 +/- 0.000 (in 1 folds) Global scores with abstention: Accuracy: 0.479 MCC: 0.027 Unknown/abstention proportion: 0.004 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  Covid19 0.00 0.00 0.00 30  HIV 0.00 0.00 0.00 55 Healthy/Background 0.48 1.00 0.65 115  Lupus 0.00 0.00 0.00 40  Unknown 0.00 0.00 0.00 0  accuracy 0.48 240  macro avg 0.10 0.20 0.13 240  weighted avg 0.23 0.48 0.31 240


## Apply train-smaller model -- Test set performance - With and without tuning on validation set

Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,Global evaluation column name global,Accuracy per fold with abstention,MCC per fold with abstention,Unknown/abstention proportion per fold with abstention,ROC-AUC (weighted OvO) per fold with abstention,ROC-AUC (macro OvO) per fold with abstention,au-PRC (weighted OvO) per fold with abstention,au-PRC (macro OvO) per fold with abstention,Accuracy global with abstention,MCC global with abstention,Unknown/abstention proportion global with abstention,Abstention label global with abstention,Global evaluation column name global with abstention,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
lasso_cv,0.879 +/- 0.020 (in 3 folds),0.882 +/- 0.025 (in 3 folds),0.850 +/- 0.023 (in 3 folds),0.858 +/- 0.030 (in 3 folds),0.615 +/- 0.079 (in 3 folds),0.411 +/- 0.098 (in 3 folds),0.615,0.407,disease.separate_past_exposures,0.611 +/- 0.077 (in 3 folds),0.408 +/- 0.097 (in 3 folds),0.017 +/- 0.000 (in 1 folds),0.882 +/- 0.027 (in 2 folds),0.887 +/- 0.033 (in 2 folds),0.851 +/- 0.032 (in 2 folds),0.863 +/- 0.042 (in 2 folds),0.612,0.404,0.006,Unknown,disease.separate_past_exposures,356.0,2.0,358.0,0.005587,False
lasso_cv.decision_thresholds_tuned,0.879 +/- 0.020 (in 3 folds),0.882 +/- 0.025 (in 3 folds),0.850 +/- 0.023 (in 3 folds),0.858 +/- 0.030 (in 3 folds),0.635 +/- 0.091 (in 3 folds),0.474 +/- 0.156 (in 3 folds),0.635,0.461,disease.separate_past_exposures,0.631 +/- 0.086 (in 3 folds),0.469 +/- 0.150 (in 3 folds),0.017 +/- 0.000 (in 1 folds),0.882 +/- 0.027 (in 2 folds),0.887 +/- 0.033 (in 2 folds),0.851 +/- 0.032 (in 2 folds),0.863 +/- 0.042 (in 2 folds),0.631,0.458,0.006,Unknown,disease.separate_past_exposures,356.0,2.0,358.0,0.005587,False
lasso_multiclass,0.876 +/- 0.016 (in 3 folds),0.877 +/- 0.017 (in 3 folds),0.859 +/- 0.025 (in 3 folds),0.865 +/- 0.030 (in 3 folds),0.682 +/- 0.044 (in 3 folds),0.550 +/- 0.050 (in 3 folds),0.683,0.548,disease.separate_past_exposures,0.679 +/- 0.047 (in 3 folds),0.546 +/- 0.053 (in 3 folds),0.017 +/- 0.000 (in 1 folds),0.876 +/- 0.023 (in 2 folds),0.880 +/- 0.023 (in 2 folds),0.871 +/- 0.020 (in 2 folds),0.880 +/- 0.023 (in 2 folds),0.679,0.544,0.006,Unknown,disease.separate_past_exposures,356.0,2.0,358.0,0.005587,False
lasso_multiclass.decision_thresholds_tuned,0.876 +/- 0.016 (in 3 folds),0.877 +/- 0.017 (in 3 folds),0.859 +/- 0.025 (in 3 folds),0.865 +/- 0.030 (in 3 folds),0.691 +/- 0.046 (in 3 folds),0.560 +/- 0.052 (in 3 folds),0.691,0.558,disease.separate_past_exposures,0.687 +/- 0.048 (in 3 folds),0.556 +/- 0.053 (in 3 folds),0.017 +/- 0.000 (in 1 folds),0.876 +/- 0.023 (in 2 folds),0.880 +/- 0.023 (in 2 folds),0.871 +/- 0.020 (in 2 folds),0.880 +/- 0.023 (in 2 folds),0.687,0.553,0.006,Unknown,disease.separate_past_exposures,356.0,2.0,358.0,0.005587,False
linearsvm_ovr,0.875 +/- 0.018 (in 3 folds),0.873 +/- 0.018 (in 3 folds),0.857 +/- 0.024 (in 3 folds),0.861 +/- 0.029 (in 3 folds),0.682 +/- 0.053 (in 3 folds),0.542 +/- 0.064 (in 3 folds),0.683,0.538,disease.separate_past_exposures,0.678 +/- 0.053 (in 3 folds),0.537 +/- 0.064 (in 3 folds),0.017 +/- 0.000 (in 1 folds),0.875 +/- 0.026 (in 2 folds),0.876 +/- 0.025 (in 2 folds),0.867 +/- 0.024 (in 2 folds),0.874 +/- 0.026 (in 2 folds),0.679,0.534,0.006,Unknown,disease.separate_past_exposures,356.0,2.0,358.0,0.005587,False
linearsvm_ovr.decision_thresholds_tuned,0.875 +/- 0.018 (in 3 folds),0.873 +/- 0.018 (in 3 folds),0.857 +/- 0.024 (in 3 folds),0.861 +/- 0.029 (in 3 folds),0.688 +/- 0.050 (in 3 folds),0.556 +/- 0.057 (in 3 folds),0.688,0.554,disease.separate_past_exposures,0.684 +/- 0.051 (in 3 folds),0.552 +/- 0.058 (in 3 folds),0.017 +/- 0.000 (in 1 folds),0.875 +/- 0.026 (in 2 folds),0.876 +/- 0.025 (in 2 folds),0.867 +/- 0.024 (in 2 folds),0.874 +/- 0.026 (in 2 folds),0.684,0.55,0.006,Unknown,disease.separate_past_exposures,356.0,2.0,358.0,0.005587,False
ridge_cv,0.874 +/- 0.028 (in 3 folds),0.879 +/- 0.032 (in 3 folds),0.836 +/- 0.031 (in 3 folds),0.847 +/- 0.038 (in 3 folds),0.519 +/- 0.123 (in 3 folds),0.155 +/- 0.269 (in 3 folds),0.52,0.24,disease.separate_past_exposures,0.516 +/- 0.125 (in 3 folds),0.173 +/- 0.255 (in 3 folds),0.017 +/- 0.000 (in 1 folds),0.880 +/- 0.037 (in 2 folds),0.889 +/- 0.039 (in 2 folds),0.845 +/- 0.038 (in 2 folds),0.860 +/- 0.043 (in 2 folds),0.517,0.238,0.006,Unknown,disease.separate_past_exposures,356.0,2.0,358.0,0.005587,False
ridge_cv.decision_thresholds_tuned,0.874 +/- 0.028 (in 3 folds),0.879 +/- 0.032 (in 3 folds),0.836 +/- 0.031 (in 3 folds),0.847 +/- 0.038 (in 3 folds),0.502 +/- 0.233 (in 3 folds),0.312 +/- 0.287 (in 3 folds),0.503,0.334,disease.separate_past_exposures,0.499 +/- 0.231 (in 3 folds),0.308 +/- 0.286 (in 3 folds),0.017 +/- 0.000 (in 1 folds),0.880 +/- 0.037 (in 2 folds),0.889 +/- 0.039 (in 2 folds),0.845 +/- 0.038 (in 2 folds),0.860 +/- 0.043 (in 2 folds),0.5,0.33,0.006,Unknown,disease.separate_past_exposures,356.0,2.0,358.0,0.005587,False
rf_multiclass,0.874 +/- 0.009 (in 3 folds),0.874 +/- 0.011 (in 3 folds),0.853 +/- 0.017 (in 3 folds),0.858 +/- 0.022 (in 3 folds),0.680 +/- 0.039 (in 3 folds),0.530 +/- 0.046 (in 3 folds),0.68,0.527,disease.separate_past_exposures,0.676 +/- 0.037 (in 3 folds),0.526 +/- 0.043 (in 3 folds),0.017 +/- 0.000 (in 1 folds),0.873 +/- 0.013 (in 2 folds),0.875 +/- 0.015 (in 2 folds),0.862 +/- 0.012 (in 2 folds),0.869 +/- 0.017 (in 2 folds),0.676,0.524,0.006,Unknown,disease.separate_past_exposures,356.0,2.0,358.0,0.005587,False
rf_multiclass.decision_thresholds_tuned,0.874 +/- 0.009 (in 3 folds),0.874 +/- 0.011 (in 3 folds),0.853 +/- 0.017 (in 3 folds),0.858 +/- 0.022 (in 3 folds),0.691 +/- 0.030 (in 3 folds),0.564 +/- 0.032 (in 3 folds),0.691,0.561,disease.separate_past_exposures,0.687 +/- 0.034 (in 3 folds),0.560 +/- 0.036 (in 3 folds),0.017 +/- 0.000 (in 1 folds),0.873 +/- 0.013 (in 2 folds),0.875 +/- 0.015 (in 2 folds),0.862 +/- 0.012 (in 2 folds),0.869 +/- 0.017 (in 2 folds),0.687,0.557,0.006,Unknown,disease.separate_past_exposures,356.0,2.0,358.0,0.005587,False

Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,Global evaluation column name global,Accuracy per fold with abstention,MCC per fold with abstention,Unknown/abstention proportion per fold with abstention,ROC-AUC (weighted OvO) per fold with abstention,ROC-AUC (macro OvO) per fold with abstention,au-PRC (weighted OvO) per fold with abstention,au-PRC (macro OvO) per fold with abstention,Accuracy global with abstention,MCC global with abstention,Unknown/abstention proportion global with abstention,Abstention label global with abstention,Global evaluation column name global with abstention,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
lasso_cv,0.879 +/- 0.020 (in 3 folds),0.882 +/- 0.025 (in 3 folds),0.850 +/- 0.023 (in 3 folds),0.858 +/- 0.030 (in 3 folds),0.615 +/- 0.079 (in 3 folds),0.411 +/- 0.098 (in 3 folds),0.615,0.407,disease.separate_past_exposures,0.611 +/- 0.077 (in 3 folds),0.408 +/- 0.097 (in 3 folds),0.017 +/- 0.000 (in 1 folds),0.882 +/- 0.027 (in 2 folds),0.887 +/- 0.033 (in 2 folds),0.851 +/- 0.032 (in 2 folds),0.863 +/- 0.042 (in 2 folds),0.612,0.404,0.006,Unknown,disease.separate_past_exposures,356,2,358,0.005587,False
lasso_cv.decision_thresholds_tuned,0.879 +/- 0.020 (in 3 folds),0.882 +/- 0.025 (in 3 folds),0.850 +/- 0.023 (in 3 folds),0.858 +/- 0.030 (in 3 folds),0.635 +/- 0.091 (in 3 folds),0.474 +/- 0.156 (in 3 folds),0.635,0.461,disease.separate_past_exposures,0.631 +/- 0.086 (in 3 folds),0.469 +/- 0.150 (in 3 folds),0.017 +/- 0.000 (in 1 folds),0.882 +/- 0.027 (in 2 folds),0.887 +/- 0.033 (in 2 folds),0.851 +/- 0.032 (in 2 folds),0.863 +/- 0.042 (in 2 folds),0.631,0.458,0.006,Unknown,disease.separate_past_exposures,356,2,358,0.005587,False
lasso_multiclass,0.876 +/- 0.016 (in 3 folds),0.877 +/- 0.017 (in 3 folds),0.859 +/- 0.025 (in 3 folds),0.865 +/- 0.030 (in 3 folds),0.682 +/- 0.044 (in 3 folds),0.550 +/- 0.050 (in 3 folds),0.683,0.548,disease.separate_past_exposures,0.679 +/- 0.047 (in 3 folds),0.546 +/- 0.053 (in 3 folds),0.017 +/- 0.000 (in 1 folds),0.876 +/- 0.023 (in 2 folds),0.880 +/- 0.023 (in 2 folds),0.871 +/- 0.020 (in 2 folds),0.880 +/- 0.023 (in 2 folds),0.679,0.544,0.006,Unknown,disease.separate_past_exposures,356,2,358,0.005587,False
lasso_multiclass.decision_thresholds_tuned,0.876 +/- 0.016 (in 3 folds),0.877 +/- 0.017 (in 3 folds),0.859 +/- 0.025 (in 3 folds),0.865 +/- 0.030 (in 3 folds),0.691 +/- 0.046 (in 3 folds),0.560 +/- 0.052 (in 3 folds),0.691,0.558,disease.separate_past_exposures,0.687 +/- 0.048 (in 3 folds),0.556 +/- 0.053 (in 3 folds),0.017 +/- 0.000 (in 1 folds),0.876 +/- 0.023 (in 2 folds),0.880 +/- 0.023 (in 2 folds),0.871 +/- 0.020 (in 2 folds),0.880 +/- 0.023 (in 2 folds),0.687,0.553,0.006,Unknown,disease.separate_past_exposures,356,2,358,0.005587,False
linearsvm_ovr,0.875 +/- 0.018 (in 3 folds),0.873 +/- 0.018 (in 3 folds),0.857 +/- 0.024 (in 3 folds),0.861 +/- 0.029 (in 3 folds),0.682 +/- 0.053 (in 3 folds),0.542 +/- 0.064 (in 3 folds),0.683,0.538,disease.separate_past_exposures,0.678 +/- 0.053 (in 3 folds),0.537 +/- 0.064 (in 3 folds),0.017 +/- 0.000 (in 1 folds),0.875 +/- 0.026 (in 2 folds),0.876 +/- 0.025 (in 2 folds),0.867 +/- 0.024 (in 2 folds),0.874 +/- 0.026 (in 2 folds),0.679,0.534,0.006,Unknown,disease.separate_past_exposures,356,2,358,0.005587,False
linearsvm_ovr.decision_thresholds_tuned,0.875 +/- 0.018 (in 3 folds),0.873 +/- 0.018 (in 3 folds),0.857 +/- 0.024 (in 3 folds),0.861 +/- 0.029 (in 3 folds),0.688 +/- 0.050 (in 3 folds),0.556 +/- 0.057 (in 3 folds),0.688,0.554,disease.separate_past_exposures,0.684 +/- 0.051 (in 3 folds),0.552 +/- 0.058 (in 3 folds),0.017 +/- 0.000 (in 1 folds),0.875 +/- 0.026 (in 2 folds),0.876 +/- 0.025 (in 2 folds),0.867 +/- 0.024 (in 2 folds),0.874 +/- 0.026 (in 2 folds),0.684,0.55,0.006,Unknown,disease.separate_past_exposures,356,2,358,0.005587,False
ridge_cv,0.874 +/- 0.028 (in 3 folds),0.879 +/- 0.032 (in 3 folds),0.836 +/- 0.031 (in 3 folds),0.847 +/- 0.038 (in 3 folds),0.519 +/- 0.123 (in 3 folds),0.155 +/- 0.269 (in 3 folds),0.52,0.24,disease.separate_past_exposures,0.516 +/- 0.125 (in 3 folds),0.173 +/- 0.255 (in 3 folds),0.017 +/- 0.000 (in 1 folds),0.880 +/- 0.037 (in 2 folds),0.889 +/- 0.039 (in 2 folds),0.845 +/- 0.038 (in 2 folds),0.860 +/- 0.043 (in 2 folds),0.517,0.238,0.006,Unknown,disease.separate_past_exposures,356,2,358,0.005587,False
ridge_cv.decision_thresholds_tuned,0.874 +/- 0.028 (in 3 folds),0.879 +/- 0.032 (in 3 folds),0.836 +/- 0.031 (in 3 folds),0.847 +/- 0.038 (in 3 folds),0.502 +/- 0.233 (in 3 folds),0.312 +/- 0.287 (in 3 folds),0.503,0.334,disease.separate_past_exposures,0.499 +/- 0.231 (in 3 folds),0.308 +/- 0.286 (in 3 folds),0.017 +/- 0.000 (in 1 folds),0.880 +/- 0.037 (in 2 folds),0.889 +/- 0.039 (in 2 folds),0.845 +/- 0.038 (in 2 folds),0.860 +/- 0.043 (in 2 folds),0.5,0.33,0.006,Unknown,disease.separate_past_exposures,356,2,358,0.005587,False
rf_multiclass,0.874 +/- 0.009 (in 3 folds),0.874 +/- 0.011 (in 3 folds),0.853 +/- 0.017 (in 3 folds),0.858 +/- 0.022 (in 3 folds),0.680 +/- 0.039 (in 3 folds),0.530 +/- 0.046 (in 3 folds),0.68,0.527,disease.separate_past_exposures,0.676 +/- 0.037 (in 3 folds),0.526 +/- 0.043 (in 3 folds),0.017 +/- 0.000 (in 1 folds),0.873 +/- 0.013 (in 2 folds),0.875 +/- 0.015 (in 2 folds),0.862 +/- 0.012 (in 2 folds),0.869 +/- 0.017 (in 2 folds),0.676,0.524,0.006,Unknown,disease.separate_past_exposures,356,2,358,0.005587,False
rf_multiclass.decision_thresholds_tuned,0.874 +/- 0.009 (in 3 folds),0.874 +/- 0.011 (in 3 folds),0.853 +/- 0.017 (in 3 folds),0.858 +/- 0.022 (in 3 folds),0.691 +/- 0.030 (in 3 folds),0.564 +/- 0.032 (in 3 folds),0.691,0.561,disease.separate_past_exposures,0.687 +/- 0.034 (in 3 folds),0.560 +/- 0.036 (in 3 folds),0.017 +/- 0.000 (in 1 folds),0.873 +/- 0.013 (in 2 folds),0.875 +/- 0.015 (in 2 folds),0.862 +/- 0.012 (in 2 folds),0.869 +/- 0.017 (in 2 folds),0.687,0.557,0.006,Unknown,disease.separate_past_exposures,356,2,358,0.005587,False


lasso_cv,lasso_cv.decision_thresholds_tuned,lasso_multiclass,lasso_multiclass.decision_thresholds_tuned
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.879 +/- 0.020 (in 3 folds) ROC-AUC (macro OvO): 0.882 +/- 0.025 (in 3 folds) au-PRC (weighted OvO): 0.850 +/- 0.023 (in 3 folds) au-PRC (macro OvO): 0.858 +/- 0.030 (in 3 folds) Accuracy: 0.615 +/- 0.079 (in 3 folds) MCC: 0.411 +/- 0.098 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.615 MCC: 0.407 Global evaluation column name: disease.separate_past_exposures Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.611 +/- 0.077 (in 3 folds) MCC: 0.408 +/- 0.097 (in 3 folds) Unknown/abstention proportion: 0.017 +/- 0.000 (in 1 folds) ROC-AUC (weighted OvO): 0.882 +/- 0.027 (in 2 folds) ROC-AUC (macro OvO): 0.887 +/- 0.033 (in 2 folds) au-PRC (weighted OvO): 0.851 +/- 0.032 (in 2 folds) au-PRC (macro OvO): 0.863 +/- 0.042 (in 2 folds) Global scores with abstention using column name disease.separate_past_exposures: Accuracy: 0.612 MCC: 0.404 Unknown/abstention proportion: 0.006 Abstention label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support  Covid19 0.75 0.14 0.24 43  HIV 0.76 0.54 0.63 87 Healthy/Background 0.56 0.91 0.69 165  Lupus 0.89 0.25 0.40 63  Unknown 0.00 0.00 0.00 0  accuracy 0.61 358  macro avg 0.59 0.37 0.39 358  weighted avg 0.69 0.61 0.57 358,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.879 +/- 0.020 (in 3 folds) ROC-AUC (macro OvO): 0.882 +/- 0.025 (in 3 folds) au-PRC (weighted OvO): 0.850 +/- 0.023 (in 3 folds) au-PRC (macro OvO): 0.858 +/- 0.030 (in 3 folds) Accuracy: 0.635 +/- 0.091 (in 3 folds) MCC: 0.474 +/- 0.156 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.635 MCC: 0.461 Global evaluation column name: disease.separate_past_exposures 
Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.631 +/- 0.086 (in 3 folds) MCC: 0.469 +/- 0.150 (in 3 folds) Unknown/abstention proportion: 0.017 +/- 0.000 (in 1 folds) ROC-AUC (weighted OvO): 0.882 +/- 0.027 (in 2 folds) ROC-AUC (macro OvO): 0.887 +/- 0.033 (in 2 folds) au-PRC (weighted OvO): 0.851 +/- 0.032 (in 2 folds) au-PRC (macro OvO): 0.863 +/- 0.042 (in 2 folds) Global scores with abstention using column name disease.separate_past_exposures: Accuracy: 0.631 MCC: 0.458 Unknown/abstention proportion: 0.006 Abstention label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support  Covid19 0.46 0.42 0.44 43  HIV 0.69 0.63 0.66 87 Healthy/Background 0.67 0.70 0.68 165  Lupus 0.58 0.60 0.59 63  Unknown 0.00 0.00 0.00 0  accuracy 0.63 358  macro avg 0.48 0.47 0.47 358  weighted avg 0.63 0.63 0.63 358,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.876 +/- 0.016 (in 3 folds) ROC-AUC (macro OvO): 0.877 +/- 0.017 (in 3 folds) au-PRC (weighted OvO): 0.859 +/- 0.025 (in 3 folds) au-PRC (macro OvO): 0.865 +/- 0.030 (in 3 folds) Accuracy: 0.682 +/- 0.044 (in 3 folds) MCC: 0.550 +/- 0.050 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.683 MCC: 0.548 Global evaluation column name: disease.separate_past_exposures Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.679 +/- 0.047 (in 3 folds) MCC: 0.546 +/- 0.053 (in 3 folds) Unknown/abstention proportion: 0.017 +/- 0.000 (in 1 folds) ROC-AUC (weighted OvO): 0.876 +/- 0.023 (in 2 folds) ROC-AUC (macro OvO): 0.880 +/- 0.023 (in 2 folds) au-PRC (weighted OvO): 0.871 +/- 0.020 (in 2 folds) au-PRC (macro OvO): 0.880 +/- 0.023 (in 2 folds) Global scores with abstention using column name 
disease.separate_past_exposures: Accuracy: 0.679 MCC: 0.544 Unknown/abstention proportion: 0.006 Abstention label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support  Covid19 0.48 0.77 0.59 43  HIV 0.66 0.60 0.63 87 Healthy/Background 0.78 0.72 0.74 165  Lupus 0.71 0.63 0.67 63  Unknown 0.00 0.00 0.00 0  accuracy 0.68 358  macro avg 0.53 0.54 0.53 358  weighted avg 0.70 0.68 0.68 358,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.876 +/- 0.016 (in 3 folds) ROC-AUC (macro OvO): 0.877 +/- 0.017 (in 3 folds) au-PRC (weighted OvO): 0.859 +/- 0.025 (in 3 folds) au-PRC (macro OvO): 0.865 +/- 0.030 (in 3 folds) Accuracy: 0.691 +/- 0.046 (in 3 folds) MCC: 0.560 +/- 0.052 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.691 MCC: 0.558 Global evaluation column name: disease.separate_past_exposures Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.687 +/- 0.048 (in 3 folds) MCC: 0.556 +/- 0.053 (in 3 folds) Unknown/abstention proportion: 0.017 +/- 0.000 (in 1 folds) ROC-AUC (weighted OvO): 0.876 +/- 0.023 (in 2 folds) ROC-AUC (macro OvO): 0.880 +/- 0.023 (in 2 folds) au-PRC (weighted OvO): 0.871 +/- 0.020 (in 2 folds) au-PRC (macro OvO): 0.880 +/- 0.023 (in 2 folds) Global scores with abstention using column name disease.separate_past_exposures: Accuracy: 0.687 MCC: 0.553 Unknown/abstention proportion: 0.006 Abstention label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support  Covid19 0.48 0.79 0.60 43  HIV 0.68 0.62 0.65 87 Healthy/Background 0.77 0.75 0.76 165  Lupus 0.76 0.56 0.64 63  Unknown 0.00 0.00 0.00 0  accuracy 0.69 358  macro avg 0.54 
0.54 0.53 358  weighted avg 0.71 0.69 0.69 358
,,,


linearsvm_ovr,linearsvm_ovr.decision_thresholds_tuned,ridge_cv,ridge_cv.decision_thresholds_tuned
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.875 +/- 0.018 (in 3 folds) ROC-AUC (macro OvO): 0.873 +/- 0.018 (in 3 folds) au-PRC (weighted OvO): 0.857 +/- 0.024 (in 3 folds) au-PRC (macro OvO): 0.861 +/- 0.029 (in 3 folds) Accuracy: 0.682 +/- 0.053 (in 3 folds) MCC: 0.542 +/- 0.064 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.683 MCC: 0.538 Global evaluation column name: disease.separate_past_exposures Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.678 +/- 0.053 (in 3 folds) MCC: 0.537 +/- 0.064 (in 3 folds) Unknown/abstention proportion: 0.017 +/- 0.000 (in 1 folds) ROC-AUC (weighted OvO): 0.875 +/- 0.026 (in 2 folds) ROC-AUC (macro OvO): 0.876 +/- 0.025 (in 2 folds) au-PRC (weighted OvO): 0.867 +/- 0.024 (in 2 folds) au-PRC (macro OvO): 0.874 +/- 0.026 (in 2 folds) Global scores with abstention using column name disease.separate_past_exposures: Accuracy: 0.679 MCC: 0.534 Unknown/abstention proportion: 0.006 Abstention label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support  Covid19 0.50 0.74 0.60 43  HIV 0.66 0.55 0.60 87 Healthy/Background 0.74 0.76 0.75 165  Lupus 0.77 0.59 0.67 63  Unknown 0.00 0.00 0.00 0  accuracy 0.68 358  macro avg 0.53 0.53 0.52 358  weighted avg 0.70 0.68 0.68 358,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.875 +/- 0.018 (in 3 folds) ROC-AUC (macro OvO): 0.873 +/- 0.018 (in 3 folds) au-PRC (weighted OvO): 0.857 +/- 0.024 (in 3 folds) au-PRC (macro OvO): 0.861 +/- 0.029 (in 3 folds) Accuracy: 0.688 +/- 0.050 (in 3 folds) MCC: 0.556 +/- 0.057 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.688 MCC: 0.554 Global evaluation column name: disease.separate_past_exposures 
Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.684 +/- 0.051 (in 3 folds) MCC: 0.552 +/- 0.058 (in 3 folds) Unknown/abstention proportion: 0.017 +/- 0.000 (in 1 folds) ROC-AUC (weighted OvO): 0.875 +/- 0.026 (in 2 folds) ROC-AUC (macro OvO): 0.876 +/- 0.025 (in 2 folds) au-PRC (weighted OvO): 0.867 +/- 0.024 (in 2 folds) au-PRC (macro OvO): 0.874 +/- 0.026 (in 2 folds) Global scores with abstention using column name disease.separate_past_exposures: Accuracy: 0.684 MCC: 0.550 Unknown/abstention proportion: 0.006 Abstention label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support  Covid19 0.47 0.79 0.59 43  HIV 0.66 0.63 0.65 87 Healthy/Background 0.77 0.75 0.76 165  Lupus 0.80 0.52 0.63 63  Unknown 0.00 0.00 0.00 0  accuracy 0.68 358  macro avg 0.54 0.54 0.53 358  weighted avg 0.72 0.68 0.69 358,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.874 +/- 0.028 (in 3 folds) ROC-AUC (macro OvO): 0.879 +/- 0.032 (in 3 folds) au-PRC (weighted OvO): 0.836 +/- 0.031 (in 3 folds) au-PRC (macro OvO): 0.847 +/- 0.038 (in 3 folds) Accuracy: 0.519 +/- 0.123 (in 3 folds) MCC: 0.155 +/- 0.269 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.520 MCC: 0.240 Global evaluation column name: disease.separate_past_exposures Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.516 +/- 0.125 (in 3 folds) MCC: 0.173 +/- 0.255 (in 3 folds) Unknown/abstention proportion: 0.017 +/- 0.000 (in 1 folds) ROC-AUC (weighted OvO): 0.880 +/- 0.037 (in 2 folds) ROC-AUC (macro OvO): 0.889 +/- 0.039 (in 2 folds) au-PRC (weighted OvO): 0.845 +/- 0.038 (in 2 folds) au-PRC (macro OvO): 0.860 +/- 0.043 (in 2 folds) Global scores with abstention using column name 
disease.separate_past_exposures: Accuracy: 0.517 MCC: 0.238 Unknown/abstention proportion: 0.006 Abstention label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support  Covid19 1.00 0.12 0.21 43  HIV 0.78 0.16 0.27 87 Healthy/Background 0.49 0.98 0.65 165  Lupus 1.00 0.08 0.15 63  Unknown 0.00 0.00 0.00 0  accuracy 0.52 358  macro avg 0.65 0.27 0.26 358  weighted avg 0.71 0.52 0.42 358,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.874 +/- 0.028 (in 3 folds) ROC-AUC (macro OvO): 0.879 +/- 0.032 (in 3 folds) au-PRC (weighted OvO): 0.836 +/- 0.031 (in 3 folds) au-PRC (macro OvO): 0.847 +/- 0.038 (in 3 folds) Accuracy: 0.502 +/- 0.233 (in 3 folds) MCC: 0.312 +/- 0.287 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.503 MCC: 0.334 Global evaluation column name: disease.separate_past_exposures Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.499 +/- 0.231 (in 3 folds) MCC: 0.308 +/- 0.286 (in 3 folds) Unknown/abstention proportion: 0.017 +/- 0.000 (in 1 folds) ROC-AUC (weighted OvO): 0.880 +/- 0.037 (in 2 folds) ROC-AUC (macro OvO): 0.889 +/- 0.039 (in 2 folds) au-PRC (weighted OvO): 0.845 +/- 0.038 (in 2 folds) au-PRC (macro OvO): 0.860 +/- 0.043 (in 2 folds) Global scores with abstention using column name disease.separate_past_exposures: Accuracy: 0.500 MCC: 0.330 Unknown/abstention proportion: 0.006 Abstention label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support  Covid19 0.52 0.30 0.38 43  HIV 0.36 0.85 0.50 87 Healthy/Background 0.75 0.48 0.59 165  Lupus 0.67 0.19 0.30 63  Unknown 0.00 0.00 0.00 0  accuracy 0.50 358  macro avg 0.46 
0.37 0.35 358  weighted avg 0.61 0.50 0.49 358
,,,


rf_multiclass,rf_multiclass.decision_thresholds_tuned,xgboost,xgboost.decision_thresholds_tuned
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.874 +/- 0.009 (in 3 folds) ROC-AUC (macro OvO): 0.874 +/- 0.011 (in 3 folds) au-PRC (weighted OvO): 0.853 +/- 0.017 (in 3 folds) au-PRC (macro OvO): 0.858 +/- 0.022 (in 3 folds) Accuracy: 0.680 +/- 0.039 (in 3 folds) MCC: 0.530 +/- 0.046 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.680 MCC: 0.527 Global evaluation column name: disease.separate_past_exposures Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.676 +/- 0.037 (in 3 folds) MCC: 0.526 +/- 0.043 (in 3 folds) Unknown/abstention proportion: 0.017 +/- 0.000 (in 1 folds) ROC-AUC (weighted OvO): 0.873 +/- 0.013 (in 2 folds) ROC-AUC (macro OvO): 0.875 +/- 0.015 (in 2 folds) au-PRC (weighted OvO): 0.862 +/- 0.012 (in 2 folds) au-PRC (macro OvO): 0.869 +/- 0.017 (in 2 folds) Global scores with abstention using column name disease.separate_past_exposures: Accuracy: 0.676 MCC: 0.524 Unknown/abstention proportion: 0.006 Abstention label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support  Covid19 0.52 0.60 0.56 43  HIV 0.63 0.55 0.59 87 Healthy/Background 0.74 0.79 0.76 165  Lupus 0.70 0.60 0.65 63  Unknown 0.00 0.00 0.00 0  accuracy 0.68 358  macro avg 0.52 0.51 0.51 358  weighted avg 0.68 0.68 0.68 358,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.874 +/- 0.009 (in 3 folds) ROC-AUC (macro OvO): 0.874 +/- 0.011 (in 3 folds) au-PRC (weighted OvO): 0.853 +/- 0.017 (in 3 folds) au-PRC (macro OvO): 0.858 +/- 0.022 (in 3 folds) Accuracy: 0.691 +/- 0.030 (in 3 folds) MCC: 0.564 +/- 0.032 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.691 MCC: 0.561 Global evaluation column name: disease.separate_past_exposures 
Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.687 +/- 0.034 (in 3 folds) MCC: 0.560 +/- 0.036 (in 3 folds) Unknown/abstention proportion: 0.017 +/- 0.000 (in 1 folds) ROC-AUC (weighted OvO): 0.873 +/- 0.013 (in 2 folds) ROC-AUC (macro OvO): 0.875 +/- 0.015 (in 2 folds) au-PRC (weighted OvO): 0.862 +/- 0.012 (in 2 folds) au-PRC (macro OvO): 0.869 +/- 0.017 (in 2 folds) Global scores with abstention using column name disease.separate_past_exposures: Accuracy: 0.687 MCC: 0.557 Unknown/abstention proportion: 0.006 Abstention label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support  Covid19 0.47 0.81 0.59 43  HIV 0.67 0.57 0.62 87 Healthy/Background 0.78 0.73 0.75 165  Lupus 0.80 0.63 0.71 63  Unknown 0.00 0.00 0.00 0  accuracy 0.69 358  macro avg 0.54 0.55 0.53 358  weighted avg 0.72 0.69 0.69 358,Per-fold scores: ROC-AUC (weighted OvO): 0.865 +/- 0.021 (in 3 folds) ROC-AUC (macro OvO): 0.868 +/- 0.020 (in 3 folds) au-PRC (weighted OvO): 0.859 +/- 0.024 (in 3 folds) au-PRC (macro OvO): 0.866 +/- 0.021 (in 3 folds) Accuracy: 0.668 +/- 0.015 (in 3 folds) MCC: 0.517 +/- 0.017 (in 3 folds) Global scores using column name disease.separate_past_exposures: Accuracy: 0.668 MCC: 0.514 Global evaluation column name: disease.separate_past_exposures Global classification report using column name disease.separate_past_exposures:  precision recall f1-score support  Covid19 0.54 0.70 0.61 43  HIV 0.62 0.52 0.56 87 Healthy/Background 0.71 0.75 0.73 165  Lupus 0.73 0.65 0.69 63  accuracy 0.67 358  macro avg 0.65 0.65 0.65 358  weighted avg 0.67 0.67 0.67 358,Per-fold scores: ROC-AUC (weighted OvO): 0.865 +/- 0.021 (in 3 folds) ROC-AUC (macro OvO): 0.868 +/- 0.020 (in 3 folds) au-PRC (weighted OvO): 0.859 +/- 0.024 (in 3 folds) au-PRC (macro OvO): 0.866 +/- 0.021 (in 3 
folds) Accuracy: 0.676 +/- 0.029 (in 3 folds) MCC: 0.536 +/- 0.043 (in 3 folds) Global scores using column name disease.separate_past_exposures: Accuracy: 0.676 MCC: 0.533 Global evaluation column name: disease.separate_past_exposures Global classification report using column name disease.separate_past_exposures:  precision recall f1-score support  Covid19 0.57 0.67 0.62 43  HIV 0.58 0.66 0.61 87 Healthy/Background 0.76 0.71 0.74 165  Lupus 0.71 0.62 0.66 63  accuracy 0.68 358  macro avg 0.65 0.66 0.66 358  weighted avg 0.69 0.68 0.68 358
,,,


elasticnet_cv,elasticnet_cv.decision_thresholds_tuned
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.864 +/- 0.034 (in 3 folds) ROC-AUC (macro OvO): 0.864 +/- 0.040 (in 3 folds) au-PRC (weighted OvO): 0.837 +/- 0.029 (in 3 folds) au-PRC (macro OvO): 0.843 +/- 0.039 (in 3 folds) Accuracy: 0.556 +/- 0.043 (in 3 folds) MCC: 0.288 +/- 0.110 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.556 MCC: 0.296 Global evaluation column name: disease.separate_past_exposures Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.553 +/- 0.048 (in 3 folds) MCC: 0.288 +/- 0.111 (in 3 folds) Unknown/abstention proportion: 0.017 +/- 0.000 (in 1 folds) ROC-AUC (weighted OvO): 0.869 +/- 0.046 (in 2 folds) ROC-AUC (macro OvO): 0.874 +/- 0.052 (in 2 folds) au-PRC (weighted OvO): 0.846 +/- 0.034 (in 2 folds) au-PRC (macro OvO): 0.856 +/- 0.044 (in 2 folds) Global scores with abstention using column name disease.separate_past_exposures: Accuracy: 0.553 MCC: 0.295 Unknown/abstention proportion: 0.006 Abstention label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support  Covid19 1.00 0.02 0.05 43  HIV 0.68 0.37 0.48 87 Healthy/Background 0.52 0.92 0.67 165  Lupus 0.72 0.21 0.32 63  Unknown 0.00 0.00 0.00 0  accuracy 0.55 358  macro avg 0.59 0.30 0.30 358  weighted avg 0.65 0.55 0.49 358,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.864 +/- 0.034 (in 3 folds) ROC-AUC (macro OvO): 0.864 +/- 0.040 (in 3 folds) au-PRC (weighted OvO): 0.837 +/- 0.029 (in 3 folds) au-PRC (macro OvO): 0.843 +/- 0.039 (in 3 folds) Accuracy: 0.621 +/- 0.025 (in 3 folds) MCC: 0.468 +/- 0.033 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.621 MCC: 0.460 Global evaluation column name: disease.separate_past_exposures 
Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.617 +/- 0.024 (in 3 folds) MCC: 0.463 +/- 0.034 (in 3 folds) Unknown/abstention proportion: 0.017 +/- 0.000 (in 1 folds) ROC-AUC (weighted OvO): 0.869 +/- 0.046 (in 2 folds) ROC-AUC (macro OvO): 0.874 +/- 0.052 (in 2 folds) au-PRC (weighted OvO): 0.846 +/- 0.034 (in 2 folds) au-PRC (macro OvO): 0.856 +/- 0.044 (in 2 folds) Global scores with abstention using column name disease.separate_past_exposures: Accuracy: 0.617 MCC: 0.457 Unknown/abstention proportion: 0.006 Abstention label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support  Covid19 0.52 0.35 0.42 43  HIV 0.57 0.74 0.64 87 Healthy/Background 0.75 0.62 0.68 165  Lupus 0.51 0.62 0.56 63  Unknown 0.00 0.00 0.00 0  accuracy 0.62 358  macro avg 0.47 0.47 0.46 358  weighted avg 0.63 0.62 0.62 358
,


---

# GeneLocus.TCR, TargetObsColumnEnum.ethnicity_condensed_healthy_only trained on train_smaller set

## Specimen predictions on validation set

Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,Accuracy per fold with abstention,MCC per fold with abstention,Unknown/abstention proportion per fold with abstention,ROC-AUC (weighted OvO) per fold with abstention,ROC-AUC (macro OvO) per fold with abstention,au-PRC (weighted OvO) per fold with abstention,au-PRC (macro OvO) per fold with abstention,Accuracy global with abstention,MCC global with abstention,Unknown/abstention proportion global with abstention,Abstention label global with abstention,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
xgboost,0.702 +/- 0.041 (in 3 folds),0.690 +/- 0.038 (in 3 folds),0.709 +/- 0.024 (in 3 folds),0.707 +/- 0.009 (in 3 folds),0.601 +/- 0.097 (in 3 folds),0.357 +/- 0.084 (in 3 folds),0.598,0.345,0.556 +/- 0.053 (in 3 folds),0.296 +/- 0.028 (in 3 folds),0.103 +/- 0.036 (in 2 folds),0.657 +/- 0.000 (in 1 folds),0.651 +/- 0.000 (in 1 folds),0.685 +/- 0.000 (in 1 folds),0.703 +/- 0.000 (in 1 folds),0.557,0.273,0.07,Unknown,107.0,8.0,115.0,0.069565,False
linearsvm_ovr,0.692 +/- 0.052 (in 3 folds),0.697 +/- 0.058 (in 3 folds),0.716 +/- 0.018 (in 3 folds),0.725 +/- 0.040 (in 3 folds),0.583 +/- 0.078 (in 3 folds),0.331 +/- 0.086 (in 3 folds),0.584,0.338,0.573 +/- 0.082 (in 3 folds),0.295 +/- 0.029 (in 3 folds),0.051 +/- 0.000 (in 1 folds),0.718 +/- 0.038 (in 2 folds),0.723 +/- 0.050 (in 2 folds),0.712 +/- 0.024 (in 2 folds),0.727 +/- 0.056 (in 2 folds),0.574,0.292,0.017,Unknown,113.0,2.0,115.0,0.017391,True
lasso_multiclass,0.673 +/- 0.018 (in 3 folds),0.662 +/- 0.012 (in 3 folds),0.684 +/- 0.015 (in 3 folds),0.673 +/- 0.010 (in 3 folds),0.600 +/- 0.090 (in 3 folds),0.371 +/- 0.103 (in 3 folds),0.602,0.382,0.590 +/- 0.092 (in 3 folds),0.337 +/- 0.064 (in 3 folds),0.051 +/- 0.000 (in 1 folds),0.683 +/- 0.005 (in 2 folds),0.668 +/- 0.005 (in 2 folds),0.683 +/- 0.022 (in 2 folds),0.675 +/- 0.013 (in 2 folds),0.591,0.336,0.017,Unknown,113.0,2.0,115.0,0.017391,True
lasso_cv,0.622 +/- 0.073 (in 3 folds),0.612 +/- 0.068 (in 3 folds),0.669 +/- 0.052 (in 3 folds),0.663 +/- 0.048 (in 3 folds),0.541 +/- 0.133 (in 3 folds),0.273 +/- 0.104 (in 3 folds),0.546,0.263,0.512 +/- 0.157 (in 3 folds),0.168 +/- 0.186 (in 3 folds),0.093 +/- 0.022 (in 2 folds),0.645 +/- 0.000 (in 1 folds),0.639 +/- 0.000 (in 1 folds),0.685 +/- 0.000 (in 1 folds),0.688 +/- 0.000 (in 1 folds),0.513,0.154,0.061,Unknown,108.0,7.0,115.0,0.06087,True
rf_multiclass,0.612 +/- 0.089 (in 3 folds),0.609 +/- 0.066 (in 3 folds),0.640 +/- 0.048 (in 3 folds),0.629 +/- 0.038 (in 3 folds),0.597 +/- 0.145 (in 3 folds),0.381 +/- 0.173 (in 3 folds),0.591,0.365,0.564 +/- 0.089 (in 3 folds),0.319 +/- 0.068 (in 3 folds),0.128 +/- 0.000 (in 1 folds),0.562 +/- 0.025 (in 2 folds),0.572 +/- 0.024 (in 2 folds),0.614 +/- 0.028 (in 2 folds),0.610 +/- 0.027 (in 2 folds),0.565,0.284,0.043,Unknown,110.0,5.0,115.0,0.043478,True
elasticnet_cv,0.596 +/- 0.061 (in 3 folds),0.591 +/- 0.072 (in 3 folds),0.656 +/- 0.046 (in 3 folds),0.659 +/- 0.067 (in 3 folds),0.529 +/- 0.122 (in 3 folds),0.196 +/- 0.172 (in 3 folds),0.532,0.221,0.512 +/- 0.134 (in 3 folds),0.136 +/- 0.167 (in 3 folds),0.108 +/- 0.000 (in 1 folds),0.623 +/- 0.056 (in 2 folds),0.620 +/- 0.073 (in 2 folds),0.677 +/- 0.039 (in 2 folds),0.685 +/- 0.071 (in 2 folds),0.513,0.128,0.035,Unknown,111.0,4.0,115.0,0.034783,True
ridge_cv,0.575 +/- 0.068 (in 3 folds),0.559 +/- 0.051 (in 3 folds),0.617 +/- 0.103 (in 3 folds),0.608 +/- 0.095 (in 3 folds),0.504 +/- 0.099 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.5,0.0,0.478 +/- 0.054 (in 3 folds),0.002 +/- 0.003 (in 3 folds),0.128 +/- 0.000 (in 1 folds),0.547 +/- 0.067 (in 2 folds),0.544 +/- 0.063 (in 2 folds),0.578 +/- 0.110 (in 2 folds),0.572 +/- 0.102 (in 2 folds),0.478,-0.018,0.043,Unknown,110.0,5.0,115.0,0.043478,True
dummy_stratified,0.504 +/- 0.027 (in 3 folds),0.501 +/- 0.025 (in 3 folds),0.515 +/- 0.017 (in 3 folds),0.512 +/- 0.014 (in 3 folds),0.424 +/- 0.042 (in 3 folds),0.030 +/- 0.067 (in 3 folds),0.429,0.038,0.392 +/- 0.096 (in 3 folds),0.009 +/- 0.053 (in 3 folds),0.256 +/- 0.000 (in 1 folds),0.494 +/- 0.031 (in 2 folds),0.494 +/- 0.030 (in 2 folds),0.506 +/- 0.008 (in 2 folds),0.504 +/- 0.008 (in 2 folds),0.391,0.019,0.087,Unknown,105.0,10.0,115.0,0.086957,True
dummy_most_frequent,0.500 +/- 0.000 (in 3 folds),0.500 +/- 0.000 (in 3 folds),0.500 +/- 0.000 (in 3 folds),0.500 +/- 0.000 (in 3 folds),0.504 +/- 0.099 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.5,0.0,0.478 +/- 0.054 (in 3 folds),0.002 +/- 0.003 (in 3 folds),0.128 +/- 0.000 (in 1 folds),0.500 +/- 0.000 (in 2 folds),0.500 +/- 0.000 (in 2 folds),0.500 +/- 0.000 (in 2 folds),0.500 +/- 0.000 (in 2 folds),0.478,-0.018,0.043,Unknown,110.0,5.0,115.0,0.043478,True
"All results, sorted",,,,,,,,,,,,,,,,,,,,,,,,

Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,Accuracy per fold with abstention,MCC per fold with abstention,Unknown/abstention proportion per fold with abstention,ROC-AUC (weighted OvO) per fold with abstention,ROC-AUC (macro OvO) per fold with abstention,au-PRC (weighted OvO) per fold with abstention,au-PRC (macro OvO) per fold with abstention,Accuracy global with abstention,MCC global with abstention,Unknown/abstention proportion global with abstention,Abstention label global with abstention,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
xgboost,0.702 +/- 0.041 (in 3 folds),0.690 +/- 0.038 (in 3 folds),0.709 +/- 0.024 (in 3 folds),0.707 +/- 0.009 (in 3 folds),0.601 +/- 0.097 (in 3 folds),0.357 +/- 0.084 (in 3 folds),0.598,0.345,0.556 +/- 0.053 (in 3 folds),0.296 +/- 0.028 (in 3 folds),0.103 +/- 0.036 (in 2 folds),0.657 +/- 0.000 (in 1 folds),0.651 +/- 0.000 (in 1 folds),0.685 +/- 0.000 (in 1 folds),0.703 +/- 0.000 (in 1 folds),0.557,0.273,0.07,Unknown,107,8,115,0.069565,False
linearsvm_ovr,0.692 +/- 0.052 (in 3 folds),0.697 +/- 0.058 (in 3 folds),0.716 +/- 0.018 (in 3 folds),0.725 +/- 0.040 (in 3 folds),0.583 +/- 0.078 (in 3 folds),0.331 +/- 0.086 (in 3 folds),0.584,0.338,0.573 +/- 0.082 (in 3 folds),0.295 +/- 0.029 (in 3 folds),0.051 +/- 0.000 (in 1 folds),0.718 +/- 0.038 (in 2 folds),0.723 +/- 0.050 (in 2 folds),0.712 +/- 0.024 (in 2 folds),0.727 +/- 0.056 (in 2 folds),0.574,0.292,0.017,Unknown,113,2,115,0.017391,True
lasso_multiclass,0.673 +/- 0.018 (in 3 folds),0.662 +/- 0.012 (in 3 folds),0.684 +/- 0.015 (in 3 folds),0.673 +/- 0.010 (in 3 folds),0.600 +/- 0.090 (in 3 folds),0.371 +/- 0.103 (in 3 folds),0.602,0.382,0.590 +/- 0.092 (in 3 folds),0.337 +/- 0.064 (in 3 folds),0.051 +/- 0.000 (in 1 folds),0.683 +/- 0.005 (in 2 folds),0.668 +/- 0.005 (in 2 folds),0.683 +/- 0.022 (in 2 folds),0.675 +/- 0.013 (in 2 folds),0.591,0.336,0.017,Unknown,113,2,115,0.017391,True
lasso_cv,0.622 +/- 0.073 (in 3 folds),0.612 +/- 0.068 (in 3 folds),0.669 +/- 0.052 (in 3 folds),0.663 +/- 0.048 (in 3 folds),0.541 +/- 0.133 (in 3 folds),0.273 +/- 0.104 (in 3 folds),0.546,0.263,0.512 +/- 0.157 (in 3 folds),0.168 +/- 0.186 (in 3 folds),0.093 +/- 0.022 (in 2 folds),0.645 +/- 0.000 (in 1 folds),0.639 +/- 0.000 (in 1 folds),0.685 +/- 0.000 (in 1 folds),0.688 +/- 0.000 (in 1 folds),0.513,0.154,0.061,Unknown,108,7,115,0.06087,True
rf_multiclass,0.612 +/- 0.089 (in 3 folds),0.609 +/- 0.066 (in 3 folds),0.640 +/- 0.048 (in 3 folds),0.629 +/- 0.038 (in 3 folds),0.597 +/- 0.145 (in 3 folds),0.381 +/- 0.173 (in 3 folds),0.591,0.365,0.564 +/- 0.089 (in 3 folds),0.319 +/- 0.068 (in 3 folds),0.128 +/- 0.000 (in 1 folds),0.562 +/- 0.025 (in 2 folds),0.572 +/- 0.024 (in 2 folds),0.614 +/- 0.028 (in 2 folds),0.610 +/- 0.027 (in 2 folds),0.565,0.284,0.043,Unknown,110,5,115,0.043478,True
elasticnet_cv,0.596 +/- 0.061 (in 3 folds),0.591 +/- 0.072 (in 3 folds),0.656 +/- 0.046 (in 3 folds),0.659 +/- 0.067 (in 3 folds),0.529 +/- 0.122 (in 3 folds),0.196 +/- 0.172 (in 3 folds),0.532,0.221,0.512 +/- 0.134 (in 3 folds),0.136 +/- 0.167 (in 3 folds),0.108 +/- 0.000 (in 1 folds),0.623 +/- 0.056 (in 2 folds),0.620 +/- 0.073 (in 2 folds),0.677 +/- 0.039 (in 2 folds),0.685 +/- 0.071 (in 2 folds),0.513,0.128,0.035,Unknown,111,4,115,0.034783,True
ridge_cv,0.575 +/- 0.068 (in 3 folds),0.559 +/- 0.051 (in 3 folds),0.617 +/- 0.103 (in 3 folds),0.608 +/- 0.095 (in 3 folds),0.504 +/- 0.099 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.5,0.0,0.478 +/- 0.054 (in 3 folds),0.002 +/- 0.003 (in 3 folds),0.128 +/- 0.000 (in 1 folds),0.547 +/- 0.067 (in 2 folds),0.544 +/- 0.063 (in 2 folds),0.578 +/- 0.110 (in 2 folds),0.572 +/- 0.102 (in 2 folds),0.478,-0.018,0.043,Unknown,110,5,115,0.043478,True
dummy_stratified,0.504 +/- 0.027 (in 3 folds),0.501 +/- 0.025 (in 3 folds),0.515 +/- 0.017 (in 3 folds),0.512 +/- 0.014 (in 3 folds),0.424 +/- 0.042 (in 3 folds),0.030 +/- 0.067 (in 3 folds),0.429,0.038,0.392 +/- 0.096 (in 3 folds),0.009 +/- 0.053 (in 3 folds),0.256 +/- 0.000 (in 1 folds),0.494 +/- 0.031 (in 2 folds),0.494 +/- 0.030 (in 2 folds),0.506 +/- 0.008 (in 2 folds),0.504 +/- 0.008 (in 2 folds),0.391,0.019,0.087,Unknown,105,10,115,0.086957,True
dummy_most_frequent,0.500 +/- 0.000 (in 3 folds),0.500 +/- 0.000 (in 3 folds),0.500 +/- 0.000 (in 3 folds),0.500 +/- 0.000 (in 3 folds),0.504 +/- 0.099 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.5,0.0,0.478 +/- 0.054 (in 3 folds),0.002 +/- 0.003 (in 3 folds),0.128 +/- 0.000 (in 1 folds),0.500 +/- 0.000 (in 2 folds),0.500 +/- 0.000 (in 2 folds),0.500 +/- 0.000 (in 2 folds),0.500 +/- 0.000 (in 2 folds),0.478,-0.018,0.043,Unknown,110,5,115,0.043478,True


xgboost,linearsvm_ovr,lasso_multiclass,lasso_cv
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.702 +/- 0.041 (in 3 folds) ROC-AUC (macro OvO): 0.690 +/- 0.038 (in 3 folds) au-PRC (weighted OvO): 0.709 +/- 0.024 (in 3 folds) au-PRC (macro OvO): 0.707 +/- 0.009 (in 3 folds) Accuracy: 0.601 +/- 0.097 (in 3 folds) MCC: 0.357 +/- 0.084 (in 3 folds) Global scores without abstention: Accuracy: 0.598 MCC: 0.345 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.556 +/- 0.053 (in 3 folds) MCC: 0.296 +/- 0.028 (in 3 folds) Unknown/abstention proportion: 0.103 +/- 0.036 (in 2 folds) ROC-AUC (weighted OvO): 0.657 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.651 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.685 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.703 +/- 0.000 (in 1 folds) Global scores with abstention: Accuracy: 0.557 MCC: 0.273 Unknown/abstention proportion: 0.070 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  African 0.85 0.50 0.63 22  Asian 0.67 0.13 0.22 30  Caucasian 0.56 0.84 0.68 58 Hispanic/Latino 0.00 0.00 0.00 5  Unknown 0.00 0.00 0.00 0  accuracy 0.56 115  macro avg 0.42 0.30 0.31 115  weighted avg 0.62 0.56 0.52 115,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.692 +/- 0.052 (in 3 folds) ROC-AUC (macro OvO): 0.697 +/- 0.058 (in 3 folds) au-PRC (weighted OvO): 0.716 +/- 0.018 (in 3 folds) au-PRC (macro OvO): 0.725 +/- 0.040 (in 3 folds) Accuracy: 0.583 +/- 0.078 (in 3 folds) MCC: 0.331 +/- 0.086 (in 3 folds) Global scores without abstention: Accuracy: 0.584 MCC: 0.338 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.573 +/- 0.082 (in 3 folds) MCC: 0.295 +/- 0.029 (in 3 folds) Unknown/abstention proportion: 0.051 +/- 0.000 (in 1 folds) ROC-AUC (weighted OvO): 0.718 +/- 0.038 (in 2 folds) ROC-AUC (macro OvO): 0.723 +/- 0.050 (in 2 folds) au-PRC (weighted OvO): 0.712 +/- 0.024 (in 2 folds) au-PRC 
(macro OvO): 0.727 +/- 0.056 (in 2 folds) Global scores with abstention: Accuracy: 0.574 MCC: 0.292 Unknown/abstention proportion: 0.017 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  African 1.00 0.45 0.62 22  Asian 0.50 0.03 0.06 30  Caucasian 0.54 0.95 0.69 58 Hispanic/Latino 0.00 0.00 0.00 5  Unknown 0.00 0.00 0.00 0  accuracy 0.57 115  macro avg 0.41 0.29 0.28 115  weighted avg 0.60 0.57 0.48 115,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.673 +/- 0.018 (in 3 folds) ROC-AUC (macro OvO): 0.662 +/- 0.012 (in 3 folds) au-PRC (weighted OvO): 0.684 +/- 0.015 (in 3 folds) au-PRC (macro OvO): 0.673 +/- 0.010 (in 3 folds) Accuracy: 0.600 +/- 0.090 (in 3 folds) MCC: 0.371 +/- 0.103 (in 3 folds) Global scores without abstention: Accuracy: 0.602 MCC: 0.382 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.590 +/- 0.092 (in 3 folds) MCC: 0.337 +/- 0.064 (in 3 folds) Unknown/abstention proportion: 0.051 +/- 0.000 (in 1 folds) ROC-AUC (weighted OvO): 0.683 +/- 0.005 (in 2 folds) ROC-AUC (macro OvO): 0.668 +/- 0.005 (in 2 folds) au-PRC (weighted OvO): 0.683 +/- 0.022 (in 2 folds) au-PRC (macro OvO): 0.675 +/- 0.013 (in 2 folds) Global scores with abstention: Accuracy: 0.591 MCC: 0.336 Unknown/abstention proportion: 0.017 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  African 1.00 0.50 0.67 22  Asian 0.50 0.03 0.06 30  Caucasian 0.56 0.97 0.71 58 Hispanic/Latino 0.00 0.00 0.00 5  Unknown 0.00 0.00 0.00 0  accuracy 0.59 115  macro avg 0.41 0.30 0.29 115  weighted avg 0.60 0.59 0.50 115,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.622 +/- 0.073 (in 3 folds) ROC-AUC (macro OvO): 0.612 +/- 0.068 (in 3 folds) au-PRC (weighted OvO): 0.669 +/- 0.052 (in 3 folds) au-PRC (macro OvO): 0.663 +/- 0.048 (in 3 folds) Accuracy: 0.541 +/- 0.133 (in 3 folds) MCC: 0.273 +/- 0.104 
(in 3 folds) Global scores without abstention: Accuracy: 0.546 MCC: 0.263 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.512 +/- 0.157 (in 3 folds) MCC: 0.168 +/- 0.186 (in 3 folds) Unknown/abstention proportion: 0.093 +/- 0.022 (in 2 folds) ROC-AUC (weighted OvO): 0.645 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.639 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.685 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.688 +/- 0.000 (in 1 folds) Global scores with abstention: Accuracy: 0.513 MCC: 0.154 Unknown/abstention proportion: 0.061 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  African 1.00 0.27 0.43 22  Asian 0.00 0.00 0.00 30  Caucasian 0.52 0.91 0.67 58 Hispanic/Latino 0.00 0.00 0.00 5  Unknown 0.00 0.00 0.00 0  accuracy 0.51 115  macro avg 0.30 0.24 0.22 115  weighted avg 0.46 0.51 0.42 115
,,,


rf_multiclass,elasticnet_cv,ridge_cv,dummy_stratified
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.612 +/- 0.089 (in 3 folds) ROC-AUC (macro OvO): 0.609 +/- 0.066 (in 3 folds) au-PRC (weighted OvO): 0.640 +/- 0.048 (in 3 folds) au-PRC (macro OvO): 0.629 +/- 0.038 (in 3 folds) Accuracy: 0.597 +/- 0.145 (in 3 folds) MCC: 0.381 +/- 0.173 (in 3 folds) Global scores without abstention: Accuracy: 0.591 MCC: 0.365 Per-fold scores with abstention (note that abstentions not included in probability-based scores): ROC-AUC (weighted OvO): 0.562 +/- 0.025 (in 2 folds) ROC-AUC (macro OvO): 0.572 +/- 0.024 (in 2 folds) au-PRC (weighted OvO): 0.614 +/- 0.028 (in 2 folds) au-PRC (macro OvO): 0.610 +/- 0.027 (in 2 folds) Accuracy: 0.564 +/- 0.089 (in 3 folds) MCC: 0.319 +/- 0.068 (in 3 folds) Unknown/abstention proportion: 0.128 +/- 0.000 (in 1 folds) Global scores with abstention: Accuracy: 0.565 MCC: 0.284 Unknown/abstention proportion: 0.043 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  African 1.00 0.45 0.62 22  Asian 0.00 0.00 0.00 30  Caucasian 0.55 0.95 0.70 58 Hispanic/Latino 0.00 0.00 0.00 5  Unknown 0.00 0.00 0.00 0  accuracy 0.57 115  macro avg 0.31 0.28 0.26 115  weighted avg 0.47 0.57 0.47 115,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.596 +/- 0.061 (in 3 folds) ROC-AUC (macro OvO): 0.591 +/- 0.072 (in 3 folds) au-PRC (weighted OvO): 0.656 +/- 0.046 (in 3 folds) au-PRC (macro OvO): 0.659 +/- 0.067 (in 3 folds) Accuracy: 0.529 +/- 0.122 (in 3 folds) MCC: 0.196 +/- 0.172 (in 3 folds) Global scores without abstention: Accuracy: 0.532 MCC: 0.221 Per-fold scores with abstention (note that abstentions not included in probability-based scores): ROC-AUC (weighted OvO): 0.623 +/- 0.056 (in 2 folds) ROC-AUC (macro OvO): 0.620 +/- 0.073 (in 2 folds) au-PRC (weighted OvO): 0.677 +/- 0.039 (in 2 folds) au-PRC (macro OvO): 0.685 +/- 0.071 (in 2 folds) Accuracy: 0.512 +/- 0.134 (in 3 folds) MCC: 0.136 +/- 0.167 (in 3 folds) 
Unknown/abstention proportion: 0.108 +/- 0.000 (in 1 folds) Global scores with abstention: Accuracy: 0.513 MCC: 0.128 Unknown/abstention proportion: 0.035 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  African 1.00 0.18 0.31 22  Asian 0.00 0.00 0.00 30  Caucasian 0.51 0.95 0.67 58 Hispanic/Latino 0.00 0.00 0.00 5  Unknown 0.00 0.00 0.00 0  accuracy 0.51 115  macro avg 0.30 0.23 0.19 115  weighted avg 0.45 0.51 0.40 115,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.575 +/- 0.068 (in 3 folds) ROC-AUC (macro OvO): 0.559 +/- 0.051 (in 3 folds) au-PRC (weighted OvO): 0.617 +/- 0.103 (in 3 folds) au-PRC (macro OvO): 0.608 +/- 0.095 (in 3 folds) Accuracy: 0.504 +/- 0.099 (in 3 folds) MCC: 0.000 +/- 0.000 (in 3 folds) Global scores without abstention: Accuracy: 0.500 MCC: 0.000 Per-fold scores with abstention (note that abstentions not included in probability-based scores): ROC-AUC (weighted OvO): 0.547 +/- 0.067 (in 2 folds) ROC-AUC (macro OvO): 0.544 +/- 0.063 (in 2 folds) au-PRC (weighted OvO): 0.578 +/- 0.110 (in 2 folds) au-PRC (macro OvO): 0.572 +/- 0.102 (in 2 folds) Accuracy: 0.478 +/- 0.054 (in 3 folds) MCC: 0.002 +/- 0.003 (in 3 folds) Unknown/abstention proportion: 0.128 +/- 0.000 (in 1 folds) Global scores with abstention: Accuracy: 0.478 MCC: -0.018 Unknown/abstention proportion: 0.043 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  African 0.00 0.00 0.00 22  Asian 0.00 0.00 0.00 30  Caucasian 0.50 0.95 0.65 58 Hispanic/Latino 0.00 0.00 0.00 5  Unknown 0.00 0.00 0.00 0  accuracy 0.48 115  macro avg 0.10 0.19 0.13 115  weighted avg 0.25 0.48 0.33 115,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.504 +/- 0.027 (in 3 folds) ROC-AUC (macro OvO): 0.501 +/- 0.025 (in 3 folds) au-PRC (weighted OvO): 0.515 +/- 0.017 (in 3 folds) au-PRC (macro OvO): 0.512 +/- 0.014 (in 3 folds) Accuracy: 0.424 +/- 0.042 (in 3 folds) 
MCC: 0.030 +/- 0.067 (in 3 folds) Global scores without abstention: Accuracy: 0.429 MCC: 0.038 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.392 +/- 0.096 (in 3 folds) MCC: 0.009 +/- 0.053 (in 3 folds) Unknown/abstention proportion: 0.256 +/- 0.000 (in 1 folds) ROC-AUC (weighted OvO): 0.494 +/- 0.031 (in 2 folds) ROC-AUC (macro OvO): 0.494 +/- 0.030 (in 2 folds) au-PRC (weighted OvO): 0.506 +/- 0.008 (in 2 folds) au-PRC (macro OvO): 0.504 +/- 0.008 (in 2 folds) Global scores with abstention: Accuracy: 0.391 MCC: 0.019 Unknown/abstention proportion: 0.087 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  African 0.09 0.05 0.06 22  Asian 0.33 0.27 0.30 30  Caucasian 0.51 0.62 0.56 58 Hispanic/Latino 0.00 0.00 0.00 5  Unknown 0.00 0.00 0.00 0  accuracy 0.39 115  macro avg 0.19 0.19 0.18 115  weighted avg 0.36 0.39 0.37 115
,,,


dummy_most_frequent
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.500 +/- 0.000 (in 3 folds) ROC-AUC (macro OvO): 0.500 +/- 0.000 (in 3 folds) au-PRC (weighted OvO): 0.500 +/- 0.000 (in 3 folds) au-PRC (macro OvO): 0.500 +/- 0.000 (in 3 folds) Accuracy: 0.504 +/- 0.099 (in 3 folds) MCC: 0.000 +/- 0.000 (in 3 folds) Global scores without abstention: Accuracy: 0.500 MCC: 0.000 Per-fold scores with abstention (note that abstentions not included in probability-based scores): ROC-AUC (weighted OvO): 0.500 +/- 0.000 (in 2 folds) ROC-AUC (macro OvO): 0.500 +/- 0.000 (in 2 folds) au-PRC (weighted OvO): 0.500 +/- 0.000 (in 2 folds) au-PRC (macro OvO): 0.500 +/- 0.000 (in 2 folds) Accuracy: 0.478 +/- 0.054 (in 3 folds) MCC: 0.002 +/- 0.003 (in 3 folds) Unknown/abstention proportion: 0.128 +/- 0.000 (in 1 folds) Global scores with abstention: Accuracy: 0.478 MCC: -0.018 Unknown/abstention proportion: 0.043 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  African 0.00 0.00 0.00 22  Asian 0.00 0.00 0.00 30  Caucasian 0.50 0.95 0.65 58 Hispanic/Latino 0.00 0.00 0.00 5  Unknown 0.00 0.00 0.00 0  accuracy 0.48 115  macro avg 0.10 0.19 0.13 115  weighted avg 0.25 0.48 0.33 115


## Apply train-smaller model -- Test set performance - With and without tuning on validation set

Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,Accuracy per fold with abstention,MCC per fold with abstention,Unknown/abstention proportion per fold with abstention,ROC-AUC (weighted OvO) per fold with abstention,ROC-AUC (macro OvO) per fold with abstention,au-PRC (weighted OvO) per fold with abstention,au-PRC (macro OvO) per fold with abstention,Accuracy global with abstention,MCC global with abstention,Unknown/abstention proportion global with abstention,Abstention label global with abstention,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
lasso_multiclass,0.671 +/- 0.043 (in 3 folds),0.676 +/- 0.028 (in 3 folds),0.706 +/- 0.049 (in 3 folds),0.703 +/- 0.055 (in 3 folds),0.674 +/- 0.078 (in 3 folds),0.395 +/- 0.083 (in 3 folds),0.677,0.394,0.670 +/- 0.082 (in 3 folds),0.391 +/- 0.091 (in 3 folds),0.018 +/- 0.000 (in 1 folds),0.681 +/- 0.056 (in 2 folds),0.688 +/- 0.027 (in 2 folds),0.722 +/- 0.057 (in 2 folds),0.724 +/- 0.059 (in 2 folds),0.673,0.389,0.006,Unknown,164.0,1.0,165.0,0.006061,True
lasso_multiclass.decision_thresholds_tuned,0.671 +/- 0.043 (in 3 folds),0.676 +/- 0.028 (in 3 folds),0.706 +/- 0.049 (in 3 folds),0.703 +/- 0.055 (in 3 folds),0.632 +/- 0.101 (in 3 folds),0.331 +/- 0.119 (in 3 folds),0.634,0.321,0.629 +/- 0.106 (in 3 folds),0.332 +/- 0.117 (in 3 folds),0.018 +/- 0.000 (in 1 folds),0.681 +/- 0.056 (in 2 folds),0.688 +/- 0.027 (in 2 folds),0.722 +/- 0.057 (in 2 folds),0.724 +/- 0.059 (in 2 folds),0.63,0.32,0.006,Unknown,164.0,1.0,165.0,0.006061,True
lasso_cv,0.635 +/- 0.047 (in 3 folds),0.673 +/- 0.041 (in 3 folds),0.676 +/- 0.041 (in 3 folds),0.693 +/- 0.040 (in 3 folds),0.666 +/- 0.018 (in 3 folds),0.292 +/- 0.257 (in 3 folds),0.667,0.375,0.632 +/- 0.068 (in 3 folds),0.222 +/- 0.263 (in 3 folds),0.080 +/- 0.089 (in 2 folds),0.651 +/- 0.000 (in 1 folds),0.644 +/- 0.000 (in 1 folds),0.703 +/- 0.000 (in 1 folds),0.688 +/- 0.000 (in 1 folds),0.63,0.284,0.055,Unknown,156.0,9.0,165.0,0.054545,True
lasso_cv.decision_thresholds_tuned,0.635 +/- 0.047 (in 3 folds),0.673 +/- 0.041 (in 3 folds),0.676 +/- 0.041 (in 3 folds),0.693 +/- 0.040 (in 3 folds),0.644 +/- 0.051 (in 3 folds),0.375 +/- 0.147 (in 3 folds),0.641,0.323,0.609 +/- 0.061 (in 3 folds),0.313 +/- 0.146 (in 3 folds),0.080 +/- 0.089 (in 2 folds),0.651 +/- 0.000 (in 1 folds),0.644 +/- 0.000 (in 1 folds),0.703 +/- 0.000 (in 1 folds),0.688 +/- 0.000 (in 1 folds),0.606,0.278,0.055,Unknown,156.0,9.0,165.0,0.054545,True
elasticnet_cv,0.629 +/- 0.034 (in 3 folds),0.636 +/- 0.034 (in 3 folds),0.675 +/- 0.019 (in 3 folds),0.671 +/- 0.009 (in 3 folds),0.635 +/- 0.050 (in 3 folds),0.227 +/- 0.203 (in 3 folds),0.637,0.285,0.604 +/- 0.066 (in 3 folds),0.171 +/- 0.152 (in 3 folds),0.143 +/- 0.000 (in 1 folds),0.627 +/- 0.048 (in 2 folds),0.624 +/- 0.040 (in 2 folds),0.682 +/- 0.021 (in 2 folds),0.672 +/- 0.013 (in 2 folds),0.606,0.203,0.048,Unknown,157.0,8.0,165.0,0.048485,True
elasticnet_cv.decision_thresholds_tuned,0.629 +/- 0.034 (in 3 folds),0.636 +/- 0.034 (in 3 folds),0.675 +/- 0.019 (in 3 folds),0.671 +/- 0.009 (in 3 folds),0.666 +/- 0.040 (in 3 folds),0.367 +/- 0.058 (in 3 folds),0.669,0.37,0.635 +/- 0.079 (in 3 folds),0.312 +/- 0.093 (in 3 folds),0.143 +/- 0.000 (in 1 folds),0.627 +/- 0.048 (in 2 folds),0.624 +/- 0.040 (in 2 folds),0.682 +/- 0.021 (in 2 folds),0.672 +/- 0.013 (in 2 folds),0.636,0.32,0.048,Unknown,157.0,8.0,165.0,0.048485,True
linearsvm_ovr,0.622 +/- 0.028 (in 3 folds),0.623 +/- 0.036 (in 3 folds),0.669 +/- 0.009 (in 3 folds),0.660 +/- 0.018 (in 3 folds),0.669 +/- 0.098 (in 3 folds),0.389 +/- 0.112 (in 3 folds),0.675,0.381,0.662 +/- 0.105 (in 3 folds),0.372 +/- 0.129 (in 3 folds),0.019 +/- 0.002 (in 2 folds),0.605 +/- 0.000 (in 1 folds),0.626 +/- 0.000 (in 1 folds),0.677 +/- 0.000 (in 1 folds),0.671 +/- 0.000 (in 1 folds),0.667,0.362,0.012,Unknown,163.0,2.0,165.0,0.012121,True
linearsvm_ovr.decision_thresholds_tuned,0.622 +/- 0.028 (in 3 folds),0.623 +/- 0.036 (in 3 folds),0.669 +/- 0.009 (in 3 folds),0.660 +/- 0.018 (in 3 folds),0.635 +/- 0.068 (in 3 folds),0.334 +/- 0.067 (in 3 folds),0.638,0.304,0.628 +/- 0.074 (in 3 folds),0.318 +/- 0.062 (in 3 folds),0.019 +/- 0.002 (in 2 folds),0.605 +/- 0.000 (in 1 folds),0.626 +/- 0.000 (in 1 folds),0.677 +/- 0.000 (in 1 folds),0.671 +/- 0.000 (in 1 folds),0.63,0.296,0.012,Unknown,163.0,2.0,165.0,0.012121,True
rf_multiclass,0.606 +/- 0.054 (in 3 folds),0.612 +/- 0.042 (in 3 folds),0.630 +/- 0.020 (in 3 folds),0.620 +/- 0.006 (in 3 folds),0.674 +/- 0.038 (in 3 folds),0.374 +/- 0.085 (in 3 folds),0.675,0.382,0.652 +/- 0.052 (in 3 folds),0.341 +/- 0.042 (in 3 folds),0.049 +/- 0.044 (in 2 folds),0.545 +/- 0.000 (in 1 folds),0.570 +/- 0.000 (in 1 folds),0.612 +/- 0.000 (in 1 folds),0.622 +/- 0.000 (in 1 folds),0.655,0.342,0.03,Unknown,160.0,5.0,165.0,0.030303,True
rf_multiclass.decision_thresholds_tuned,0.606 +/- 0.054 (in 3 folds),0.612 +/- 0.042 (in 3 folds),0.630 +/- 0.020 (in 3 folds),0.620 +/- 0.006 (in 3 folds),0.499 +/- 0.271 (in 3 folds),0.306 +/- 0.189 (in 3 folds),0.481,0.152,0.477 +/- 0.252 (in 3 folds),0.274 +/- 0.153 (in 3 folds),0.049 +/- 0.044 (in 2 folds),0.545 +/- 0.000 (in 1 folds),0.570 +/- 0.000 (in 1 folds),0.612 +/- 0.000 (in 1 folds),0.622 +/- 0.000 (in 1 folds),0.467,0.146,0.03,Unknown,160.0,5.0,165.0,0.030303,False

Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,Accuracy per fold with abstention,MCC per fold with abstention,Unknown/abstention proportion per fold with abstention,ROC-AUC (weighted OvO) per fold with abstention,ROC-AUC (macro OvO) per fold with abstention,au-PRC (weighted OvO) per fold with abstention,au-PRC (macro OvO) per fold with abstention,Accuracy global with abstention,MCC global with abstention,Unknown/abstention proportion global with abstention,Abstention label global with abstention,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
lasso_multiclass,0.671 +/- 0.043 (in 3 folds),0.676 +/- 0.028 (in 3 folds),0.706 +/- 0.049 (in 3 folds),0.703 +/- 0.055 (in 3 folds),0.674 +/- 0.078 (in 3 folds),0.395 +/- 0.083 (in 3 folds),0.677,0.394,0.670 +/- 0.082 (in 3 folds),0.391 +/- 0.091 (in 3 folds),0.018 +/- 0.000 (in 1 folds),0.681 +/- 0.056 (in 2 folds),0.688 +/- 0.027 (in 2 folds),0.722 +/- 0.057 (in 2 folds),0.724 +/- 0.059 (in 2 folds),0.673,0.389,0.006,Unknown,164,1,165,0.006061,True
lasso_multiclass.decision_thresholds_tuned,0.671 +/- 0.043 (in 3 folds),0.676 +/- 0.028 (in 3 folds),0.706 +/- 0.049 (in 3 folds),0.703 +/- 0.055 (in 3 folds),0.632 +/- 0.101 (in 3 folds),0.331 +/- 0.119 (in 3 folds),0.634,0.321,0.629 +/- 0.106 (in 3 folds),0.332 +/- 0.117 (in 3 folds),0.018 +/- 0.000 (in 1 folds),0.681 +/- 0.056 (in 2 folds),0.688 +/- 0.027 (in 2 folds),0.722 +/- 0.057 (in 2 folds),0.724 +/- 0.059 (in 2 folds),0.63,0.32,0.006,Unknown,164,1,165,0.006061,True
lasso_cv,0.635 +/- 0.047 (in 3 folds),0.673 +/- 0.041 (in 3 folds),0.676 +/- 0.041 (in 3 folds),0.693 +/- 0.040 (in 3 folds),0.666 +/- 0.018 (in 3 folds),0.292 +/- 0.257 (in 3 folds),0.667,0.375,0.632 +/- 0.068 (in 3 folds),0.222 +/- 0.263 (in 3 folds),0.080 +/- 0.089 (in 2 folds),0.651 +/- 0.000 (in 1 folds),0.644 +/- 0.000 (in 1 folds),0.703 +/- 0.000 (in 1 folds),0.688 +/- 0.000 (in 1 folds),0.63,0.284,0.055,Unknown,156,9,165,0.054545,True
lasso_cv.decision_thresholds_tuned,0.635 +/- 0.047 (in 3 folds),0.673 +/- 0.041 (in 3 folds),0.676 +/- 0.041 (in 3 folds),0.693 +/- 0.040 (in 3 folds),0.644 +/- 0.051 (in 3 folds),0.375 +/- 0.147 (in 3 folds),0.641,0.323,0.609 +/- 0.061 (in 3 folds),0.313 +/- 0.146 (in 3 folds),0.080 +/- 0.089 (in 2 folds),0.651 +/- 0.000 (in 1 folds),0.644 +/- 0.000 (in 1 folds),0.703 +/- 0.000 (in 1 folds),0.688 +/- 0.000 (in 1 folds),0.606,0.278,0.055,Unknown,156,9,165,0.054545,True
elasticnet_cv,0.629 +/- 0.034 (in 3 folds),0.636 +/- 0.034 (in 3 folds),0.675 +/- 0.019 (in 3 folds),0.671 +/- 0.009 (in 3 folds),0.635 +/- 0.050 (in 3 folds),0.227 +/- 0.203 (in 3 folds),0.637,0.285,0.604 +/- 0.066 (in 3 folds),0.171 +/- 0.152 (in 3 folds),0.143 +/- 0.000 (in 1 folds),0.627 +/- 0.048 (in 2 folds),0.624 +/- 0.040 (in 2 folds),0.682 +/- 0.021 (in 2 folds),0.672 +/- 0.013 (in 2 folds),0.606,0.203,0.048,Unknown,157,8,165,0.048485,True
elasticnet_cv.decision_thresholds_tuned,0.629 +/- 0.034 (in 3 folds),0.636 +/- 0.034 (in 3 folds),0.675 +/- 0.019 (in 3 folds),0.671 +/- 0.009 (in 3 folds),0.666 +/- 0.040 (in 3 folds),0.367 +/- 0.058 (in 3 folds),0.669,0.37,0.635 +/- 0.079 (in 3 folds),0.312 +/- 0.093 (in 3 folds),0.143 +/- 0.000 (in 1 folds),0.627 +/- 0.048 (in 2 folds),0.624 +/- 0.040 (in 2 folds),0.682 +/- 0.021 (in 2 folds),0.672 +/- 0.013 (in 2 folds),0.636,0.32,0.048,Unknown,157,8,165,0.048485,True
linearsvm_ovr,0.622 +/- 0.028 (in 3 folds),0.623 +/- 0.036 (in 3 folds),0.669 +/- 0.009 (in 3 folds),0.660 +/- 0.018 (in 3 folds),0.669 +/- 0.098 (in 3 folds),0.389 +/- 0.112 (in 3 folds),0.675,0.381,0.662 +/- 0.105 (in 3 folds),0.372 +/- 0.129 (in 3 folds),0.019 +/- 0.002 (in 2 folds),0.605 +/- 0.000 (in 1 folds),0.626 +/- 0.000 (in 1 folds),0.677 +/- 0.000 (in 1 folds),0.671 +/- 0.000 (in 1 folds),0.667,0.362,0.012,Unknown,163,2,165,0.012121,True
linearsvm_ovr.decision_thresholds_tuned,0.622 +/- 0.028 (in 3 folds),0.623 +/- 0.036 (in 3 folds),0.669 +/- 0.009 (in 3 folds),0.660 +/- 0.018 (in 3 folds),0.635 +/- 0.068 (in 3 folds),0.334 +/- 0.067 (in 3 folds),0.638,0.304,0.628 +/- 0.074 (in 3 folds),0.318 +/- 0.062 (in 3 folds),0.019 +/- 0.002 (in 2 folds),0.605 +/- 0.000 (in 1 folds),0.626 +/- 0.000 (in 1 folds),0.677 +/- 0.000 (in 1 folds),0.671 +/- 0.000 (in 1 folds),0.63,0.296,0.012,Unknown,163,2,165,0.012121,True
rf_multiclass,0.606 +/- 0.054 (in 3 folds),0.612 +/- 0.042 (in 3 folds),0.630 +/- 0.020 (in 3 folds),0.620 +/- 0.006 (in 3 folds),0.674 +/- 0.038 (in 3 folds),0.374 +/- 0.085 (in 3 folds),0.675,0.382,0.652 +/- 0.052 (in 3 folds),0.341 +/- 0.042 (in 3 folds),0.049 +/- 0.044 (in 2 folds),0.545 +/- 0.000 (in 1 folds),0.570 +/- 0.000 (in 1 folds),0.612 +/- 0.000 (in 1 folds),0.622 +/- 0.000 (in 1 folds),0.655,0.342,0.03,Unknown,160,5,165,0.030303,True
rf_multiclass.decision_thresholds_tuned,0.606 +/- 0.054 (in 3 folds),0.612 +/- 0.042 (in 3 folds),0.630 +/- 0.020 (in 3 folds),0.620 +/- 0.006 (in 3 folds),0.499 +/- 0.271 (in 3 folds),0.306 +/- 0.189 (in 3 folds),0.481,0.152,0.477 +/- 0.252 (in 3 folds),0.274 +/- 0.153 (in 3 folds),0.049 +/- 0.044 (in 2 folds),0.545 +/- 0.000 (in 1 folds),0.570 +/- 0.000 (in 1 folds),0.612 +/- 0.000 (in 1 folds),0.622 +/- 0.000 (in 1 folds),0.467,0.146,0.03,Unknown,160,5,165,0.030303,False


lasso_multiclass,lasso_multiclass.decision_thresholds_tuned,lasso_cv,lasso_cv.decision_thresholds_tuned
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.671 +/- 0.043 (in 3 folds) ROC-AUC (macro OvO): 0.676 +/- 0.028 (in 3 folds) au-PRC (weighted OvO): 0.706 +/- 0.049 (in 3 folds) au-PRC (macro OvO): 0.703 +/- 0.055 (in 3 folds) Accuracy: 0.674 +/- 0.078 (in 3 folds) MCC: 0.395 +/- 0.083 (in 3 folds) Global scores without abstention: Accuracy: 0.677 MCC: 0.394 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.670 +/- 0.082 (in 3 folds) MCC: 0.391 +/- 0.091 (in 3 folds) Unknown/abstention proportion: 0.018 +/- 0.000 (in 1 folds) ROC-AUC (weighted OvO): 0.681 +/- 0.056 (in 2 folds) ROC-AUC (macro OvO): 0.688 +/- 0.027 (in 2 folds) au-PRC (weighted OvO): 0.722 +/- 0.057 (in 2 folds) au-PRC (macro OvO): 0.724 +/- 0.059 (in 2 folds) Global scores with abstention: Accuracy: 0.673 MCC: 0.389 Unknown/abstention proportion: 0.006 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  African 1.00 0.43 0.60 30  Asian 0.50 0.03 0.06 32  Caucasian 0.65 1.00 0.79 97 Hispanic/Latino 0.00 0.00 0.00 6  Unknown 0.00 0.00 0.00 0  accuracy 0.67 165  macro avg 0.43 0.29 0.29 165  weighted avg 0.66 0.67 0.58 165,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.671 +/- 0.043 (in 3 folds) ROC-AUC (macro OvO): 0.676 +/- 0.028 (in 3 folds) au-PRC (weighted OvO): 0.706 +/- 0.049 (in 3 folds) au-PRC (macro OvO): 0.703 +/- 0.055 (in 3 folds) Accuracy: 0.632 +/- 0.101 (in 3 folds) MCC: 0.331 +/- 0.119 (in 3 folds) Global scores without abstention: Accuracy: 0.634 MCC: 0.321 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.629 +/- 0.106 (in 3 folds) MCC: 0.332 +/- 0.117 (in 3 folds) Unknown/abstention proportion: 0.018 +/- 0.000 (in 1 folds) ROC-AUC (weighted OvO): 0.681 +/- 0.056 (in 2 folds) ROC-AUC (macro OvO): 0.688 +/- 0.027 (in 2 folds) au-PRC (weighted OvO): 0.722 +/- 0.057 (in 2 folds) au-PRC 
(macro OvO): 0.724 +/- 0.059 (in 2 folds) Global scores with abstention: Accuracy: 0.630 MCC: 0.320 Unknown/abstention proportion: 0.006 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  African 0.69 0.73 0.71 30  Asian 0.22 0.12 0.16 32  Caucasian 0.68 0.80 0.74 97 Hispanic/Latino 0.00 0.00 0.00 6  Unknown 0.00 0.00 0.00 0  accuracy 0.63 165  macro avg 0.32 0.33 0.32 165  weighted avg 0.57 0.63 0.59 165,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.635 +/- 0.047 (in 3 folds) ROC-AUC (macro OvO): 0.673 +/- 0.041 (in 3 folds) au-PRC (weighted OvO): 0.676 +/- 0.041 (in 3 folds) au-PRC (macro OvO): 0.693 +/- 0.040 (in 3 folds) Accuracy: 0.666 +/- 0.018 (in 3 folds) MCC: 0.292 +/- 0.257 (in 3 folds) Global scores without abstention: Accuracy: 0.667 MCC: 0.375 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.632 +/- 0.068 (in 3 folds) MCC: 0.222 +/- 0.263 (in 3 folds) Unknown/abstention proportion: 0.080 +/- 0.089 (in 2 folds) ROC-AUC (weighted OvO): 0.651 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.644 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.703 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.688 +/- 0.000 (in 1 folds) Global scores with abstention: Accuracy: 0.630 MCC: 0.284 Unknown/abstention proportion: 0.055 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  African 0.92 0.37 0.52 30  Asian 1.00 0.03 0.06 32  Caucasian 0.64 0.95 0.77 97 Hispanic/Latino 0.00 0.00 0.00 6  Unknown 0.00 0.00 0.00 0  accuracy 0.63 165  macro avg 0.51 0.27 0.27 165  weighted avg 0.74 0.63 0.56 165,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.635 +/- 0.047 (in 3 folds) ROC-AUC (macro OvO): 0.673 +/- 0.041 (in 3 folds) au-PRC (weighted OvO): 0.676 +/- 0.041 (in 3 folds) au-PRC (macro OvO): 0.693 +/- 0.040 (in 3 folds) Accuracy: 0.644 +/- 0.051 (in 3 folds) MCC: 0.375 +/- 0.147 
(in 3 folds) Global scores without abstention: Accuracy: 0.641 MCC: 0.323 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.609 +/- 0.061 (in 3 folds) MCC: 0.313 +/- 0.146 (in 3 folds) Unknown/abstention proportion: 0.080 +/- 0.089 (in 2 folds) ROC-AUC (weighted OvO): 0.651 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.644 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.703 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.688 +/- 0.000 (in 1 folds) Global scores with abstention: Accuracy: 0.606 MCC: 0.278 Unknown/abstention proportion: 0.055 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  African 0.64 0.70 0.67 30  Asian 0.00 0.00 0.00 32  Caucasian 0.66 0.81 0.73 97 Hispanic/Latino 0.00 0.00 0.00 6  Unknown 0.00 0.00 0.00 0  accuracy 0.61 165  macro avg 0.26 0.30 0.28 165  weighted avg 0.50 0.61 0.55 165
,,,


elasticnet_cv,elasticnet_cv.decision_thresholds_tuned,linearsvm_ovr,linearsvm_ovr.decision_thresholds_tuned
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.629 +/- 0.034 (in 3 folds) ROC-AUC (macro OvO): 0.636 +/- 0.034 (in 3 folds) au-PRC (weighted OvO): 0.675 +/- 0.019 (in 3 folds) au-PRC (macro OvO): 0.671 +/- 0.009 (in 3 folds) Accuracy: 0.635 +/- 0.050 (in 3 folds) MCC: 0.227 +/- 0.203 (in 3 folds) Global scores without abstention: Accuracy: 0.637 MCC: 0.285 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.604 +/- 0.066 (in 3 folds) MCC: 0.171 +/- 0.152 (in 3 folds) Unknown/abstention proportion: 0.143 +/- 0.000 (in 1 folds) ROC-AUC (weighted OvO): 0.627 +/- 0.048 (in 2 folds) ROC-AUC (macro OvO): 0.624 +/- 0.040 (in 2 folds) au-PRC (weighted OvO): 0.682 +/- 0.021 (in 2 folds) au-PRC (macro OvO): 0.672 +/- 0.013 (in 2 folds) Global scores with abstention: Accuracy: 0.606 MCC: 0.203 Unknown/abstention proportion: 0.048 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  African 1.00 0.20 0.33 30  Asian 1.00 0.03 0.06 32  Caucasian 0.62 0.96 0.75 97 Hispanic/Latino 0.00 0.00 0.00 6  Unknown 0.00 0.00 0.00 0  accuracy 0.61 165  macro avg 0.52 0.24 0.23 165  weighted avg 0.74 0.61 0.52 165,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.629 +/- 0.034 (in 3 folds) ROC-AUC (macro OvO): 0.636 +/- 0.034 (in 3 folds) au-PRC (weighted OvO): 0.675 +/- 0.019 (in 3 folds) au-PRC (macro OvO): 0.671 +/- 0.009 (in 3 folds) Accuracy: 0.666 +/- 0.040 (in 3 folds) MCC: 0.367 +/- 0.058 (in 3 folds) Global scores without abstention: Accuracy: 0.669 MCC: 0.370 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.635 +/- 0.079 (in 3 folds) MCC: 0.312 +/- 0.093 (in 3 folds) Unknown/abstention proportion: 0.143 +/- 0.000 (in 1 folds) ROC-AUC (weighted OvO): 0.627 +/- 0.048 (in 2 folds) ROC-AUC (macro OvO): 0.624 +/- 0.040 (in 2 folds) au-PRC (weighted OvO): 0.682 +/- 0.021 (in 2 folds) au-PRC 
(macro OvO): 0.672 +/- 0.013 (in 2 folds) Global scores with abstention: Accuracy: 0.636 MCC: 0.320 Unknown/abstention proportion: 0.048 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  African 0.64 0.60 0.62 30  Asian 0.00 0.00 0.00 32  Caucasian 0.67 0.90 0.77 97 Hispanic/Latino 0.00 0.00 0.00 6  Unknown 0.00 0.00 0.00 0  accuracy 0.64 165  macro avg 0.26 0.30 0.28 165  weighted avg 0.51 0.64 0.57 165,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.622 +/- 0.028 (in 3 folds) ROC-AUC (macro OvO): 0.623 +/- 0.036 (in 3 folds) au-PRC (weighted OvO): 0.669 +/- 0.009 (in 3 folds) au-PRC (macro OvO): 0.660 +/- 0.018 (in 3 folds) Accuracy: 0.669 +/- 0.098 (in 3 folds) MCC: 0.389 +/- 0.112 (in 3 folds) Global scores without abstention: Accuracy: 0.675 MCC: 0.381 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.662 +/- 0.105 (in 3 folds) MCC: 0.372 +/- 0.129 (in 3 folds) Unknown/abstention proportion: 0.019 +/- 0.002 (in 2 folds) ROC-AUC (weighted OvO): 0.605 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.626 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.677 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.671 +/- 0.000 (in 1 folds) Global scores with abstention: Accuracy: 0.667 MCC: 0.362 Unknown/abstention proportion: 0.012 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  African 1.00 0.50 0.67 30  Asian 0.25 0.03 0.06 32  Caucasian 0.65 0.97 0.78 97 Hispanic/Latino 0.00 0.00 0.00 6  Unknown 0.00 0.00 0.00 0  accuracy 0.67 165  macro avg 0.38 0.30 0.30 165  weighted avg 0.61 0.67 0.59 165,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.622 +/- 0.028 (in 3 folds) ROC-AUC (macro OvO): 0.623 +/- 0.036 (in 3 folds) au-PRC (weighted OvO): 0.669 +/- 0.009 (in 3 folds) au-PRC (macro OvO): 0.660 +/- 0.018 (in 3 folds) Accuracy: 0.635 +/- 0.068 (in 3 folds) MCC: 0.334 +/- 0.067 
(in 3 folds) Global scores without abstention: Accuracy: 0.638 MCC: 0.304 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.628 +/- 0.074 (in 3 folds) MCC: 0.318 +/- 0.062 (in 3 folds) Unknown/abstention proportion: 0.019 +/- 0.002 (in 2 folds) ROC-AUC (weighted OvO): 0.605 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.626 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.677 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.671 +/- 0.000 (in 1 folds) Global scores with abstention: Accuracy: 0.630 MCC: 0.296 Unknown/abstention proportion: 0.012 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  African 0.72 0.60 0.65 30  Asian 0.23 0.09 0.13 32  Caucasian 0.66 0.86 0.75 97 Hispanic/Latino 0.00 0.00 0.00 6  Unknown 0.00 0.00 0.00 0  accuracy 0.63 165  macro avg 0.32 0.31 0.31 165  weighted avg 0.57 0.63 0.58 165
,,,


rf_multiclass,rf_multiclass.decision_thresholds_tuned,ridge_cv,ridge_cv.decision_thresholds_tuned
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.606 +/- 0.054 (in 3 folds) ROC-AUC (macro OvO): 0.612 +/- 0.042 (in 3 folds) au-PRC (weighted OvO): 0.630 +/- 0.020 (in 3 folds) au-PRC (macro OvO): 0.620 +/- 0.006 (in 3 folds) Accuracy: 0.674 +/- 0.038 (in 3 folds) MCC: 0.374 +/- 0.085 (in 3 folds) Global scores without abstention: Accuracy: 0.675 MCC: 0.382 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.652 +/- 0.052 (in 3 folds) MCC: 0.341 +/- 0.042 (in 3 folds) Unknown/abstention proportion: 0.049 +/- 0.044 (in 2 folds) ROC-AUC (weighted OvO): 0.545 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.570 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.612 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.622 +/- 0.000 (in 1 folds) Global scores with abstention: Accuracy: 0.655 MCC: 0.342 Unknown/abstention proportion: 0.030 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  African 0.77 0.57 0.65 30  Asian 0.50 0.03 0.06 32  Caucasian 0.66 0.93 0.77 97 Hispanic/Latino 0.00 0.00 0.00 6  Unknown 0.00 0.00 0.00 0  accuracy 0.65 165  macro avg 0.39 0.31 0.30 165  weighted avg 0.63 0.65 0.58 165,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.606 +/- 0.054 (in 3 folds) ROC-AUC (macro OvO): 0.612 +/- 0.042 (in 3 folds) au-PRC (weighted OvO): 0.630 +/- 0.020 (in 3 folds) au-PRC (macro OvO): 0.620 +/- 0.006 (in 3 folds) Accuracy: 0.499 +/- 0.271 (in 3 folds) MCC: 0.306 +/- 0.189 (in 3 folds) Global scores without abstention: Accuracy: 0.481 MCC: 0.152 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.477 +/- 0.252 (in 3 folds) MCC: 0.274 +/- 0.153 (in 3 folds) Unknown/abstention proportion: 0.049 +/- 0.044 (in 2 folds) ROC-AUC (weighted OvO): 0.545 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.570 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.612 +/- 0.000 (in 1 folds) au-PRC 
(macro OvO): 0.622 +/- 0.000 (in 1 folds) Global scores with abstention: Accuracy: 0.467 MCC: 0.146 Unknown/abstention proportion: 0.030 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  African 0.45 0.60 0.51 30  Asian 0.23 0.22 0.23 32  Caucasian 0.63 0.54 0.58 97 Hispanic/Latino 0.00 0.00 0.00 6  Unknown 0.00 0.00 0.00 0  accuracy 0.47 165  macro avg 0.26 0.27 0.26 165  weighted avg 0.50 0.47 0.48 165,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.584 +/- 0.074 (in 3 folds) ROC-AUC (macro OvO): 0.594 +/- 0.082 (in 3 folds) au-PRC (weighted OvO): 0.617 +/- 0.102 (in 3 folds) au-PRC (macro OvO): 0.624 +/- 0.112 (in 3 folds) Accuracy: 0.581 +/- 0.090 (in 3 folds) MCC: 0.000 +/- 0.000 (in 3 folds) Global scores without abstention: Accuracy: 0.588 MCC: 0.000 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.564 +/- 0.109 (in 3 folds) MCC: 0.002 +/- 0.064 (in 3 folds) Unknown/abstention proportion: 0.049 +/- 0.044 (in 2 folds) ROC-AUC (weighted OvO): 0.618 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.654 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.673 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.719 +/- 0.000 (in 1 folds) Global scores with abstention: Accuracy: 0.570 MCC: -0.002 Unknown/abstention proportion: 0.030 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  African 0.00 0.00 0.00 30  Asian 0.00 0.00 0.00 32  Caucasian 0.59 0.97 0.73 97 Hispanic/Latino 0.00 0.00 0.00 6  Unknown 0.00 0.00 0.00 0  accuracy 0.57 165  macro avg 0.12 0.19 0.15 165  weighted avg 0.35 0.57 0.43 165,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.584 +/- 0.074 (in 3 folds) ROC-AUC (macro OvO): 0.594 +/- 0.082 (in 3 folds) au-PRC (weighted OvO): 0.617 +/- 0.102 (in 3 folds) au-PRC (macro OvO): 0.624 +/- 0.112 (in 3 folds) Accuracy: 0.504 +/- 0.279 (in 3 folds) MCC: 0.146 +/- 0.254 
(in 3 folds) Global scores without abstention: Accuracy: 0.500 MCC: 0.146 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.486 +/- 0.269 (in 3 folds) MCC: 0.080 +/- 0.229 (in 3 folds) Unknown/abstention proportion: 0.049 +/- 0.044 (in 2 folds) ROC-AUC (weighted OvO): 0.618 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.654 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.673 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.719 +/- 0.000 (in 1 folds) Global scores with abstention: Accuracy: 0.485 MCC: 0.137 Unknown/abstention proportion: 0.030 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  African 0.28 0.60 0.38 30  Asian 0.00 0.00 0.00 32  Caucasian 0.65 0.64 0.65 97 Hispanic/Latino 0.00 0.00 0.00 6  Unknown 0.00 0.00 0.00 0  accuracy 0.48 165  macro avg 0.19 0.25 0.20 165  weighted avg 0.43 0.48 0.45 165
,,,


xgboost,xgboost.decision_thresholds_tuned
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.567 +/- 0.075 (in 3 folds) ROC-AUC (macro OvO): 0.567 +/- 0.064 (in 3 folds) au-PRC (weighted OvO): 0.632 +/- 0.039 (in 3 folds) au-PRC (macro OvO): 0.629 +/- 0.013 (in 3 folds) Accuracy: 0.596 +/- 0.099 (in 3 folds) MCC: 0.270 +/- 0.239 (in 3 folds) Global scores without abstention: Accuracy: 0.591 MCC: 0.216 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.572 +/- 0.087 (in 3 folds) MCC: 0.235 +/- 0.213 (in 3 folds) Unknown/abstention proportion: 0.038 +/- 0.036 (in 3 folds) Global scores with abstention: Accuracy: 0.570 MCC: 0.195 Unknown/abstention proportion: 0.036 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  African 0.65 0.57 0.61 30  Asian 0.10 0.03 0.05 32  Caucasian 0.63 0.78 0.70 97 Hispanic/Latino 0.00 0.00 0.00 6  Unknown 0.00 0.00 0.00 0  accuracy 0.57 165  macro avg 0.28 0.28 0.27 165  weighted avg 0.51 0.57 0.53 165,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.567 +/- 0.075 (in 3 folds) ROC-AUC (macro OvO): 0.567 +/- 0.064 (in 3 folds) au-PRC (weighted OvO): 0.632 +/- 0.039 (in 3 folds) au-PRC (macro OvO): 0.629 +/- 0.013 (in 3 folds) Accuracy: 0.622 +/- 0.093 (in 3 folds) MCC: 0.293 +/- 0.296 (in 3 folds) Global scores without abstention: Accuracy: 0.616 MCC: 0.258 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.597 +/- 0.077 (in 3 folds) MCC: 0.247 +/- 0.254 (in 3 folds) Unknown/abstention proportion: 0.038 +/- 0.036 (in 3 folds) Global scores with abstention: Accuracy: 0.594 MCC: 0.228 Unknown/abstention proportion: 0.036 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  African 0.83 0.50 0.62 30  Asian 0.17 0.03 0.05 32  Caucasian 0.64 0.85 0.73 97 Hispanic/Latino 0.00 0.00 0.00 6  Unknown 0.00 0.00 0.00 0  accuracy 0.59 165  
macro avg 0.33 0.28 0.28 165  weighted avg 0.56 0.59 0.55 165
,


---

# GeneLocus.TCR, TargetObsColumnEnum.age_group_healthy_only trained on train_smaller set

## Specimen predictions on validation set

Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,Accuracy per fold with abstention,MCC per fold with abstention,Unknown/abstention proportion per fold with abstention,ROC-AUC (weighted OvO) per fold with abstention,ROC-AUC (macro OvO) per fold with abstention,au-PRC (weighted OvO) per fold with abstention,au-PRC (macro OvO) per fold with abstention,Accuracy global with abstention,MCC global with abstention,Unknown/abstention proportion global with abstention,Abstention label global with abstention,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
lasso_multiclass,0.624 +/- 0.021 (in 3 folds),0.604 +/- 0.014 (in 3 folds),0.691 +/- 0.012 (in 3 folds),0.675 +/- 0.013 (in 3 folds),0.324 +/- 0.035 (in 3 folds),0.250 +/- 0.044 (in 3 folds),0.325,0.194,0.322 +/- 0.039 (in 3 folds),0.248 +/- 0.043 (in 3 folds),0.026 +/- 0.000 (in 1 folds),0.632 +/- 0.021 (in 2 folds),0.612 +/- 0.000 (in 2 folds),0.697 +/- 0.006 (in 2 folds),0.680 +/- 0.013 (in 2 folds),0.322,0.193,0.009,Unknown,114.0,1.0,115.0,0.008696,True
lasso_cv,0.619 +/- 0.035 (in 3 folds),0.604 +/- 0.031 (in 3 folds),0.692 +/- 0.014 (in 3 folds),0.681 +/- 0.011 (in 3 folds),0.298 +/- 0.053 (in 3 folds),0.253 +/- 0.029 (in 3 folds),0.298,0.184,0.296 +/- 0.057 (in 3 folds),0.249 +/- 0.034 (in 3 folds),0.026 +/- 0.000 (in 1 folds),0.624 +/- 0.048 (in 2 folds),0.610 +/- 0.041 (in 2 folds),0.694 +/- 0.020 (in 2 folds),0.684 +/- 0.013 (in 2 folds),0.296,0.183,0.009,Unknown,114.0,1.0,115.0,0.008696,True
rf_multiclass,0.615 +/- 0.026 (in 3 folds),0.598 +/- 0.030 (in 3 folds),0.657 +/- 0.011 (in 3 folds),0.644 +/- 0.015 (in 3 folds),0.324 +/- 0.009 (in 3 folds),0.230 +/- 0.005 (in 3 folds),0.325,0.18,0.322 +/- 0.013 (in 3 folds),0.228 +/- 0.006 (in 3 folds),0.026 +/- 0.000 (in 1 folds),0.629 +/- 0.012 (in 2 folds),0.611 +/- 0.027 (in 2 folds),0.663 +/- 0.006 (in 2 folds),0.650 +/- 0.016 (in 2 folds),0.322,0.179,0.009,Unknown,114.0,1.0,115.0,0.008696,True
xgboost,0.606 +/- 0.062 (in 3 folds),0.581 +/- 0.065 (in 3 folds),0.660 +/- 0.051 (in 3 folds),0.646 +/- 0.060 (in 3 folds),0.357 +/- 0.035 (in 3 folds),0.228 +/- 0.062 (in 3 folds),0.355,0.217,0.331 +/- 0.022 (in 3 folds),0.206 +/- 0.035 (in 3 folds),0.103 +/- 0.073 (in 2 folds),0.655 +/- 0.000 (in 1 folds),0.647 +/- 0.000 (in 1 folds),0.715 +/- 0.000 (in 1 folds),0.713 +/- 0.000 (in 1 folds),0.33,0.2,0.07,Unknown,107.0,8.0,115.0,0.069565,True
linearsvm_ovr,0.604 +/- 0.010 (in 3 folds),0.580 +/- 0.022 (in 3 folds),0.664 +/- 0.031 (in 3 folds),0.646 +/- 0.040 (in 3 folds),0.355 +/- 0.040 (in 3 folds),0.240 +/- 0.050 (in 3 folds),0.355,0.213,0.339 +/- 0.018 (in 3 folds),0.226 +/- 0.036 (in 3 folds),0.064 +/- 0.054 (in 2 folds),0.602 +/- 0.000 (in 1 folds),0.587 +/- 0.000 (in 1 folds),0.678 +/- 0.000 (in 1 folds),0.666 +/- 0.000 (in 1 folds),0.339,0.204,0.043,Unknown,110.0,5.0,115.0,0.043478,True
ridge_cv,0.599 +/- 0.056 (in 3 folds),0.570 +/- 0.044 (in 3 folds),0.659 +/- 0.017 (in 3 folds),0.639 +/- 0.015 (in 3 folds),0.253 +/- 0.061 (in 3 folds),0.109 +/- 0.116 (in 3 folds),0.25,0.077,0.235 +/- 0.049 (in 3 folds),0.138 +/- 0.082 (in 3 folds),0.090 +/- 0.091 (in 2 folds),0.541 +/- 0.000 (in 1 folds),0.521 +/- 0.000 (in 1 folds),0.640 +/- 0.000 (in 1 folds),0.625 +/- 0.000 (in 1 folds),0.235,0.078,0.061,Unknown,108.0,7.0,115.0,0.06087,True
elasticnet_cv,0.598 +/- 0.010 (in 3 folds),0.580 +/- 0.015 (in 3 folds),0.661 +/- 0.023 (in 3 folds),0.648 +/- 0.028 (in 3 folds),0.281 +/- 0.084 (in 3 folds),0.248 +/- 0.092 (in 3 folds),0.281,0.147,0.279 +/- 0.086 (in 3 folds),0.246 +/- 0.096 (in 3 folds),0.026 +/- 0.000 (in 1 folds),0.594 +/- 0.009 (in 2 folds),0.573 +/- 0.011 (in 2 folds),0.648 +/- 0.006 (in 2 folds),0.632 +/- 0.008 (in 2 folds),0.278,0.144,0.009,Unknown,114.0,1.0,115.0,0.008696,True
dummy_stratified,0.526 +/- 0.011 (in 3 folds),0.527 +/- 0.009 (in 3 folds),0.539 +/- 0.005 (in 3 folds),0.540 +/- 0.004 (in 3 folds),0.213 +/- 0.028 (in 3 folds),0.054 +/- 0.033 (in 3 folds),0.212,0.047,0.209 +/- 0.032 (in 3 folds),0.056 +/- 0.031 (in 3 folds),0.051 +/- 0.000 (in 1 folds),0.528 +/- 0.014 (in 2 folds),0.526 +/- 0.012 (in 2 folds),0.540 +/- 0.006 (in 2 folds),0.538 +/- 0.004 (in 2 folds),0.209,0.048,0.017,Unknown,113.0,2.0,115.0,0.017391,False
dummy_most_frequent,0.500 +/- 0.000 (in 3 folds),0.500 +/- 0.000 (in 3 folds),0.500 +/- 0.000 (in 3 folds),0.500 +/- 0.000 (in 3 folds),0.229 +/- 0.064 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.226,0.035,0.208 +/- 0.042 (in 3 folds),0.042 +/- 0.043 (in 3 folds),0.115 +/- 0.054 (in 2 folds),0.500 +/- 0.000 (in 1 folds),0.500 +/- 0.000 (in 1 folds),0.500 +/- 0.000 (in 1 folds),0.500 +/- 0.000 (in 1 folds),0.209,0.032,0.078,Unknown,106.0,9.0,115.0,0.078261,True
"All results, sorted",,,,,,,,,,,,,,,,,,,,,,,,

Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,Accuracy per fold with abstention,MCC per fold with abstention,Unknown/abstention proportion per fold with abstention,ROC-AUC (weighted OvO) per fold with abstention,ROC-AUC (macro OvO) per fold with abstention,au-PRC (weighted OvO) per fold with abstention,au-PRC (macro OvO) per fold with abstention,Accuracy global with abstention,MCC global with abstention,Unknown/abstention proportion global with abstention,Abstention label global with abstention,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
lasso_multiclass,0.624 +/- 0.021 (in 3 folds),0.604 +/- 0.014 (in 3 folds),0.691 +/- 0.012 (in 3 folds),0.675 +/- 0.013 (in 3 folds),0.324 +/- 0.035 (in 3 folds),0.250 +/- 0.044 (in 3 folds),0.325,0.194,0.322 +/- 0.039 (in 3 folds),0.248 +/- 0.043 (in 3 folds),0.026 +/- 0.000 (in 1 folds),0.632 +/- 0.021 (in 2 folds),0.612 +/- 0.000 (in 2 folds),0.697 +/- 0.006 (in 2 folds),0.680 +/- 0.013 (in 2 folds),0.322,0.193,0.009,Unknown,114,1,115,0.008696,True
lasso_cv,0.619 +/- 0.035 (in 3 folds),0.604 +/- 0.031 (in 3 folds),0.692 +/- 0.014 (in 3 folds),0.681 +/- 0.011 (in 3 folds),0.298 +/- 0.053 (in 3 folds),0.253 +/- 0.029 (in 3 folds),0.298,0.184,0.296 +/- 0.057 (in 3 folds),0.249 +/- 0.034 (in 3 folds),0.026 +/- 0.000 (in 1 folds),0.624 +/- 0.048 (in 2 folds),0.610 +/- 0.041 (in 2 folds),0.694 +/- 0.020 (in 2 folds),0.684 +/- 0.013 (in 2 folds),0.296,0.183,0.009,Unknown,114,1,115,0.008696,True
rf_multiclass,0.615 +/- 0.026 (in 3 folds),0.598 +/- 0.030 (in 3 folds),0.657 +/- 0.011 (in 3 folds),0.644 +/- 0.015 (in 3 folds),0.324 +/- 0.009 (in 3 folds),0.230 +/- 0.005 (in 3 folds),0.325,0.18,0.322 +/- 0.013 (in 3 folds),0.228 +/- 0.006 (in 3 folds),0.026 +/- 0.000 (in 1 folds),0.629 +/- 0.012 (in 2 folds),0.611 +/- 0.027 (in 2 folds),0.663 +/- 0.006 (in 2 folds),0.650 +/- 0.016 (in 2 folds),0.322,0.179,0.009,Unknown,114,1,115,0.008696,True
xgboost,0.606 +/- 0.062 (in 3 folds),0.581 +/- 0.065 (in 3 folds),0.660 +/- 0.051 (in 3 folds),0.646 +/- 0.060 (in 3 folds),0.357 +/- 0.035 (in 3 folds),0.228 +/- 0.062 (in 3 folds),0.355,0.217,0.331 +/- 0.022 (in 3 folds),0.206 +/- 0.035 (in 3 folds),0.103 +/- 0.073 (in 2 folds),0.655 +/- 0.000 (in 1 folds),0.647 +/- 0.000 (in 1 folds),0.715 +/- 0.000 (in 1 folds),0.713 +/- 0.000 (in 1 folds),0.33,0.2,0.07,Unknown,107,8,115,0.069565,True
linearsvm_ovr,0.604 +/- 0.010 (in 3 folds),0.580 +/- 0.022 (in 3 folds),0.664 +/- 0.031 (in 3 folds),0.646 +/- 0.040 (in 3 folds),0.355 +/- 0.040 (in 3 folds),0.240 +/- 0.050 (in 3 folds),0.355,0.213,0.339 +/- 0.018 (in 3 folds),0.226 +/- 0.036 (in 3 folds),0.064 +/- 0.054 (in 2 folds),0.602 +/- 0.000 (in 1 folds),0.587 +/- 0.000 (in 1 folds),0.678 +/- 0.000 (in 1 folds),0.666 +/- 0.000 (in 1 folds),0.339,0.204,0.043,Unknown,110,5,115,0.043478,True
ridge_cv,0.599 +/- 0.056 (in 3 folds),0.570 +/- 0.044 (in 3 folds),0.659 +/- 0.017 (in 3 folds),0.639 +/- 0.015 (in 3 folds),0.253 +/- 0.061 (in 3 folds),0.109 +/- 0.116 (in 3 folds),0.25,0.077,0.235 +/- 0.049 (in 3 folds),0.138 +/- 0.082 (in 3 folds),0.090 +/- 0.091 (in 2 folds),0.541 +/- 0.000 (in 1 folds),0.521 +/- 0.000 (in 1 folds),0.640 +/- 0.000 (in 1 folds),0.625 +/- 0.000 (in 1 folds),0.235,0.078,0.061,Unknown,108,7,115,0.06087,True
elasticnet_cv,0.598 +/- 0.010 (in 3 folds),0.580 +/- 0.015 (in 3 folds),0.661 +/- 0.023 (in 3 folds),0.648 +/- 0.028 (in 3 folds),0.281 +/- 0.084 (in 3 folds),0.248 +/- 0.092 (in 3 folds),0.281,0.147,0.279 +/- 0.086 (in 3 folds),0.246 +/- 0.096 (in 3 folds),0.026 +/- 0.000 (in 1 folds),0.594 +/- 0.009 (in 2 folds),0.573 +/- 0.011 (in 2 folds),0.648 +/- 0.006 (in 2 folds),0.632 +/- 0.008 (in 2 folds),0.278,0.144,0.009,Unknown,114,1,115,0.008696,True
dummy_stratified,0.526 +/- 0.011 (in 3 folds),0.527 +/- 0.009 (in 3 folds),0.539 +/- 0.005 (in 3 folds),0.540 +/- 0.004 (in 3 folds),0.213 +/- 0.028 (in 3 folds),0.054 +/- 0.033 (in 3 folds),0.212,0.047,0.209 +/- 0.032 (in 3 folds),0.056 +/- 0.031 (in 3 folds),0.051 +/- 0.000 (in 1 folds),0.528 +/- 0.014 (in 2 folds),0.526 +/- 0.012 (in 2 folds),0.540 +/- 0.006 (in 2 folds),0.538 +/- 0.004 (in 2 folds),0.209,0.048,0.017,Unknown,113,2,115,0.017391,False
dummy_most_frequent,0.500 +/- 0.000 (in 3 folds),0.500 +/- 0.000 (in 3 folds),0.500 +/- 0.000 (in 3 folds),0.500 +/- 0.000 (in 3 folds),0.229 +/- 0.064 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.226,0.035,0.208 +/- 0.042 (in 3 folds),0.042 +/- 0.043 (in 3 folds),0.115 +/- 0.054 (in 2 folds),0.500 +/- 0.000 (in 1 folds),0.500 +/- 0.000 (in 1 folds),0.500 +/- 0.000 (in 1 folds),0.500 +/- 0.000 (in 1 folds),0.209,0.032,0.078,Unknown,106,9,115,0.078261,True


lasso_multiclass,lasso_cv,rf_multiclass,xgboost
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.624 +/- 0.021 (in 3 folds) ROC-AUC (macro OvO): 0.604 +/- 0.014 (in 3 folds) au-PRC (weighted OvO): 0.691 +/- 0.012 (in 3 folds) au-PRC (macro OvO): 0.675 +/- 0.013 (in 3 folds) Accuracy: 0.324 +/- 0.035 (in 3 folds) MCC: 0.250 +/- 0.044 (in 3 folds) Global scores without abstention: Accuracy: 0.325 MCC: 0.194 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.322 +/- 0.039 (in 3 folds) MCC: 0.248 +/- 0.043 (in 3 folds) Unknown/abstention proportion: 0.026 +/- 0.000 (in 1 folds) ROC-AUC (weighted OvO): 0.632 +/- 0.021 (in 2 folds) ROC-AUC (macro OvO): 0.612 +/- 0.000 (in 2 folds) au-PRC (weighted OvO): 0.697 +/- 0.006 (in 2 folds) au-PRC (macro OvO): 0.680 +/- 0.013 (in 2 folds) Global scores with abstention: Accuracy: 0.322 MCC: 0.193 Unknown/abstention proportion: 0.009 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  20-30 0.44 0.32 0.37 22  30-40 0.06 0.07 0.06 14  40-50 0.10 0.07 0.08 15  50-60 0.33 0.35 0.34 23  60-70 0.17 0.33 0.23 15  70-80 0.00 0.00 0.00 2  <20 0.88 0.62 0.73 24  Unknown 0.00 0.00 0.00 0  accuracy 0.32 115  macro avg 0.25 0.22 0.23 115 weighted avg 0.38 0.32 0.34 115,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.619 +/- 0.035 (in 3 folds) ROC-AUC (macro OvO): 0.604 +/- 0.031 (in 3 folds) au-PRC (weighted OvO): 0.692 +/- 0.014 (in 3 folds) au-PRC (macro OvO): 0.681 +/- 0.011 (in 3 folds) Accuracy: 0.298 +/- 0.053 (in 3 folds) MCC: 0.253 +/- 0.029 (in 3 folds) Global scores without abstention: Accuracy: 0.298 MCC: 0.184 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.296 +/- 0.057 (in 3 folds) MCC: 0.249 +/- 0.034 (in 3 folds) Unknown/abstention proportion: 0.026 +/- 0.000 (in 1 folds) ROC-AUC (weighted OvO): 0.624 +/- 0.048 (in 2 folds) ROC-AUC (macro OvO): 0.610 +/- 0.041 (in 2 folds) 
au-PRC (weighted OvO): 0.694 +/- 0.020 (in 2 folds) au-PRC (macro OvO): 0.684 +/- 0.013 (in 2 folds) Global scores with abstention: Accuracy: 0.296 MCC: 0.183 Unknown/abstention proportion: 0.009 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  20-30 0.60 0.14 0.22 22  30-40 0.00 0.00 0.00 14  40-50 0.14 0.07 0.09 15  50-60 0.23 0.30 0.26 23  60-70 0.18 0.67 0.28 15  70-80 0.00 0.00 0.00 2  <20 0.93 0.54 0.68 24  Unknown 0.00 0.00 0.00 0  accuracy 0.30 115  macro avg 0.26 0.21 0.19 115 weighted avg 0.40 0.30 0.29 115,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.615 +/- 0.026 (in 3 folds) ROC-AUC (macro OvO): 0.598 +/- 0.030 (in 3 folds) au-PRC (weighted OvO): 0.657 +/- 0.011 (in 3 folds) au-PRC (macro OvO): 0.644 +/- 0.015 (in 3 folds) Accuracy: 0.324 +/- 0.009 (in 3 folds) MCC: 0.230 +/- 0.005 (in 3 folds) Global scores without abstention: Accuracy: 0.325 MCC: 0.180 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.322 +/- 0.013 (in 3 folds) MCC: 0.228 +/- 0.006 (in 3 folds) Unknown/abstention proportion: 0.026 +/- 0.000 (in 1 folds) ROC-AUC (weighted OvO): 0.629 +/- 0.012 (in 2 folds) ROC-AUC (macro OvO): 0.611 +/- 0.027 (in 2 folds) au-PRC (weighted OvO): 0.663 +/- 0.006 (in 2 folds) au-PRC (macro OvO): 0.650 +/- 0.016 (in 2 folds) Global scores with abstention: Accuracy: 0.322 MCC: 0.179 Unknown/abstention proportion: 0.009 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  20-30 0.26 0.41 0.32 22  30-40 0.00 0.00 0.00 14  40-50 0.25 0.07 0.11 15  50-60 0.26 0.35 0.30 23  60-70 0.15 0.20 0.17 15  70-80 0.00 0.00 0.00 2  <20 0.94 0.67 0.78 24  Unknown 0.00 0.00 0.00 0  accuracy 0.32 115  macro avg 0.23 0.21 0.21 115 weighted avg 0.35 0.32 0.32 115,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.606 +/- 0.062 (in 3 folds) ROC-AUC (macro OvO): 0.581 +/- 0.065 
(in 3 folds) au-PRC (weighted OvO): 0.660 +/- 0.051 (in 3 folds) au-PRC (macro OvO): 0.646 +/- 0.060 (in 3 folds) Accuracy: 0.357 +/- 0.035 (in 3 folds) MCC: 0.228 +/- 0.062 (in 3 folds) Global scores without abstention: Accuracy: 0.355 MCC: 0.217 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.331 +/- 0.022 (in 3 folds) MCC: 0.206 +/- 0.035 (in 3 folds) Unknown/abstention proportion: 0.103 +/- 0.073 (in 2 folds) ROC-AUC (weighted OvO): 0.655 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.647 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.715 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.713 +/- 0.000 (in 1 folds) Global scores with abstention: Accuracy: 0.330 MCC: 0.200 Unknown/abstention proportion: 0.070 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  20-30 0.24 0.27 0.26 22  30-40 0.11 0.07 0.09 14  40-50 0.00 0.00 0.00 15  50-60 0.30 0.43 0.36 23  60-70 0.31 0.27 0.29 15  70-80 0.00 0.00 0.00 2  <20 0.94 0.71 0.81 24  Unknown 0.00 0.00 0.00 0  accuracy 0.33 115  macro avg 0.24 0.22 0.22 115 weighted avg 0.36 0.33 0.34 115
,,,


linearsvm_ovr,ridge_cv,elasticnet_cv,dummy_stratified
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.604 +/- 0.010 (in 3 folds) ROC-AUC (macro OvO): 0.580 +/- 0.022 (in 3 folds) au-PRC (weighted OvO): 0.664 +/- 0.031 (in 3 folds) au-PRC (macro OvO): 0.646 +/- 0.040 (in 3 folds) Accuracy: 0.355 +/- 0.040 (in 3 folds) MCC: 0.240 +/- 0.050 (in 3 folds) Global scores without abstention: Accuracy: 0.355 MCC: 0.213 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.339 +/- 0.018 (in 3 folds) MCC: 0.226 +/- 0.036 (in 3 folds) Unknown/abstention proportion: 0.064 +/- 0.054 (in 2 folds) ROC-AUC (weighted OvO): 0.602 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.587 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.678 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.666 +/- 0.000 (in 1 folds) Global scores with abstention: Accuracy: 0.339 MCC: 0.204 Unknown/abstention proportion: 0.043 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  20-30 0.41 0.50 0.45 22  30-40 0.00 0.00 0.00 14  40-50 0.00 0.00 0.00 15  50-60 0.27 0.30 0.29 23  60-70 0.10 0.13 0.11 15  70-80 0.00 0.00 0.00 2  <20 0.70 0.79 0.75 24  Unknown 0.00 0.00 0.00 0  accuracy 0.34 115  macro avg 0.19 0.22 0.20 115 weighted avg 0.29 0.34 0.31 115,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.599 +/- 0.056 (in 3 folds) ROC-AUC (macro OvO): 0.570 +/- 0.044 (in 3 folds) au-PRC (weighted OvO): 0.659 +/- 0.017 (in 3 folds) au-PRC (macro OvO): 0.639 +/- 0.015 (in 3 folds) Accuracy: 0.253 +/- 0.061 (in 3 folds) MCC: 0.109 +/- 0.116 (in 3 folds) Global scores without abstention: Accuracy: 0.250 MCC: 0.077 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.235 +/- 0.049 (in 3 folds) MCC: 0.138 +/- 0.082 (in 3 folds) Unknown/abstention proportion: 0.090 +/- 0.091 (in 2 folds) ROC-AUC (weighted OvO): 0.541 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.521 +/- 0.000 (in 1 folds) 
au-PRC (weighted OvO): 0.640 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.625 +/- 0.000 (in 1 folds) Global scores with abstention: Accuracy: 0.235 MCC: 0.078 Unknown/abstention proportion: 0.061 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  20-30 0.45 0.23 0.30 22  30-40 0.00 0.00 0.00 14  40-50 0.00 0.00 0.00 15  50-60 0.21 0.30 0.25 23  60-70 0.07 0.13 0.10 15  70-80 0.00 0.00 0.00 2  <20 0.36 0.54 0.43 24  Unknown 0.00 0.00 0.00 0  accuracy 0.23 115  macro avg 0.14 0.15 0.13 115 weighted avg 0.21 0.23 0.21 115,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.598 +/- 0.010 (in 3 folds) ROC-AUC (macro OvO): 0.580 +/- 0.015 (in 3 folds) au-PRC (weighted OvO): 0.661 +/- 0.023 (in 3 folds) au-PRC (macro OvO): 0.648 +/- 0.028 (in 3 folds) Accuracy: 0.281 +/- 0.084 (in 3 folds) MCC: 0.248 +/- 0.092 (in 3 folds) Global scores without abstention: Accuracy: 0.281 MCC: 0.147 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.279 +/- 0.086 (in 3 folds) MCC: 0.246 +/- 0.096 (in 3 folds) Unknown/abstention proportion: 0.026 +/- 0.000 (in 1 folds) ROC-AUC (weighted OvO): 0.594 +/- 0.009 (in 2 folds) ROC-AUC (macro OvO): 0.573 +/- 0.011 (in 2 folds) au-PRC (weighted OvO): 0.648 +/- 0.006 (in 2 folds) au-PRC (macro OvO): 0.632 +/- 0.008 (in 2 folds) Global scores with abstention: Accuracy: 0.278 MCC: 0.144 Unknown/abstention proportion: 0.009 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  20-30 0.62 0.23 0.33 22  30-40 0.00 0.00 0.00 14  40-50 0.12 0.20 0.15 15  50-60 0.22 0.30 0.25 23  60-70 0.12 0.27 0.17 15  70-80 0.00 0.00 0.00 2  <20 0.87 0.54 0.67 24  Unknown 0.00 0.00 0.00 0  accuracy 0.28 115  macro avg 0.24 0.19 0.20 115 weighted avg 0.38 0.28 0.29 115,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.526 +/- 0.011 (in 3 folds) ROC-AUC (macro OvO): 0.527 +/- 0.009 
(in 3 folds) au-PRC (weighted OvO): 0.539 +/- 0.005 (in 3 folds) au-PRC (macro OvO): 0.540 +/- 0.004 (in 3 folds) Accuracy: 0.213 +/- 0.028 (in 3 folds) MCC: 0.054 +/- 0.033 (in 3 folds) Global scores without abstention: Accuracy: 0.212 MCC: 0.047 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.209 +/- 0.032 (in 3 folds) MCC: 0.056 +/- 0.031 (in 3 folds) Unknown/abstention proportion: 0.051 +/- 0.000 (in 1 folds) ROC-AUC (weighted OvO): 0.528 +/- 0.014 (in 2 folds) ROC-AUC (macro OvO): 0.526 +/- 0.012 (in 2 folds) au-PRC (weighted OvO): 0.540 +/- 0.006 (in 2 folds) au-PRC (macro OvO): 0.538 +/- 0.004 (in 2 folds) Global scores with abstention: Accuracy: 0.209 MCC: 0.048 Unknown/abstention proportion: 0.017 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  20-30 0.29 0.18 0.22 22  30-40 0.07 0.07 0.07 14  40-50 0.43 0.20 0.27 15  50-60 0.25 0.35 0.29 23  60-70 0.14 0.20 0.17 15  70-80 0.00 0.00 0.00 2  <20 0.21 0.21 0.21 24  Unknown 0.00 0.00 0.00 0  accuracy 0.21 115  macro avg 0.17 0.15 0.15 115 weighted avg 0.23 0.21 0.21 115
,,,


dummy_most_frequent
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.500 +/- 0.000 (in 3 folds) ROC-AUC (macro OvO): 0.500 +/- 0.000 (in 3 folds) au-PRC (weighted OvO): 0.500 +/- 0.000 (in 3 folds) au-PRC (macro OvO): 0.500 +/- 0.000 (in 3 folds) Accuracy: 0.229 +/- 0.064 (in 3 folds) MCC: 0.000 +/- 0.000 (in 3 folds) Global scores without abstention: Accuracy: 0.226 MCC: 0.035 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.208 +/- 0.042 (in 3 folds) MCC: 0.042 +/- 0.043 (in 3 folds) Unknown/abstention proportion: 0.115 +/- 0.054 (in 2 folds) ROC-AUC (weighted OvO): 0.500 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.500 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.500 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.500 +/- 0.000 (in 1 folds) Global scores with abstention: Accuracy: 0.209 MCC: 0.032 Unknown/abstention proportion: 0.078 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  20-30 0.19 0.32 0.24 22  30-40 0.00 0.00 0.00 14  40-50 0.00 0.00 0.00 15  50-60 0.19 0.30 0.23 23  60-70 0.00 0.00 0.00 15  70-80 0.00 0.00 0.00 2  <20 0.30 0.42 0.35 24  Unknown 0.00 0.00 0.00 0  accuracy 0.21 115  macro avg 0.09 0.13 0.10 115 weighted avg 0.14 0.21 0.17 115


## Apply train-smaller model -- Test set performance - With and without tuning on validation set

Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes,ROC-AUC (weighted OvO) per fold with abstention,ROC-AUC (macro OvO) per fold with abstention,au-PRC (weighted OvO) per fold with abstention,au-PRC (macro OvO) per fold with abstention,Accuracy per fold with abstention,MCC per fold with abstention,Unknown/abstention proportion per fold with abstention,Accuracy global with abstention,MCC global with abstention,Unknown/abstention proportion global with abstention,Abstention label global with abstention
rf_multiclass,0.664 +/- 0.011 (in 3 folds),0.658 +/- 0.004 (in 3 folds),0.682 +/- 0.014 (in 3 folds),0.674 +/- 0.022 (in 3 folds),0.353 +/- 0.041 (in 3 folds),0.278 +/- 0.012 (in 3 folds),0.352,0.216,165.0,0.0,165.0,0.0,True,,,,,,,,,,,
rf_multiclass.decision_thresholds_tuned,0.664 +/- 0.011 (in 3 folds),0.658 +/- 0.004 (in 3 folds),0.682 +/- 0.014 (in 3 folds),0.674 +/- 0.022 (in 3 folds),0.284 +/- 0.019 (in 3 folds),0.235 +/- 0.058 (in 3 folds),0.285,0.147,165.0,0.0,165.0,0.0,True,,,,,,,,,,,
elasticnet_cv,0.642 +/- 0.015 (in 3 folds),0.624 +/- 0.027 (in 3 folds),0.666 +/- 0.031 (in 3 folds),0.652 +/- 0.041 (in 3 folds),0.216 +/- 0.074 (in 3 folds),0.189 +/- 0.093 (in 3 folds),0.212,0.053,165.0,0.0,165.0,0.0,True,,,,,,,,,,,
elasticnet_cv.decision_thresholds_tuned,0.642 +/- 0.015 (in 3 folds),0.624 +/- 0.027 (in 3 folds),0.666 +/- 0.031 (in 3 folds),0.652 +/- 0.041 (in 3 folds),0.367 +/- 0.064 (in 3 folds),0.254 +/- 0.090 (in 3 folds),0.364,0.223,165.0,0.0,165.0,0.0,True,,,,,,,,,,,
ridge_cv,0.640 +/- 0.042 (in 3 folds),0.623 +/- 0.027 (in 3 folds),0.664 +/- 0.007 (in 3 folds),0.650 +/- 0.014 (in 3 folds),0.186 +/- 0.038 (in 3 folds),0.105 +/- 0.112 (in 3 folds),0.182,-0.004,159.0,6.0,165.0,0.036364,True,0.629 +/- 0.052 (in 2 folds),0.615 +/- 0.033 (in 2 folds),0.660 +/- 0.003 (in 2 folds),0.647 +/- 0.019 (in 2 folds),0.177 +/- 0.024 (in 3 folds),0.124 +/- 0.087 (in 3 folds),0.120 +/- 0.000 (in 1 folds),0.176,-0.004,0.036,Unknown
ridge_cv.decision_thresholds_tuned,0.640 +/- 0.042 (in 3 folds),0.623 +/- 0.027 (in 3 folds),0.664 +/- 0.007 (in 3 folds),0.650 +/- 0.014 (in 3 folds),0.296 +/- 0.060 (in 3 folds),0.137 +/- 0.119 (in 3 folds),0.302,0.148,159.0,6.0,165.0,0.036364,True,0.629 +/- 0.052 (in 2 folds),0.615 +/- 0.033 (in 2 folds),0.660 +/- 0.003 (in 2 folds),0.647 +/- 0.019 (in 2 folds),0.287 +/- 0.076 (in 3 folds),0.157 +/- 0.085 (in 3 folds),0.120 +/- 0.000 (in 1 folds),0.291,0.145,0.036,Unknown
lasso_cv,0.637 +/- 0.024 (in 3 folds),0.619 +/- 0.010 (in 3 folds),0.670 +/- 0.018 (in 3 folds),0.657 +/- 0.027 (in 3 folds),0.227 +/- 0.046 (in 3 folds),0.210 +/- 0.030 (in 3 folds),0.224,0.073,165.0,0.0,165.0,0.0,True,,,,,,,,,,,
lasso_cv.decision_thresholds_tuned,0.637 +/- 0.024 (in 3 folds),0.619 +/- 0.010 (in 3 folds),0.670 +/- 0.018 (in 3 folds),0.657 +/- 0.027 (in 3 folds),0.344 +/- 0.102 (in 3 folds),0.271 +/- 0.092 (in 3 folds),0.339,0.213,165.0,0.0,165.0,0.0,True,,,,,,,,,,,
linearsvm_ovr,0.623 +/- 0.054 (in 3 folds),0.605 +/- 0.057 (in 3 folds),0.661 +/- 0.052 (in 3 folds),0.648 +/- 0.056 (in 3 folds),0.344 +/- 0.053 (in 3 folds),0.252 +/- 0.030 (in 3 folds),0.34,0.195,162.0,3.0,165.0,0.018182,True,0.597 +/- 0.044 (in 2 folds),0.583 +/- 0.059 (in 2 folds),0.638 +/- 0.047 (in 2 folds),0.626 +/- 0.058 (in 2 folds),0.336 +/- 0.039 (in 3 folds),0.246 +/- 0.026 (in 3 folds),0.060 +/- 0.000 (in 1 folds),0.333,0.192,0.018,Unknown
linearsvm_ovr.decision_thresholds_tuned,0.623 +/- 0.054 (in 3 folds),0.605 +/- 0.057 (in 3 folds),0.661 +/- 0.052 (in 3 folds),0.648 +/- 0.056 (in 3 folds),0.368 +/- 0.081 (in 3 folds),0.261 +/- 0.056 (in 3 folds),0.364,0.237,162.0,3.0,165.0,0.018182,True,0.597 +/- 0.044 (in 2 folds),0.583 +/- 0.059 (in 2 folds),0.638 +/- 0.047 (in 2 folds),0.626 +/- 0.058 (in 2 folds),0.360 +/- 0.068 (in 3 folds),0.256 +/- 0.050 (in 3 folds),0.060 +/- 0.000 (in 1 folds),0.358,0.231,0.018,Unknown

Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes,ROC-AUC (weighted OvO) per fold with abstention,ROC-AUC (macro OvO) per fold with abstention,au-PRC (weighted OvO) per fold with abstention,au-PRC (macro OvO) per fold with abstention,Accuracy per fold with abstention,MCC per fold with abstention,Unknown/abstention proportion per fold with abstention,Accuracy global with abstention,MCC global with abstention,Unknown/abstention proportion global with abstention,Abstention label global with abstention
rf_multiclass,0.664 +/- 0.011 (in 3 folds),0.658 +/- 0.004 (in 3 folds),0.682 +/- 0.014 (in 3 folds),0.674 +/- 0.022 (in 3 folds),0.353 +/- 0.041 (in 3 folds),0.278 +/- 0.012 (in 3 folds),0.352,0.216,165,0,165,0.0,True,,,,,,,,,,,
rf_multiclass.decision_thresholds_tuned,0.664 +/- 0.011 (in 3 folds),0.658 +/- 0.004 (in 3 folds),0.682 +/- 0.014 (in 3 folds),0.674 +/- 0.022 (in 3 folds),0.284 +/- 0.019 (in 3 folds),0.235 +/- 0.058 (in 3 folds),0.285,0.147,165,0,165,0.0,True,,,,,,,,,,,
elasticnet_cv,0.642 +/- 0.015 (in 3 folds),0.624 +/- 0.027 (in 3 folds),0.666 +/- 0.031 (in 3 folds),0.652 +/- 0.041 (in 3 folds),0.216 +/- 0.074 (in 3 folds),0.189 +/- 0.093 (in 3 folds),0.212,0.053,165,0,165,0.0,True,,,,,,,,,,,
elasticnet_cv.decision_thresholds_tuned,0.642 +/- 0.015 (in 3 folds),0.624 +/- 0.027 (in 3 folds),0.666 +/- 0.031 (in 3 folds),0.652 +/- 0.041 (in 3 folds),0.367 +/- 0.064 (in 3 folds),0.254 +/- 0.090 (in 3 folds),0.364,0.223,165,0,165,0.0,True,,,,,,,,,,,
ridge_cv,0.640 +/- 0.042 (in 3 folds),0.623 +/- 0.027 (in 3 folds),0.664 +/- 0.007 (in 3 folds),0.650 +/- 0.014 (in 3 folds),0.186 +/- 0.038 (in 3 folds),0.105 +/- 0.112 (in 3 folds),0.182,-0.004,159,6,165,0.036364,True,0.629 +/- 0.052 (in 2 folds),0.615 +/- 0.033 (in 2 folds),0.660 +/- 0.003 (in 2 folds),0.647 +/- 0.019 (in 2 folds),0.177 +/- 0.024 (in 3 folds),0.124 +/- 0.087 (in 3 folds),0.120 +/- 0.000 (in 1 folds),0.176,-0.004,0.036,Unknown
ridge_cv.decision_thresholds_tuned,0.640 +/- 0.042 (in 3 folds),0.623 +/- 0.027 (in 3 folds),0.664 +/- 0.007 (in 3 folds),0.650 +/- 0.014 (in 3 folds),0.296 +/- 0.060 (in 3 folds),0.137 +/- 0.119 (in 3 folds),0.302,0.148,159,6,165,0.036364,True,0.629 +/- 0.052 (in 2 folds),0.615 +/- 0.033 (in 2 folds),0.660 +/- 0.003 (in 2 folds),0.647 +/- 0.019 (in 2 folds),0.287 +/- 0.076 (in 3 folds),0.157 +/- 0.085 (in 3 folds),0.120 +/- 0.000 (in 1 folds),0.291,0.145,0.036,Unknown
lasso_cv,0.637 +/- 0.024 (in 3 folds),0.619 +/- 0.010 (in 3 folds),0.670 +/- 0.018 (in 3 folds),0.657 +/- 0.027 (in 3 folds),0.227 +/- 0.046 (in 3 folds),0.210 +/- 0.030 (in 3 folds),0.224,0.073,165,0,165,0.0,True,,,,,,,,,,,
lasso_cv.decision_thresholds_tuned,0.637 +/- 0.024 (in 3 folds),0.619 +/- 0.010 (in 3 folds),0.670 +/- 0.018 (in 3 folds),0.657 +/- 0.027 (in 3 folds),0.344 +/- 0.102 (in 3 folds),0.271 +/- 0.092 (in 3 folds),0.339,0.213,165,0,165,0.0,True,,,,,,,,,,,
linearsvm_ovr,0.623 +/- 0.054 (in 3 folds),0.605 +/- 0.057 (in 3 folds),0.661 +/- 0.052 (in 3 folds),0.648 +/- 0.056 (in 3 folds),0.344 +/- 0.053 (in 3 folds),0.252 +/- 0.030 (in 3 folds),0.34,0.195,162,3,165,0.018182,True,0.597 +/- 0.044 (in 2 folds),0.583 +/- 0.059 (in 2 folds),0.638 +/- 0.047 (in 2 folds),0.626 +/- 0.058 (in 2 folds),0.336 +/- 0.039 (in 3 folds),0.246 +/- 0.026 (in 3 folds),0.060 +/- 0.000 (in 1 folds),0.333,0.192,0.018,Unknown
linearsvm_ovr.decision_thresholds_tuned,0.623 +/- 0.054 (in 3 folds),0.605 +/- 0.057 (in 3 folds),0.661 +/- 0.052 (in 3 folds),0.648 +/- 0.056 (in 3 folds),0.368 +/- 0.081 (in 3 folds),0.261 +/- 0.056 (in 3 folds),0.364,0.237,162,3,165,0.018182,True,0.597 +/- 0.044 (in 2 folds),0.583 +/- 0.059 (in 2 folds),0.638 +/- 0.047 (in 2 folds),0.626 +/- 0.058 (in 2 folds),0.360 +/- 0.068 (in 3 folds),0.256 +/- 0.050 (in 3 folds),0.060 +/- 0.000 (in 1 folds),0.358,0.231,0.018,Unknown


rf_multiclass,rf_multiclass.decision_thresholds_tuned,elasticnet_cv,elasticnet_cv.decision_thresholds_tuned
Per-fold scores: ROC-AUC (weighted OvO): 0.664 +/- 0.011 (in 3 folds) ROC-AUC (macro OvO): 0.658 +/- 0.004 (in 3 folds) au-PRC (weighted OvO): 0.682 +/- 0.014 (in 3 folds) au-PRC (macro OvO): 0.674 +/- 0.022 (in 3 folds) Accuracy: 0.353 +/- 0.041 (in 3 folds) MCC: 0.278 +/- 0.012 (in 3 folds) Global scores: Accuracy: 0.352 MCC: 0.216 Global classification report:  precision recall f1-score support  20-30 0.34 0.53 0.42 30  30-40 0.08 0.06 0.07 18  40-50 0.33 0.12 0.18 24  50-60 0.19 0.22 0.21 32  60-70 0.17 0.21 0.19 24  70-80 0.00 0.00 0.00 2  <20 0.84 0.74 0.79 35  accuracy 0.35 165  macro avg 0.28 0.27 0.26 165 weighted avg 0.36 0.35 0.34 165,Per-fold scores: ROC-AUC (weighted OvO): 0.664 +/- 0.011 (in 3 folds) ROC-AUC (macro OvO): 0.658 +/- 0.004 (in 3 folds) au-PRC (weighted OvO): 0.682 +/- 0.014 (in 3 folds) au-PRC (macro OvO): 0.674 +/- 0.022 (in 3 folds) Accuracy: 0.284 +/- 0.019 (in 3 folds) MCC: 0.235 +/- 0.058 (in 3 folds) Global scores: Accuracy: 0.285 MCC: 0.147 Global classification report:  precision recall f1-score support  20-30 0.33 0.10 0.15 30  30-40 0.25 0.06 0.09 18  40-50 0.17 0.04 0.07 24  50-60 0.16 0.22 0.18 32  60-70 0.13 0.38 0.19 24  70-80 0.00 0.00 0.00 2  <20 0.84 0.74 0.79 35  accuracy 0.28 165  macro avg 0.27 0.22 0.21 165 weighted avg 0.34 0.28 0.28 165,Per-fold scores: ROC-AUC (weighted OvO): 0.642 +/- 0.015 (in 3 folds) ROC-AUC (macro OvO): 0.624 +/- 0.027 (in 3 folds) au-PRC (weighted OvO): 0.666 +/- 0.031 (in 3 folds) au-PRC (macro OvO): 0.652 +/- 0.041 (in 3 folds) Accuracy: 0.216 +/- 0.074 (in 3 folds) MCC: 0.189 +/- 0.093 (in 3 folds) Global scores: Accuracy: 0.212 MCC: 0.053 Global classification report:  precision recall f1-score support  20-30 0.31 0.13 0.19 30  30-40 0.00 0.00 0.00 18  40-50 0.17 0.21 0.19 24  50-60 0.11 0.16 0.13 32  60-70 0.10 0.21 0.14 24  70-80 0.00 0.00 0.00 2  <20 0.76 0.46 0.57 35  accuracy 0.21 165  macro avg 0.21 0.17 0.17 165 weighted avg 0.28 0.21 0.23 165,Per-fold scores: ROC-AUC (weighted 
OvO): 0.642 +/- 0.015 (in 3 folds) ROC-AUC (macro OvO): 0.624 +/- 0.027 (in 3 folds) au-PRC (weighted OvO): 0.666 +/- 0.031 (in 3 folds) au-PRC (macro OvO): 0.652 +/- 0.041 (in 3 folds) Accuracy: 0.367 +/- 0.064 (in 3 folds) MCC: 0.254 +/- 0.090 (in 3 folds) Global scores: Accuracy: 0.364 MCC: 0.223 Global classification report:  precision recall f1-score support  20-30 0.27 0.47 0.35 30  30-40 0.00 0.00 0.00 18  40-50 0.22 0.08 0.12 24  50-60 0.34 0.44 0.38 32  60-70 0.00 0.00 0.00 24  70-80 0.00 0.00 0.00 2  <20 0.48 0.86 0.61 35  accuracy 0.36 165  macro avg 0.19 0.26 0.21 165 weighted avg 0.25 0.36 0.28 165
,,,


ridge_cv,ridge_cv.decision_thresholds_tuned,lasso_cv,lasso_cv.decision_thresholds_tuned
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.640 +/- 0.042 (in 3 folds) ROC-AUC (macro OvO): 0.623 +/- 0.027 (in 3 folds) au-PRC (weighted OvO): 0.664 +/- 0.007 (in 3 folds) au-PRC (macro OvO): 0.650 +/- 0.014 (in 3 folds) Accuracy: 0.186 +/- 0.038 (in 3 folds) MCC: 0.105 +/- 0.112 (in 3 folds) Global scores without abstention: Accuracy: 0.182 MCC: -0.004 Per-fold scores with abstention (note that abstentions not included in probability-based scores): ROC-AUC (weighted OvO): 0.629 +/- 0.052 (in 2 folds) ROC-AUC (macro OvO): 0.615 +/- 0.033 (in 2 folds) au-PRC (weighted OvO): 0.660 +/- 0.003 (in 2 folds) au-PRC (macro OvO): 0.647 +/- 0.019 (in 2 folds) Accuracy: 0.177 +/- 0.024 (in 3 folds) MCC: 0.124 +/- 0.087 (in 3 folds) Unknown/abstention proportion: 0.120 +/- 0.000 (in 1 folds) Global scores with abstention: Accuracy: 0.176 MCC: -0.004 Unknown/abstention proportion: 0.036 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  20-30 0.24 0.13 0.17 30  30-40 0.00 0.00 0.00 18  40-50 0.00 0.00 0.00 24  50-60 0.10 0.16 0.12 32  60-70 0.12 0.21 0.15 24  70-80 0.00 0.00 0.00 2  <20 0.31 0.43 0.36 35  Unknown 0.00 0.00 0.00 0  accuracy 0.18 165  macro avg 0.09 0.12 0.10 165 weighted avg 0.14 0.18 0.15 165,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.640 +/- 0.042 (in 3 folds) ROC-AUC (macro OvO): 0.623 +/- 0.027 (in 3 folds) au-PRC (weighted OvO): 0.664 +/- 0.007 (in 3 folds) au-PRC (macro OvO): 0.650 +/- 0.014 (in 3 folds) Accuracy: 0.296 +/- 0.060 (in 3 folds) MCC: 0.137 +/- 0.119 (in 3 folds) Global scores without abstention: Accuracy: 0.302 MCC: 0.148 Per-fold scores with abstention (note that abstentions not included in probability-based scores): ROC-AUC (weighted OvO): 0.629 +/- 0.052 (in 2 folds) ROC-AUC (macro OvO): 0.615 +/- 0.033 (in 2 folds) au-PRC (weighted OvO): 0.660 +/- 0.003 (in 2 folds) au-PRC (macro OvO): 0.647 +/- 0.019 (in 2 folds) Accuracy: 0.287 +/- 0.076 (in 3 
folds) MCC: 0.157 +/- 0.085 (in 3 folds) Unknown/abstention proportion: 0.120 +/- 0.000 (in 1 folds) Global scores with abstention: Accuracy: 0.291 MCC: 0.145 Unknown/abstention proportion: 0.036 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  20-30 0.25 0.47 0.33 30  30-40 0.00 0.00 0.00 18  40-50 0.14 0.04 0.06 24  50-60 0.00 0.00 0.00 32  60-70 0.00 0.00 0.00 24  70-80 0.00 0.00 0.00 2  <20 0.36 0.94 0.52 35  Unknown 0.00 0.00 0.00 0  accuracy 0.29 165  macro avg 0.09 0.18 0.11 165 weighted avg 0.14 0.29 0.18 165,Per-fold scores: ROC-AUC (weighted OvO): 0.637 +/- 0.024 (in 3 folds) ROC-AUC (macro OvO): 0.619 +/- 0.010 (in 3 folds) au-PRC (weighted OvO): 0.670 +/- 0.018 (in 3 folds) au-PRC (macro OvO): 0.657 +/- 0.027 (in 3 folds) Accuracy: 0.227 +/- 0.046 (in 3 folds) MCC: 0.210 +/- 0.030 (in 3 folds) Global scores: Accuracy: 0.224 MCC: 0.073 Global classification report:  precision recall f1-score support  20-30 0.30 0.10 0.15 30  30-40 0.00 0.00 0.00 18  40-50 0.11 0.04 0.06 24  50-60 0.10 0.16 0.12 32  60-70 0.13 0.42 0.20 24  70-80 0.00 0.00 0.00 2  <20 0.95 0.51 0.67 35  accuracy 0.22 165  macro avg 0.23 0.18 0.17 165 weighted avg 0.31 0.22 0.23 165,Per-fold scores: ROC-AUC (weighted OvO): 0.637 +/- 0.024 (in 3 folds) ROC-AUC (macro OvO): 0.619 +/- 0.010 (in 3 folds) au-PRC (weighted OvO): 0.670 +/- 0.018 (in 3 folds) au-PRC (macro OvO): 0.657 +/- 0.027 (in 3 folds) Accuracy: 0.344 +/- 0.102 (in 3 folds) MCC: 0.271 +/- 0.092 (in 3 folds) Global scores: Accuracy: 0.339 MCC: 0.213 Global classification report:  precision recall f1-score support  20-30 0.22 0.33 0.26 30  30-40 0.00 0.00 0.00 18  40-50 0.00 0.00 0.00 24  50-60 0.24 0.72 0.36 32  60-70 0.00 0.00 0.00 24  70-80 0.00 0.00 0.00 2  <20 0.96 0.66 0.78 35  accuracy 0.34 165  macro avg 0.20 0.24 0.20 165 weighted avg 0.29 0.34 0.28 165
,,,


linearsvm_ovr,linearsvm_ovr.decision_thresholds_tuned,xgboost,xgboost.decision_thresholds_tuned
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.623 +/- 0.054 (in 3 folds) ROC-AUC (macro OvO): 0.605 +/- 0.057 (in 3 folds) au-PRC (weighted OvO): 0.661 +/- 0.052 (in 3 folds) au-PRC (macro OvO): 0.648 +/- 0.056 (in 3 folds) Accuracy: 0.344 +/- 0.053 (in 3 folds) MCC: 0.252 +/- 0.030 (in 3 folds) Global scores without abstention: Accuracy: 0.340 MCC: 0.195 Per-fold scores with abstention (note that abstentions not included in probability-based scores): ROC-AUC (weighted OvO): 0.597 +/- 0.044 (in 2 folds) ROC-AUC (macro OvO): 0.583 +/- 0.059 (in 2 folds) au-PRC (weighted OvO): 0.638 +/- 0.047 (in 2 folds) au-PRC (macro OvO): 0.626 +/- 0.058 (in 2 folds) Accuracy: 0.336 +/- 0.039 (in 3 folds) MCC: 0.246 +/- 0.026 (in 3 folds) Unknown/abstention proportion: 0.060 +/- 0.000 (in 1 folds) Global scores with abstention: Accuracy: 0.333 MCC: 0.192 Unknown/abstention proportion: 0.018 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  20-30 0.32 0.47 0.38 30  30-40 0.00 0.00 0.00 18  40-50 0.25 0.12 0.17 24  50-60 0.20 0.25 0.22 32  60-70 0.10 0.12 0.11 24  70-80 0.00 0.00 0.00 2  <20 0.77 0.77 0.77 35  Unknown 0.00 0.00 0.00 0  accuracy 0.33 165  macro avg 0.20 0.22 0.21 165 weighted avg 0.31 0.33 0.32 165,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.623 +/- 0.054 (in 3 folds) ROC-AUC (macro OvO): 0.605 +/- 0.057 (in 3 folds) au-PRC (weighted OvO): 0.661 +/- 0.052 (in 3 folds) au-PRC (macro OvO): 0.648 +/- 0.056 (in 3 folds) Accuracy: 0.368 +/- 0.081 (in 3 folds) MCC: 0.261 +/- 0.056 (in 3 folds) Global scores without abstention: Accuracy: 0.364 MCC: 0.237 Per-fold scores with abstention (note that abstentions not included in probability-based scores): ROC-AUC (weighted OvO): 0.597 +/- 0.044 (in 2 folds) ROC-AUC (macro OvO): 0.583 +/- 0.059 (in 2 folds) au-PRC (weighted OvO): 0.638 +/- 0.047 (in 2 folds) au-PRC (macro OvO): 0.626 +/- 0.058 (in 2 folds) Accuracy: 0.360 +/- 0.068 (in 3 
folds) MCC: 0.256 +/- 0.050 (in 3 folds) Unknown/abstention proportion: 0.060 +/- 0.000 (in 1 folds) Global scores with abstention: Accuracy: 0.358 MCC: 0.231 Unknown/abstention proportion: 0.018 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  20-30 0.34 0.60 0.43 30  30-40 0.00 0.00 0.00 18  40-50 0.00 0.00 0.00 24  50-60 0.25 0.59 0.35 32  60-70 0.00 0.00 0.00 24  70-80 0.00 0.00 0.00 2  <20 0.76 0.63 0.69 35  Unknown 0.00 0.00 0.00 0  accuracy 0.36 165  macro avg 0.17 0.23 0.18 165 weighted avg 0.27 0.36 0.29 165,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.622 +/- 0.053 (in 3 folds) ROC-AUC (macro OvO): 0.598 +/- 0.060 (in 3 folds) au-PRC (weighted OvO): 0.654 +/- 0.048 (in 3 folds) au-PRC (macro OvO): 0.635 +/- 0.051 (in 3 folds) Accuracy: 0.289 +/- 0.049 (in 3 folds) MCC: 0.156 +/- 0.027 (in 3 folds) Global scores without abstention: Accuracy: 0.287 MCC: 0.136 Per-fold scores with abstention (note that abstentions not included in probability-based scores): ROC-AUC (weighted OvO): 0.630 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.626 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.667 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.660 +/- 0.000 (in 1 folds) Accuracy: 0.272 +/- 0.037 (in 3 folds) MCC: 0.148 +/- 0.020 (in 3 folds) Unknown/abstention proportion: 0.077 +/- 0.061 (in 2 folds) Global scores with abstention: Accuracy: 0.273 MCC: 0.125 Unknown/abstention proportion: 0.048 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  20-30 0.27 0.33 0.30 30  30-40 0.00 0.00 0.00 18  40-50 0.00 0.00 0.00 24  50-60 0.16 0.25 0.20 32  60-70 0.09 0.04 0.06 24  70-80 0.00 0.00 0.00 2  <20 0.87 0.74 0.80 35  Unknown 0.00 0.00 0.00 0  accuracy 0.27 165  macro avg 0.17 0.17 0.17 165 weighted avg 0.28 0.27 0.27 165,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.622 +/- 0.053 (in 3 folds) ROC-AUC (macro OvO): 0.598 +/- 0.060 
(in 3 folds) au-PRC (weighted OvO): 0.654 +/- 0.048 (in 3 folds) au-PRC (macro OvO): 0.635 +/- 0.051 (in 3 folds) Accuracy: 0.355 +/- 0.053 (in 3 folds) MCC: 0.206 +/- 0.061 (in 3 folds) Global scores without abstention: Accuracy: 0.350 MCC: 0.213 Per-fold scores with abstention (note that abstentions not included in probability-based scores): ROC-AUC (weighted OvO): 0.630 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.626 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.667 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.660 +/- 0.000 (in 1 folds) Accuracy: 0.334 +/- 0.029 (in 3 folds) MCC: 0.191 +/- 0.043 (in 3 folds) Unknown/abstention proportion: 0.077 +/- 0.061 (in 2 folds) Global scores with abstention: Accuracy: 0.333 MCC: 0.198 Unknown/abstention proportion: 0.048 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  20-30 0.33 0.63 0.43 30  30-40 0.00 0.00 0.00 18  40-50 0.09 0.04 0.06 24  50-60 0.22 0.28 0.25 32  60-70 0.12 0.08 0.10 24  70-80 0.00 0.00 0.00 2  <20 0.77 0.69 0.73 35  Unknown 0.00 0.00 0.00 0  accuracy 0.33 165  macro avg 0.19 0.22 0.20 165 weighted avg 0.30 0.33 0.30 165
,,,


lasso_multiclass,lasso_multiclass.decision_thresholds_tuned
Per-fold scores: ROC-AUC (weighted OvO): 0.607 +/- 0.041 (in 3 folds) ROC-AUC (macro OvO): 0.589 +/- 0.046 (in 3 folds) au-PRC (weighted OvO): 0.650 +/- 0.043 (in 3 folds) au-PRC (macro OvO): 0.637 +/- 0.051 (in 3 folds) Accuracy: 0.248 +/- 0.030 (in 3 folds) MCC: 0.174 +/- 0.013 (in 3 folds) Global scores: Accuracy: 0.248 MCC: 0.096 Global classification report:  precision recall f1-score support  20-30 0.26 0.17 0.20 30  30-40 0.05 0.06 0.05 18  40-50 0.00 0.00 0.00 24  50-60 0.13 0.19 0.15 32  60-70 0.10 0.17 0.12 24  70-80 0.00 0.00 0.00 2  <20 0.89 0.71 0.79 35  accuracy 0.25 165  macro avg 0.20 0.18 0.19 165 weighted avg 0.28 0.25 0.26 165,Per-fold scores: ROC-AUC (weighted OvO): 0.607 +/- 0.041 (in 3 folds) ROC-AUC (macro OvO): 0.589 +/- 0.046 (in 3 folds) au-PRC (weighted OvO): 0.650 +/- 0.043 (in 3 folds) au-PRC (macro OvO): 0.637 +/- 0.051 (in 3 folds) Accuracy: 0.311 +/- 0.086 (in 3 folds) MCC: 0.240 +/- 0.069 (in 3 folds) Global scores: Accuracy: 0.315 MCC: 0.175 Global classification report:  precision recall f1-score support  20-30 0.35 0.27 0.30 30  30-40 0.11 0.06 0.07 18  40-50 0.00 0.00 0.00 24  50-60 0.21 0.50 0.30 32  60-70 0.10 0.12 0.11 24  70-80 0.00 0.00 0.00 2  <20 0.96 0.69 0.80 35  accuracy 0.32 165  macro avg 0.25 0.23 0.23 165 weighted avg 0.33 0.32 0.31 165
,


---

# GeneLocus.TCR, TargetObsColumnEnum.age_group_binary_healthy_only trained on train_smaller set

## Specimen predictions on validation set

Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,Accuracy per fold with abstention,MCC per fold with abstention,Unknown/abstention proportion per fold with abstention,Accuracy global with abstention,MCC global with abstention,Unknown/abstention proportion global with abstention,Abstention label global with abstention,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes,ROC-AUC (weighted OvO) per fold with abstention,ROC-AUC (macro OvO) per fold with abstention,au-PRC (weighted OvO) per fold with abstention,au-PRC (macro OvO) per fold with abstention
lasso_multiclass,0.755 +/- 0.061 (in 3 folds),0.755 +/- 0.061 (in 3 folds),0.871 +/- 0.049 (in 3 folds),0.871 +/- 0.049 (in 3 folds),0.697 +/- 0.036 (in 3 folds),0.339 +/- 0.076 (in 3 folds),0.696,0.331,0.679 +/- 0.033 (in 3 folds),0.320 +/- 0.058 (in 3 folds),0.038 +/- 0.018 (in 2 folds),0.678,0.313,0.026,Unknown,112.0,3.0,115.0,0.026087,False,0.801 +/- 0.000 (in 1 folds),0.801 +/- 0.000 (in 1 folds),0.926 +/- 0.000 (in 1 folds),0.926 +/- 0.000 (in 1 folds)
linearsvm_ovr,0.743 +/- 0.055 (in 3 folds),0.743 +/- 0.055 (in 3 folds),0.864 +/- 0.029 (in 3 folds),0.864 +/- 0.029 (in 3 folds),0.706 +/- 0.050 (in 3 folds),0.334 +/- 0.134 (in 3 folds),0.705,0.34,0.687 +/- 0.041 (in 3 folds),0.313 +/- 0.110 (in 3 folds),0.038 +/- 0.018 (in 2 folds),0.687,0.32,0.026,Unknown,112.0,3.0,115.0,0.026087,False,0.745 +/- 0.000 (in 1 folds),0.745 +/- 0.000 (in 1 folds),0.887 +/- 0.000 (in 1 folds),0.887 +/- 0.000 (in 1 folds)
elasticnet_cv,0.701 +/- 0.136 (in 2 folds),0.701 +/- 0.136 (in 2 folds),0.820 +/- 0.076 (in 2 folds),0.820 +/- 0.076 (in 2 folds),0.781 +/- 0.190 (in 3 folds),0.101 +/- 0.174 (in 3 folds),0.714,0.256,0.518 +/- 0.191 (in 3 folds),0.160 +/- 0.142 (in 3 folds),0.277 +/- 0.369 (in 3 folds),0.522,0.146,0.27,Unknown,84.0,31.0,115.0,0.269565,False,,,,
ridge_cv,0.690 +/- 0.117 (in 2 folds),0.690 +/- 0.117 (in 2 folds),0.811 +/- 0.054 (in 2 folds),0.811 +/- 0.054 (in 2 folds),0.754 +/- 0.216 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.679,0.0,0.492 +/- 0.171 (in 3 folds),0.078 +/- 0.116 (in 3 folds),0.277 +/- 0.369 (in 3 folds),0.496,0.046,0.27,Unknown,84.0,31.0,115.0,0.269565,True,,,,
lasso_cv,0.688 +/- 0.119 (in 2 folds),0.688 +/- 0.119 (in 2 folds),0.807 +/- 0.058 (in 2 folds),0.807 +/- 0.058 (in 2 folds),0.808 +/- 0.172 (in 3 folds),0.204 +/- 0.253 (in 3 folds),0.75,0.38,0.544 +/- 0.219 (in 3 folds),0.247 +/- 0.176 (in 3 folds),0.277 +/- 0.369 (in 3 folds),0.548,0.226,0.27,Unknown,84.0,31.0,115.0,0.269565,False,,,,
xgboost,0.647 +/- 0.024 (in 3 folds),0.647 +/- 0.024 (in 3 folds),0.749 +/- 0.070 (in 3 folds),0.749 +/- 0.070 (in 3 folds),0.688 +/- 0.063 (in 3 folds),0.285 +/- 0.118 (in 3 folds),0.688,0.292,0.671 +/- 0.075 (in 3 folds),0.270 +/- 0.123 (in 3 folds),0.038 +/- 0.018 (in 2 folds),0.67,0.275,0.026,Unknown,112.0,3.0,115.0,0.026087,False,0.673 +/- 0.000 (in 1 folds),0.673 +/- 0.000 (in 1 folds),0.824 +/- 0.000 (in 1 folds),0.824 +/- 0.000 (in 1 folds)
rf_multiclass,0.626 +/- 0.063 (in 3 folds),0.626 +/- 0.063 (in 3 folds),0.760 +/- 0.045 (in 3 folds),0.760 +/- 0.045 (in 3 folds),0.679 +/- 0.065 (in 3 folds),0.233 +/- 0.148 (in 3 folds),0.679,0.238,0.662 +/- 0.070 (in 3 folds),0.216 +/- 0.140 (in 3 folds),0.038 +/- 0.018 (in 2 folds),0.661,0.221,0.026,Unknown,112.0,3.0,115.0,0.026087,False,0.556 +/- 0.000 (in 1 folds),0.556 +/- 0.000 (in 1 folds),0.781 +/- 0.000 (in 1 folds),0.781 +/- 0.000 (in 1 folds)
dummy_stratified,0.585 +/- 0.027 (in 2 folds),0.585 +/- 0.027 (in 2 folds),0.671 +/- 0.066 (in 2 folds),0.671 +/- 0.066 (in 2 folds),0.713 +/- 0.172 (in 3 folds),0.114 +/- 0.104 (in 3 folds),0.651,0.206,0.483 +/- 0.184 (in 3 folds),0.161 +/- 0.021 (in 3 folds),0.390 +/- 0.442 (in 2 folds),0.487,0.138,0.252,Unknown,86.0,29.0,115.0,0.252174,False,0.567 +/- 0.000 (in 1 folds),0.567 +/- 0.000 (in 1 folds),0.625 +/- 0.000 (in 1 folds),0.625 +/- 0.000 (in 1 folds)
dummy_most_frequent,0.500 +/- 0.000 (in 2 folds),0.500 +/- 0.000 (in 2 folds),0.631 +/- 0.051 (in 2 folds),0.631 +/- 0.051 (in 2 folds),0.754 +/- 0.216 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.679,0.0,0.492 +/- 0.171 (in 3 folds),0.078 +/- 0.116 (in 3 folds),0.277 +/- 0.369 (in 3 folds),0.496,0.046,0.27,Unknown,84.0,31.0,115.0,0.269565,True,,,,
"All results, sorted",,,,,,,,,,,,,,,,,,,,,,,,

Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,Accuracy per fold with abstention,MCC per fold with abstention,Unknown/abstention proportion per fold with abstention,Accuracy global with abstention,MCC global with abstention,Unknown/abstention proportion global with abstention,Abstention label global with abstention,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes,ROC-AUC (weighted OvO) per fold with abstention,ROC-AUC (macro OvO) per fold with abstention,au-PRC (weighted OvO) per fold with abstention,au-PRC (macro OvO) per fold with abstention
lasso_multiclass,0.755 +/- 0.061 (in 3 folds),0.755 +/- 0.061 (in 3 folds),0.871 +/- 0.049 (in 3 folds),0.871 +/- 0.049 (in 3 folds),0.697 +/- 0.036 (in 3 folds),0.339 +/- 0.076 (in 3 folds),0.696,0.331,0.679 +/- 0.033 (in 3 folds),0.320 +/- 0.058 (in 3 folds),0.038 +/- 0.018 (in 2 folds),0.678,0.313,0.026,Unknown,112,3,115,0.026087,False,0.801 +/- 0.000 (in 1 folds),0.801 +/- 0.000 (in 1 folds),0.926 +/- 0.000 (in 1 folds),0.926 +/- 0.000 (in 1 folds)
linearsvm_ovr,0.743 +/- 0.055 (in 3 folds),0.743 +/- 0.055 (in 3 folds),0.864 +/- 0.029 (in 3 folds),0.864 +/- 0.029 (in 3 folds),0.706 +/- 0.050 (in 3 folds),0.334 +/- 0.134 (in 3 folds),0.705,0.34,0.687 +/- 0.041 (in 3 folds),0.313 +/- 0.110 (in 3 folds),0.038 +/- 0.018 (in 2 folds),0.687,0.32,0.026,Unknown,112,3,115,0.026087,False,0.745 +/- 0.000 (in 1 folds),0.745 +/- 0.000 (in 1 folds),0.887 +/- 0.000 (in 1 folds),0.887 +/- 0.000 (in 1 folds)
elasticnet_cv,0.701 +/- 0.136 (in 2 folds),0.701 +/- 0.136 (in 2 folds),0.820 +/- 0.076 (in 2 folds),0.820 +/- 0.076 (in 2 folds),0.781 +/- 0.190 (in 3 folds),0.101 +/- 0.174 (in 3 folds),0.714,0.256,0.518 +/- 0.191 (in 3 folds),0.160 +/- 0.142 (in 3 folds),0.277 +/- 0.369 (in 3 folds),0.522,0.146,0.27,Unknown,84,31,115,0.269565,False,,,,
ridge_cv,0.690 +/- 0.117 (in 2 folds),0.690 +/- 0.117 (in 2 folds),0.811 +/- 0.054 (in 2 folds),0.811 +/- 0.054 (in 2 folds),0.754 +/- 0.216 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.679,0.0,0.492 +/- 0.171 (in 3 folds),0.078 +/- 0.116 (in 3 folds),0.277 +/- 0.369 (in 3 folds),0.496,0.046,0.27,Unknown,84,31,115,0.269565,True,,,,
lasso_cv,0.688 +/- 0.119 (in 2 folds),0.688 +/- 0.119 (in 2 folds),0.807 +/- 0.058 (in 2 folds),0.807 +/- 0.058 (in 2 folds),0.808 +/- 0.172 (in 3 folds),0.204 +/- 0.253 (in 3 folds),0.75,0.38,0.544 +/- 0.219 (in 3 folds),0.247 +/- 0.176 (in 3 folds),0.277 +/- 0.369 (in 3 folds),0.548,0.226,0.27,Unknown,84,31,115,0.269565,False,,,,
xgboost,0.647 +/- 0.024 (in 3 folds),0.647 +/- 0.024 (in 3 folds),0.749 +/- 0.070 (in 3 folds),0.749 +/- 0.070 (in 3 folds),0.688 +/- 0.063 (in 3 folds),0.285 +/- 0.118 (in 3 folds),0.688,0.292,0.671 +/- 0.075 (in 3 folds),0.270 +/- 0.123 (in 3 folds),0.038 +/- 0.018 (in 2 folds),0.67,0.275,0.026,Unknown,112,3,115,0.026087,False,0.673 +/- 0.000 (in 1 folds),0.673 +/- 0.000 (in 1 folds),0.824 +/- 0.000 (in 1 folds),0.824 +/- 0.000 (in 1 folds)
rf_multiclass,0.626 +/- 0.063 (in 3 folds),0.626 +/- 0.063 (in 3 folds),0.760 +/- 0.045 (in 3 folds),0.760 +/- 0.045 (in 3 folds),0.679 +/- 0.065 (in 3 folds),0.233 +/- 0.148 (in 3 folds),0.679,0.238,0.662 +/- 0.070 (in 3 folds),0.216 +/- 0.140 (in 3 folds),0.038 +/- 0.018 (in 2 folds),0.661,0.221,0.026,Unknown,112,3,115,0.026087,False,0.556 +/- 0.000 (in 1 folds),0.556 +/- 0.000 (in 1 folds),0.781 +/- 0.000 (in 1 folds),0.781 +/- 0.000 (in 1 folds)
dummy_stratified,0.585 +/- 0.027 (in 2 folds),0.585 +/- 0.027 (in 2 folds),0.671 +/- 0.066 (in 2 folds),0.671 +/- 0.066 (in 2 folds),0.713 +/- 0.172 (in 3 folds),0.114 +/- 0.104 (in 3 folds),0.651,0.206,0.483 +/- 0.184 (in 3 folds),0.161 +/- 0.021 (in 3 folds),0.390 +/- 0.442 (in 2 folds),0.487,0.138,0.252,Unknown,86,29,115,0.252174,False,0.567 +/- 0.000 (in 1 folds),0.567 +/- 0.000 (in 1 folds),0.625 +/- 0.000 (in 1 folds),0.625 +/- 0.000 (in 1 folds)
dummy_most_frequent,0.500 +/- 0.000 (in 2 folds),0.500 +/- 0.000 (in 2 folds),0.631 +/- 0.051 (in 2 folds),0.631 +/- 0.051 (in 2 folds),0.754 +/- 0.216 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.679,0.0,0.492 +/- 0.171 (in 3 folds),0.078 +/- 0.116 (in 3 folds),0.277 +/- 0.369 (in 3 folds),0.496,0.046,0.27,Unknown,84,31,115,0.269565,True,,,,


lasso_multiclass,linearsvm_ovr,elasticnet_cv,ridge_cv
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.755 +/- 0.061 (in 3 folds) ROC-AUC (macro OvO): 0.755 +/- 0.061 (in 3 folds) au-PRC (weighted OvO): 0.871 +/- 0.049 (in 3 folds) au-PRC (macro OvO): 0.871 +/- 0.049 (in 3 folds) Accuracy: 0.697 +/- 0.036 (in 3 folds) MCC: 0.339 +/- 0.076 (in 3 folds) Global scores without abstention: Accuracy: 0.696 MCC: 0.331 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.679 +/- 0.033 (in 3 folds) MCC: 0.320 +/- 0.058 (in 3 folds) Unknown/abstention proportion: 0.038 +/- 0.018 (in 2 folds) ROC-AUC (weighted OvO): 0.801 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.801 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.926 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.926 +/- 0.000 (in 1 folds) Global scores with abstention: Accuracy: 0.678 MCC: 0.313 Unknown/abstention proportion: 0.026 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  50+ 0.56 0.55 0.56 40  Unknown 0.00 0.00 0.00 0  under 50 0.77 0.75 0.76 75  accuracy 0.68 115  macro avg 0.44 0.43 0.44 115 weighted avg 0.70 0.68 0.69 115,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.743 +/- 0.055 (in 3 folds) ROC-AUC (macro OvO): 0.743 +/- 0.055 (in 3 folds) au-PRC (weighted OvO): 0.864 +/- 0.029 (in 3 folds) au-PRC (macro OvO): 0.864 +/- 0.029 (in 3 folds) Accuracy: 0.706 +/- 0.050 (in 3 folds) MCC: 0.334 +/- 0.134 (in 3 folds) Global scores without abstention: Accuracy: 0.705 MCC: 0.340 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.687 +/- 0.041 (in 3 folds) MCC: 0.313 +/- 0.110 (in 3 folds) Unknown/abstention proportion: 0.038 +/- 0.018 (in 2 folds) ROC-AUC (weighted OvO): 0.745 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.745 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.887 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.887 +/- 0.000 (in 1 folds) Global scores with 
abstention: Accuracy: 0.687 MCC: 0.320 Unknown/abstention proportion: 0.026 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  50+ 0.58 0.53 0.55 40  Unknown 0.00 0.00 0.00 0  under 50 0.76 0.77 0.77 75  accuracy 0.69 115  macro avg 0.45 0.43 0.44 115 weighted avg 0.70 0.69 0.69 115,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.701 +/- 0.136 (in 2 folds) ROC-AUC (macro OvO): 0.701 +/- 0.136 (in 2 folds) au-PRC (weighted OvO): 0.820 +/- 0.076 (in 2 folds) au-PRC (macro OvO): 0.820 +/- 0.076 (in 2 folds) Accuracy: 0.781 +/- 0.190 (in 3 folds) MCC: 0.101 +/- 0.174 (in 3 folds) Global scores without abstention: Accuracy: 0.714 MCC: 0.256 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.518 +/- 0.191 (in 3 folds) MCC: 0.160 +/- 0.142 (in 3 folds) Unknown/abstention proportion: 0.277 +/- 0.369 (in 3 folds) Global scores with abstention: Accuracy: 0.522 MCC: 0.146 Unknown/abstention proportion: 0.270 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  50+ 0.67 0.15 0.24 40  Unknown 0.00 0.00 0.00 0  under 50 0.72 0.72 0.72 75  accuracy 0.52 115  macro avg 0.46 0.29 0.32 115 weighted avg 0.70 0.52 0.55 115,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.690 +/- 0.117 (in 2 folds) ROC-AUC (macro OvO): 0.690 +/- 0.117 (in 2 folds) au-PRC (weighted OvO): 0.811 +/- 0.054 (in 2 folds) au-PRC (macro OvO): 0.811 +/- 0.054 (in 2 folds) Accuracy: 0.754 +/- 0.216 (in 3 folds) MCC: 0.000 +/- 0.000 (in 3 folds) Global scores without abstention: Accuracy: 0.679 MCC: 0.000 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.492 +/- 0.171 (in 3 folds) MCC: 0.078 +/- 0.116 (in 3 folds) Unknown/abstention proportion: 0.277 +/- 0.369 (in 3 folds) Global scores with abstention: Accuracy: 0.496 MCC: 0.046 Unknown/abstention proportion: 
0.270 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  50+ 0.00 0.00 0.00 40  Unknown 0.00 0.00 0.00 0  under 50 0.68 0.76 0.72 75  accuracy 0.50 115  macro avg 0.23 0.25 0.24 115 weighted avg 0.44 0.50 0.47 115
,,,


lasso_cv,xgboost,rf_multiclass,dummy_stratified
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.688 +/- 0.119 (in 2 folds) ROC-AUC (macro OvO): 0.688 +/- 0.119 (in 2 folds) au-PRC (weighted OvO): 0.807 +/- 0.058 (in 2 folds) au-PRC (macro OvO): 0.807 +/- 0.058 (in 2 folds) Accuracy: 0.808 +/- 0.172 (in 3 folds) MCC: 0.204 +/- 0.253 (in 3 folds) Global scores without abstention: Accuracy: 0.750 MCC: 0.380 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.544 +/- 0.219 (in 3 folds) MCC: 0.247 +/- 0.176 (in 3 folds) Unknown/abstention proportion: 0.277 +/- 0.369 (in 3 folds) Global scores with abstention: Accuracy: 0.548 MCC: 0.226 Unknown/abstention proportion: 0.270 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  50+ 0.69 0.28 0.39 40  Unknown 0.00 0.00 0.00 0  under 50 0.76 0.69 0.73 75  accuracy 0.55 115  macro avg 0.48 0.32 0.37 115 weighted avg 0.74 0.55 0.61 115,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.647 +/- 0.024 (in 3 folds) ROC-AUC (macro OvO): 0.647 +/- 0.024 (in 3 folds) au-PRC (weighted OvO): 0.749 +/- 0.070 (in 3 folds) au-PRC (macro OvO): 0.749 +/- 0.070 (in 3 folds) Accuracy: 0.688 +/- 0.063 (in 3 folds) MCC: 0.285 +/- 0.118 (in 3 folds) Global scores without abstention: Accuracy: 0.688 MCC: 0.292 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.671 +/- 0.075 (in 3 folds) MCC: 0.270 +/- 0.123 (in 3 folds) Unknown/abstention proportion: 0.038 +/- 0.018 (in 2 folds) ROC-AUC (weighted OvO): 0.673 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.673 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.824 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.824 +/- 0.000 (in 1 folds) Global scores with abstention: Accuracy: 0.670 MCC: 0.275 Unknown/abstention proportion: 0.026 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  50+ 0.56 0.47 0.51 40  
Unknown 0.00 0.00 0.00 0  under 50 0.74 0.77 0.76 75  accuracy 0.67 115  macro avg 0.43 0.42 0.42 115 weighted avg 0.68 0.67 0.67 115,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.626 +/- 0.063 (in 3 folds) ROC-AUC (macro OvO): 0.626 +/- 0.063 (in 3 folds) au-PRC (weighted OvO): 0.760 +/- 0.045 (in 3 folds) au-PRC (macro OvO): 0.760 +/- 0.045 (in 3 folds) Accuracy: 0.679 +/- 0.065 (in 3 folds) MCC: 0.233 +/- 0.148 (in 3 folds) Global scores without abstention: Accuracy: 0.679 MCC: 0.238 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.662 +/- 0.070 (in 3 folds) MCC: 0.216 +/- 0.140 (in 3 folds) Unknown/abstention proportion: 0.038 +/- 0.018 (in 2 folds) ROC-AUC (weighted OvO): 0.556 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.556 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.781 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.781 +/- 0.000 (in 1 folds) Global scores with abstention: Accuracy: 0.661 MCC: 0.221 Unknown/abstention proportion: 0.026 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  50+ 0.56 0.35 0.43 40  Unknown 0.00 0.00 0.00 0  under 50 0.71 0.83 0.77 75  accuracy 0.66 115  macro avg 0.42 0.39 0.40 115 weighted avg 0.66 0.66 0.65 115,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.585 +/- 0.027 (in 2 folds) ROC-AUC (macro OvO): 0.585 +/- 0.027 (in 2 folds) au-PRC (weighted OvO): 0.671 +/- 0.066 (in 2 folds) au-PRC (macro OvO): 0.671 +/- 0.066 (in 2 folds) Accuracy: 0.713 +/- 0.172 (in 3 folds) MCC: 0.114 +/- 0.104 (in 3 folds) Global scores without abstention: Accuracy: 0.651 MCC: 0.206 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.483 +/- 0.184 (in 3 folds) MCC: 0.161 +/- 0.021 (in 3 folds) Unknown/abstention proportion: 0.390 +/- 0.442 (in 2 folds) ROC-AUC (weighted OvO): 0.567 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.567 +/- 0.000 
(in 1 folds) au-PRC (weighted OvO): 0.625 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.625 +/- 0.000 (in 1 folds) Global scores with abstention: Accuracy: 0.487 MCC: 0.138 Unknown/abstention proportion: 0.252 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  50+ 0.46 0.33 0.38 40  Unknown 0.00 0.00 0.00 0  under 50 0.74 0.57 0.65 75  accuracy 0.49 115  macro avg 0.40 0.30 0.34 115 weighted avg 0.64 0.49 0.55 115
,,,


dummy_most_frequent
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.500 +/- 0.000 (in 2 folds) ROC-AUC (macro OvO): 0.500 +/- 0.000 (in 2 folds) au-PRC (weighted OvO): 0.631 +/- 0.051 (in 2 folds) au-PRC (macro OvO): 0.631 +/- 0.051 (in 2 folds) Accuracy: 0.754 +/- 0.216 (in 3 folds) MCC: 0.000 +/- 0.000 (in 3 folds) Global scores without abstention: Accuracy: 0.679 MCC: 0.000 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.492 +/- 0.171 (in 3 folds) MCC: 0.078 +/- 0.116 (in 3 folds) Unknown/abstention proportion: 0.277 +/- 0.369 (in 3 folds) Global scores with abstention: Accuracy: 0.496 MCC: 0.046 Unknown/abstention proportion: 0.270 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  50+ 0.00 0.00 0.00 40  Unknown 0.00 0.00 0.00 0  under 50 0.68 0.76 0.72 75  accuracy 0.50 115  macro avg 0.23 0.25 0.24 115 weighted avg 0.44 0.50 0.47 115


## Apply train-smaller model -- Test set performance - With and without tuning on validation set

Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,ROC-AUC (weighted OvO) per fold with abstention,ROC-AUC (macro OvO) per fold with abstention,au-PRC (weighted OvO) per fold with abstention,au-PRC (macro OvO) per fold with abstention,Accuracy per fold with abstention,MCC per fold with abstention,Unknown/abstention proportion per fold with abstention,Accuracy global with abstention,MCC global with abstention,Unknown/abstention proportion global with abstention,Abstention label global with abstention,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
ridge_cv,0.715 +/- 0.105 (in 3 folds),0.715 +/- 0.105 (in 3 folds),0.850 +/- 0.076 (in 3 folds),0.850 +/- 0.076 (in 3 folds),0.671 +/- 0.086 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.651,0.0,,,,,0.498 +/- 0.185 (in 3 folds),0.003 +/- 0.064 (in 3 folds),0.232 +/- 0.341 (in 3 folds),0.497,0.004,0.236,Unknown,126.0,39.0,165.0,0.236364,True
ridge_cv.decision_thresholds_tuned,0.715 +/- 0.105 (in 3 folds),0.715 +/- 0.105 (in 3 folds),0.850 +/- 0.076 (in 3 folds),0.850 +/- 0.076 (in 3 folds),0.631 +/- 0.149 (in 3 folds),-0.061 +/- 0.106 (in 3 folds),0.603,-0.068,,,,,0.458 +/- 0.171 (in 3 folds),-0.039 +/- 0.131 (in 3 folds),0.232 +/- 0.341 (in 3 folds),0.461,-0.028,0.236,Unknown,126.0,39.0,165.0,0.236364,False
lasso_cv,0.710 +/- 0.101 (in 3 folds),0.710 +/- 0.101 (in 3 folds),0.847 +/- 0.074 (in 3 folds),0.847 +/- 0.074 (in 3 folds),0.631 +/- 0.149 (in 3 folds),-0.061 +/- 0.106 (in 3 folds),0.603,-0.068,,,,,0.458 +/- 0.171 (in 3 folds),-0.039 +/- 0.131 (in 3 folds),0.232 +/- 0.341 (in 3 folds),0.461,-0.028,0.236,Unknown,126.0,39.0,165.0,0.236364,False
lasso_cv.decision_thresholds_tuned,0.710 +/- 0.101 (in 3 folds),0.710 +/- 0.101 (in 3 folds),0.847 +/- 0.074 (in 3 folds),0.847 +/- 0.074 (in 3 folds),0.571 +/- 0.165 (in 3 folds),0.036 +/- 0.240 (in 3 folds),0.524,0.035,,,,,0.401 +/- 0.100 (in 3 folds),0.043 +/- 0.215 (in 3 folds),0.232 +/- 0.341 (in 3 folds),0.4,0.023,0.236,Unknown,126.0,39.0,165.0,0.236364,False
elasticnet_cv,0.708 +/- 0.097 (in 3 folds),0.708 +/- 0.097 (in 3 folds),0.840 +/- 0.077 (in 3 folds),0.840 +/- 0.077 (in 3 folds),0.651 +/- 0.116 (in 3 folds),-0.034 +/- 0.059 (in 3 folds),0.627,-0.032,,,,,0.478 +/- 0.175 (in 3 folds),-0.014 +/- 0.090 (in 3 folds),0.232 +/- 0.341 (in 3 folds),0.479,-0.009,0.236,Unknown,126.0,39.0,165.0,0.236364,False
elasticnet_cv.decision_thresholds_tuned,0.708 +/- 0.097 (in 3 folds),0.708 +/- 0.097 (in 3 folds),0.840 +/- 0.077 (in 3 folds),0.840 +/- 0.077 (in 3 folds),0.565 +/- 0.170 (in 3 folds),0.029 +/- 0.228 (in 3 folds),0.516,0.023,,,,,0.395 +/- 0.096 (in 3 folds),0.036 +/- 0.205 (in 3 folds),0.232 +/- 0.341 (in 3 folds),0.394,0.016,0.236,Unknown,126.0,39.0,165.0,0.236364,False
linearsvm_ovr,0.705 +/- 0.095 (in 3 folds),0.705 +/- 0.095 (in 3 folds),0.840 +/- 0.077 (in 3 folds),0.840 +/- 0.077 (in 3 folds),0.635 +/- 0.147 (in 3 folds),0.168 +/- 0.309 (in 3 folds),0.642,0.178,0.778 +/- 0.000 (in 1 folds),0.778 +/- 0.000 (in 1 folds),0.896 +/- 0.000 (in 1 folds),0.896 +/- 0.000 (in 1 folds),0.624 +/- 0.149 (in 3 folds),0.162 +/- 0.306 (in 3 folds),0.027 +/- 0.010 (in 2 folds),0.63,0.17,0.018,Unknown,162.0,3.0,165.0,0.018182,False
linearsvm_ovr.decision_thresholds_tuned,0.705 +/- 0.095 (in 3 folds),0.705 +/- 0.095 (in 3 folds),0.840 +/- 0.077 (in 3 folds),0.840 +/- 0.077 (in 3 folds),0.593 +/- 0.122 (in 3 folds),0.144 +/- 0.289 (in 3 folds),0.599,0.145,0.778 +/- 0.000 (in 1 folds),0.778 +/- 0.000 (in 1 folds),0.896 +/- 0.000 (in 1 folds),0.896 +/- 0.000 (in 1 folds),0.584 +/- 0.127 (in 3 folds),0.137 +/- 0.286 (in 3 folds),0.027 +/- 0.010 (in 2 folds),0.588,0.14,0.018,Unknown,162.0,3.0,165.0,0.018182,False
lasso_multiclass,0.673 +/- 0.092 (in 3 folds),0.673 +/- 0.092 (in 3 folds),0.818 +/- 0.079 (in 3 folds),0.818 +/- 0.079 (in 3 folds),0.643 +/- 0.099 (in 3 folds),0.187 +/- 0.227 (in 3 folds),0.648,0.195,0.711 +/- 0.000 (in 1 folds),0.711 +/- 0.000 (in 1 folds),0.855 +/- 0.000 (in 1 folds),0.855 +/- 0.000 (in 1 folds),0.632 +/- 0.100 (in 3 folds),0.179 +/- 0.228 (in 3 folds),0.027 +/- 0.010 (in 2 folds),0.636,0.187,0.018,Unknown,162.0,3.0,165.0,0.018182,False
lasso_multiclass.decision_thresholds_tuned,0.673 +/- 0.092 (in 3 folds),0.673 +/- 0.092 (in 3 folds),0.818 +/- 0.079 (in 3 folds),0.818 +/- 0.079 (in 3 folds),0.552 +/- 0.071 (in 3 folds),0.110 +/- 0.254 (in 3 folds),0.556,0.101,0.711 +/- 0.000 (in 1 folds),0.711 +/- 0.000 (in 1 folds),0.855 +/- 0.000 (in 1 folds),0.855 +/- 0.000 (in 1 folds),0.542 +/- 0.071 (in 3 folds),0.104 +/- 0.250 (in 3 folds),0.027 +/- 0.010 (in 2 folds),0.545,0.098,0.018,Unknown,162.0,3.0,165.0,0.018182,False

Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,ROC-AUC (weighted OvO) per fold with abstention,ROC-AUC (macro OvO) per fold with abstention,au-PRC (weighted OvO) per fold with abstention,au-PRC (macro OvO) per fold with abstention,Accuracy per fold with abstention,MCC per fold with abstention,Unknown/abstention proportion per fold with abstention,Accuracy global with abstention,MCC global with abstention,Unknown/abstention proportion global with abstention,Abstention label global with abstention,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
ridge_cv,0.715 +/- 0.105 (in 3 folds),0.715 +/- 0.105 (in 3 folds),0.850 +/- 0.076 (in 3 folds),0.850 +/- 0.076 (in 3 folds),0.671 +/- 0.086 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.651,0.0,,,,,0.498 +/- 0.185 (in 3 folds),0.003 +/- 0.064 (in 3 folds),0.232 +/- 0.341 (in 3 folds),0.497,0.004,0.236,Unknown,126,39,165,0.236364,True
ridge_cv.decision_thresholds_tuned,0.715 +/- 0.105 (in 3 folds),0.715 +/- 0.105 (in 3 folds),0.850 +/- 0.076 (in 3 folds),0.850 +/- 0.076 (in 3 folds),0.631 +/- 0.149 (in 3 folds),-0.061 +/- 0.106 (in 3 folds),0.603,-0.068,,,,,0.458 +/- 0.171 (in 3 folds),-0.039 +/- 0.131 (in 3 folds),0.232 +/- 0.341 (in 3 folds),0.461,-0.028,0.236,Unknown,126,39,165,0.236364,False
lasso_cv,0.710 +/- 0.101 (in 3 folds),0.710 +/- 0.101 (in 3 folds),0.847 +/- 0.074 (in 3 folds),0.847 +/- 0.074 (in 3 folds),0.631 +/- 0.149 (in 3 folds),-0.061 +/- 0.106 (in 3 folds),0.603,-0.068,,,,,0.458 +/- 0.171 (in 3 folds),-0.039 +/- 0.131 (in 3 folds),0.232 +/- 0.341 (in 3 folds),0.461,-0.028,0.236,Unknown,126,39,165,0.236364,False
lasso_cv.decision_thresholds_tuned,0.710 +/- 0.101 (in 3 folds),0.710 +/- 0.101 (in 3 folds),0.847 +/- 0.074 (in 3 folds),0.847 +/- 0.074 (in 3 folds),0.571 +/- 0.165 (in 3 folds),0.036 +/- 0.240 (in 3 folds),0.524,0.035,,,,,0.401 +/- 0.100 (in 3 folds),0.043 +/- 0.215 (in 3 folds),0.232 +/- 0.341 (in 3 folds),0.4,0.023,0.236,Unknown,126,39,165,0.236364,False
elasticnet_cv,0.708 +/- 0.097 (in 3 folds),0.708 +/- 0.097 (in 3 folds),0.840 +/- 0.077 (in 3 folds),0.840 +/- 0.077 (in 3 folds),0.651 +/- 0.116 (in 3 folds),-0.034 +/- 0.059 (in 3 folds),0.627,-0.032,,,,,0.478 +/- 0.175 (in 3 folds),-0.014 +/- 0.090 (in 3 folds),0.232 +/- 0.341 (in 3 folds),0.479,-0.009,0.236,Unknown,126,39,165,0.236364,False
elasticnet_cv.decision_thresholds_tuned,0.708 +/- 0.097 (in 3 folds),0.708 +/- 0.097 (in 3 folds),0.840 +/- 0.077 (in 3 folds),0.840 +/- 0.077 (in 3 folds),0.565 +/- 0.170 (in 3 folds),0.029 +/- 0.228 (in 3 folds),0.516,0.023,,,,,0.395 +/- 0.096 (in 3 folds),0.036 +/- 0.205 (in 3 folds),0.232 +/- 0.341 (in 3 folds),0.394,0.016,0.236,Unknown,126,39,165,0.236364,False
linearsvm_ovr,0.705 +/- 0.095 (in 3 folds),0.705 +/- 0.095 (in 3 folds),0.840 +/- 0.077 (in 3 folds),0.840 +/- 0.077 (in 3 folds),0.635 +/- 0.147 (in 3 folds),0.168 +/- 0.309 (in 3 folds),0.642,0.178,0.778 +/- 0.000 (in 1 folds),0.778 +/- 0.000 (in 1 folds),0.896 +/- 0.000 (in 1 folds),0.896 +/- 0.000 (in 1 folds),0.624 +/- 0.149 (in 3 folds),0.162 +/- 0.306 (in 3 folds),0.027 +/- 0.010 (in 2 folds),0.63,0.17,0.018,Unknown,162,3,165,0.018182,False
linearsvm_ovr.decision_thresholds_tuned,0.705 +/- 0.095 (in 3 folds),0.705 +/- 0.095 (in 3 folds),0.840 +/- 0.077 (in 3 folds),0.840 +/- 0.077 (in 3 folds),0.593 +/- 0.122 (in 3 folds),0.144 +/- 0.289 (in 3 folds),0.599,0.145,0.778 +/- 0.000 (in 1 folds),0.778 +/- 0.000 (in 1 folds),0.896 +/- 0.000 (in 1 folds),0.896 +/- 0.000 (in 1 folds),0.584 +/- 0.127 (in 3 folds),0.137 +/- 0.286 (in 3 folds),0.027 +/- 0.010 (in 2 folds),0.588,0.14,0.018,Unknown,162,3,165,0.018182,False
lasso_multiclass,0.673 +/- 0.092 (in 3 folds),0.673 +/- 0.092 (in 3 folds),0.818 +/- 0.079 (in 3 folds),0.818 +/- 0.079 (in 3 folds),0.643 +/- 0.099 (in 3 folds),0.187 +/- 0.227 (in 3 folds),0.648,0.195,0.711 +/- 0.000 (in 1 folds),0.711 +/- 0.000 (in 1 folds),0.855 +/- 0.000 (in 1 folds),0.855 +/- 0.000 (in 1 folds),0.632 +/- 0.100 (in 3 folds),0.179 +/- 0.228 (in 3 folds),0.027 +/- 0.010 (in 2 folds),0.636,0.187,0.018,Unknown,162,3,165,0.018182,False
lasso_multiclass.decision_thresholds_tuned,0.673 +/- 0.092 (in 3 folds),0.673 +/- 0.092 (in 3 folds),0.818 +/- 0.079 (in 3 folds),0.818 +/- 0.079 (in 3 folds),0.552 +/- 0.071 (in 3 folds),0.110 +/- 0.254 (in 3 folds),0.556,0.101,0.711 +/- 0.000 (in 1 folds),0.711 +/- 0.000 (in 1 folds),0.855 +/- 0.000 (in 1 folds),0.855 +/- 0.000 (in 1 folds),0.542 +/- 0.071 (in 3 folds),0.104 +/- 0.250 (in 3 folds),0.027 +/- 0.010 (in 2 folds),0.545,0.098,0.018,Unknown,162,3,165,0.018182,False


ridge_cv,ridge_cv.decision_thresholds_tuned,lasso_cv,lasso_cv.decision_thresholds_tuned
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.715 +/- 0.105 (in 3 folds) ROC-AUC (macro OvO): 0.715 +/- 0.105 (in 3 folds) au-PRC (weighted OvO): 0.850 +/- 0.076 (in 3 folds) au-PRC (macro OvO): 0.850 +/- 0.076 (in 3 folds) Accuracy: 0.671 +/- 0.086 (in 3 folds) MCC: 0.000 +/- 0.000 (in 3 folds) Global scores without abstention: Accuracy: 0.651 MCC: 0.000 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.498 +/- 0.185 (in 3 folds) MCC: 0.003 +/- 0.064 (in 3 folds) Unknown/abstention proportion: 0.232 +/- 0.341 (in 3 folds) Global scores with abstention: Accuracy: 0.497 MCC: 0.004 Unknown/abstention proportion: 0.236 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  50+ 0.00 0.00 0.00 58  Unknown 0.00 0.00 0.00 0  under 50 0.65 0.77 0.70 107  accuracy 0.50 165  macro avg 0.22 0.26 0.23 165 weighted avg 0.42 0.50 0.46 165,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.715 +/- 0.105 (in 3 folds) ROC-AUC (macro OvO): 0.715 +/- 0.105 (in 3 folds) au-PRC (weighted OvO): 0.850 +/- 0.076 (in 3 folds) au-PRC (macro OvO): 0.850 +/- 0.076 (in 3 folds) Accuracy: 0.631 +/- 0.149 (in 3 folds) MCC: -0.061 +/- 0.106 (in 3 folds) Global scores without abstention: Accuracy: 0.603 MCC: -0.068 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.458 +/- 0.171 (in 3 folds) MCC: -0.039 +/- 0.131 (in 3 folds) Unknown/abstention proportion: 0.232 +/- 0.341 (in 3 folds) Global scores with abstention: Accuracy: 0.461 MCC: -0.028 Unknown/abstention proportion: 0.236 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  50+ 0.25 0.05 0.09 58  Unknown 0.00 0.00 0.00 0  under 50 0.64 0.68 0.66 107  accuracy 0.46 165  macro avg 0.30 0.24 0.25 165 weighted avg 0.50 0.46 0.46 165,Per-fold scores without abstention: ROC-AUC (weighted OvO): 
0.710 +/- 0.101 (in 3 folds) ROC-AUC (macro OvO): 0.710 +/- 0.101 (in 3 folds) au-PRC (weighted OvO): 0.847 +/- 0.074 (in 3 folds) au-PRC (macro OvO): 0.847 +/- 0.074 (in 3 folds) Accuracy: 0.631 +/- 0.149 (in 3 folds) MCC: -0.061 +/- 0.106 (in 3 folds) Global scores without abstention: Accuracy: 0.603 MCC: -0.068 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.458 +/- 0.171 (in 3 folds) MCC: -0.039 +/- 0.131 (in 3 folds) Unknown/abstention proportion: 0.232 +/- 0.341 (in 3 folds) Global scores with abstention: Accuracy: 0.461 MCC: -0.028 Unknown/abstention proportion: 0.236 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  50+ 0.25 0.05 0.09 58  Unknown 0.00 0.00 0.00 0  under 50 0.64 0.68 0.66 107  accuracy 0.46 165  macro avg 0.30 0.24 0.25 165 weighted avg 0.50 0.46 0.46 165,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.710 +/- 0.101 (in 3 folds) ROC-AUC (macro OvO): 0.710 +/- 0.101 (in 3 folds) au-PRC (weighted OvO): 0.847 +/- 0.074 (in 3 folds) au-PRC (macro OvO): 0.847 +/- 0.074 (in 3 folds) Accuracy: 0.571 +/- 0.165 (in 3 folds) MCC: 0.036 +/- 0.240 (in 3 folds) Global scores without abstention: Accuracy: 0.524 MCC: 0.035 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.401 +/- 0.100 (in 3 folds) MCC: 0.043 +/- 0.215 (in 3 folds) Unknown/abstention proportion: 0.232 +/- 0.341 (in 3 folds) Global scores with abstention: Accuracy: 0.400 MCC: 0.023 Unknown/abstention proportion: 0.236 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  50+ 0.37 0.38 0.37 58  Unknown 0.00 0.00 0.00 0  under 50 0.67 0.41 0.51 107  accuracy 0.40 165  macro avg 0.34 0.26 0.29 165 weighted avg 0.56 0.40 0.46 165
,,,


elasticnet_cv,elasticnet_cv.decision_thresholds_tuned,linearsvm_ovr,linearsvm_ovr.decision_thresholds_tuned
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.708 +/- 0.097 (in 3 folds) ROC-AUC (macro OvO): 0.708 +/- 0.097 (in 3 folds) au-PRC (weighted OvO): 0.840 +/- 0.077 (in 3 folds) au-PRC (macro OvO): 0.840 +/- 0.077 (in 3 folds) Accuracy: 0.651 +/- 0.116 (in 3 folds) MCC: -0.034 +/- 0.059 (in 3 folds) Global scores without abstention: Accuracy: 0.627 MCC: -0.032 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.478 +/- 0.175 (in 3 folds) MCC: -0.014 +/- 0.090 (in 3 folds) Unknown/abstention proportion: 0.232 +/- 0.341 (in 3 folds) Global scores with abstention: Accuracy: 0.479 MCC: -0.009 Unknown/abstention proportion: 0.236 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  50+ 0.29 0.03 0.06 58  Unknown 0.00 0.00 0.00 0  under 50 0.65 0.72 0.68 107  accuracy 0.48 165  macro avg 0.31 0.25 0.25 165 weighted avg 0.52 0.48 0.46 165,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.708 +/- 0.097 (in 3 folds) ROC-AUC (macro OvO): 0.708 +/- 0.097 (in 3 folds) au-PRC (weighted OvO): 0.840 +/- 0.077 (in 3 folds) au-PRC (macro OvO): 0.840 +/- 0.077 (in 3 folds) Accuracy: 0.565 +/- 0.170 (in 3 folds) MCC: 0.029 +/- 0.228 (in 3 folds) Global scores without abstention: Accuracy: 0.516 MCC: 0.023 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.395 +/- 0.096 (in 3 folds) MCC: 0.036 +/- 0.205 (in 3 folds) Unknown/abstention proportion: 0.232 +/- 0.341 (in 3 folds) Global scores with abstention: Accuracy: 0.394 MCC: 0.016 Unknown/abstention proportion: 0.236 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  50+ 0.36 0.38 0.37 58  Unknown 0.00 0.00 0.00 0  under 50 0.66 0.40 0.50 107  accuracy 0.39 165  macro avg 0.34 0.26 0.29 165 weighted avg 0.56 0.39 0.45 165,Per-fold scores without abstention: ROC-AUC (weighted OvO): 
0.705 +/- 0.095 (in 3 folds) ROC-AUC (macro OvO): 0.705 +/- 0.095 (in 3 folds) au-PRC (weighted OvO): 0.840 +/- 0.077 (in 3 folds) au-PRC (macro OvO): 0.840 +/- 0.077 (in 3 folds) Accuracy: 0.635 +/- 0.147 (in 3 folds) MCC: 0.168 +/- 0.309 (in 3 folds) Global scores without abstention: Accuracy: 0.642 MCC: 0.178 Per-fold scores with abstention (note that abstentions not included in probability-based scores): ROC-AUC (weighted OvO): 0.778 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.778 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.896 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.896 +/- 0.000 (in 1 folds) Accuracy: 0.624 +/- 0.149 (in 3 folds) MCC: 0.162 +/- 0.306 (in 3 folds) Unknown/abstention proportion: 0.027 +/- 0.010 (in 2 folds) Global scores with abstention: Accuracy: 0.630 MCC: 0.170 Unknown/abstention proportion: 0.018 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  50+ 0.49 0.38 0.43 58  Unknown 0.00 0.00 0.00 0  under 50 0.70 0.77 0.73 107  accuracy 0.63 165  macro avg 0.40 0.38 0.39 165 weighted avg 0.63 0.63 0.62 165,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.705 +/- 0.095 (in 3 folds) ROC-AUC (macro OvO): 0.705 +/- 0.095 (in 3 folds) au-PRC (weighted OvO): 0.840 +/- 0.077 (in 3 folds) au-PRC (macro OvO): 0.840 +/- 0.077 (in 3 folds) Accuracy: 0.593 +/- 0.122 (in 3 folds) MCC: 0.144 +/- 0.289 (in 3 folds) Global scores without abstention: Accuracy: 0.599 MCC: 0.145 Per-fold scores with abstention (note that abstentions not included in probability-based scores): ROC-AUC (weighted OvO): 0.778 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.778 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.896 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.896 +/- 0.000 (in 1 folds) Accuracy: 0.584 +/- 0.127 (in 3 folds) MCC: 0.137 +/- 0.286 (in 3 folds) Unknown/abstention proportion: 0.027 +/- 0.010 (in 2 folds) Global scores with abstention: Accuracy: 0.588 MCC: 0.140 Unknown/abstention 
proportion: 0.018 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  50+ 0.44 0.48 0.46 58  Unknown 0.00 0.00 0.00 0  under 50 0.70 0.64 0.67 107  accuracy 0.59 165  macro avg 0.38 0.38 0.38 165 weighted avg 0.61 0.59 0.60 165
,,,


lasso_multiclass,lasso_multiclass.decision_thresholds_tuned,rf_multiclass,rf_multiclass.decision_thresholds_tuned
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.673 +/- 0.092 (in 3 folds) ROC-AUC (macro OvO): 0.673 +/- 0.092 (in 3 folds) au-PRC (weighted OvO): 0.818 +/- 0.079 (in 3 folds) au-PRC (macro OvO): 0.818 +/- 0.079 (in 3 folds) Accuracy: 0.643 +/- 0.099 (in 3 folds) MCC: 0.187 +/- 0.227 (in 3 folds) Global scores without abstention: Accuracy: 0.648 MCC: 0.195 Per-fold scores with abstention (note that abstentions not included in probability-based scores): ROC-AUC (weighted OvO): 0.711 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.711 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.855 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.855 +/- 0.000 (in 1 folds) Accuracy: 0.632 +/- 0.100 (in 3 folds) MCC: 0.179 +/- 0.228 (in 3 folds) Unknown/abstention proportion: 0.027 +/- 0.010 (in 2 folds) Global scores with abstention: Accuracy: 0.636 MCC: 0.187 Unknown/abstention proportion: 0.018 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  50+ 0.50 0.40 0.44 58  Unknown 0.00 0.00 0.00 0  under 50 0.71 0.77 0.74 107  accuracy 0.64 165  macro avg 0.40 0.39 0.39 165 weighted avg 0.63 0.64 0.63 165,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.673 +/- 0.092 (in 3 folds) ROC-AUC (macro OvO): 0.673 +/- 0.092 (in 3 folds) au-PRC (weighted OvO): 0.818 +/- 0.079 (in 3 folds) au-PRC (macro OvO): 0.818 +/- 0.079 (in 3 folds) Accuracy: 0.552 +/- 0.071 (in 3 folds) MCC: 0.110 +/- 0.254 (in 3 folds) Global scores without abstention: Accuracy: 0.556 MCC: 0.101 Per-fold scores with abstention (note that abstentions not included in probability-based scores): ROC-AUC (weighted OvO): 0.711 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.711 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.855 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.855 +/- 0.000 (in 1 folds) Accuracy: 0.542 +/- 0.071 (in 3 folds) MCC: 0.104 +/- 0.250 (in 3 folds) Unknown/abstention proportion: 0.027 +/- 0.010 (in 2 folds) Global scores with 
abstention: Accuracy: 0.545 MCC: 0.098 Unknown/abstention proportion: 0.018 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  50+ 0.40 0.53 0.46 58  Unknown 0.00 0.00 0.00 0  under 50 0.69 0.55 0.61 107  accuracy 0.55 165  macro avg 0.37 0.36 0.36 165 weighted avg 0.59 0.55 0.56 165,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.603 +/- 0.172 (in 3 folds) ROC-AUC (macro OvO): 0.603 +/- 0.172 (in 3 folds) au-PRC (weighted OvO): 0.720 +/- 0.159 (in 3 folds) au-PRC (macro OvO): 0.720 +/- 0.159 (in 3 folds) Accuracy: 0.655 +/- 0.108 (in 3 folds) MCC: 0.169 +/- 0.239 (in 3 folds) Global scores without abstention: Accuracy: 0.660 MCC: 0.181 Per-fold scores with abstention (note that abstentions not included in probability-based scores): ROC-AUC (weighted OvO): 0.711 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.711 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.828 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.828 +/- 0.000 (in 1 folds) Accuracy: 0.643 +/- 0.107 (in 3 folds) MCC: 0.159 +/- 0.236 (in 3 folds) Unknown/abstention proportion: 0.027 +/- 0.010 (in 2 folds) Global scores with abstention: Accuracy: 0.648 MCC: 0.170 Unknown/abstention proportion: 0.018 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  50+ 0.53 0.28 0.36 58  Unknown 0.00 0.00 0.00 0  under 50 0.69 0.85 0.76 107  accuracy 0.65 165  macro avg 0.41 0.38 0.38 165 weighted avg 0.63 0.65 0.62 165,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.603 +/- 0.172 (in 3 folds) ROC-AUC (macro OvO): 0.603 +/- 0.172 (in 3 folds) au-PRC (weighted OvO): 0.720 +/- 0.159 (in 3 folds) au-PRC (macro OvO): 0.720 +/- 0.159 (in 3 folds) Accuracy: 0.593 +/- 0.132 (in 3 folds) MCC: 0.121 +/- 0.293 (in 3 folds) Global scores without abstention: Accuracy: 0.599 MCC: 0.110 Per-fold scores with abstention (note that abstentions not included in probability-based scores): ROC-AUC 
(weighted OvO): 0.711 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.711 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.828 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.828 +/- 0.000 (in 1 folds) Accuracy: 0.584 +/- 0.138 (in 3 folds) MCC: 0.114 +/- 0.288 (in 3 folds) Unknown/abstention proportion: 0.027 +/- 0.010 (in 2 folds) Global scores with abstention: Accuracy: 0.588 MCC: 0.105 Unknown/abstention proportion: 0.018 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  50+ 0.43 0.40 0.41 58  Unknown 0.00 0.00 0.00 0  under 50 0.69 0.69 0.69 107  accuracy 0.59 165  macro avg 0.37 0.36 0.37 165 weighted avg 0.59 0.59 0.59 165
,,,


xgboost,xgboost.decision_thresholds_tuned
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.601 +/- 0.199 (in 3 folds) ROC-AUC (macro OvO): 0.601 +/- 0.199 (in 3 folds) au-PRC (weighted OvO): 0.729 +/- 0.174 (in 3 folds) au-PRC (macro OvO): 0.729 +/- 0.174 (in 3 folds) Accuracy: 0.615 +/- 0.161 (in 3 folds) MCC: 0.112 +/- 0.314 (in 3 folds) Global scores without abstention: Accuracy: 0.623 MCC: 0.118 Per-fold scores with abstention (note that abstentions not included in probability-based scores): ROC-AUC (weighted OvO): 0.708 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.708 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.809 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.809 +/- 0.000 (in 1 folds) Accuracy: 0.604 +/- 0.160 (in 3 folds) MCC: 0.106 +/- 0.306 (in 3 folds) Unknown/abstention proportion: 0.027 +/- 0.010 (in 2 folds) Global scores with abstention: Accuracy: 0.612 MCC: 0.112 Unknown/abstention proportion: 0.018 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  50+ 0.45 0.31 0.37 58  Unknown 0.00 0.00 0.00 0  under 50 0.68 0.78 0.72 107  accuracy 0.61 165  macro avg 0.38 0.36 0.36 165 weighted avg 0.60 0.61 0.60 165,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.601 +/- 0.199 (in 3 folds) ROC-AUC (macro OvO): 0.601 +/- 0.199 (in 3 folds) au-PRC (weighted OvO): 0.729 +/- 0.174 (in 3 folds) au-PRC (macro OvO): 0.729 +/- 0.174 (in 3 folds) Accuracy: 0.597 +/- 0.155 (in 3 folds) MCC: 0.116 +/- 0.317 (in 3 folds) Global scores without abstention: Accuracy: 0.605 MCC: 0.113 Per-fold scores with abstention (note that abstentions not included in probability-based scores): ROC-AUC (weighted OvO): 0.708 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.708 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.809 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.809 +/- 0.000 (in 1 folds) Accuracy: 0.587 +/- 0.157 (in 3 folds) MCC: 0.111 +/- 0.311 (in 3 folds) Unknown/abstention proportion: 0.027 +/- 0.010 (in 2 folds) Global scores with 
abstention: Accuracy: 0.594 MCC: 0.108 Unknown/abstention proportion: 0.018 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  50+ 0.43 0.38 0.40 58  Unknown 0.00 0.00 0.00 0  under 50 0.68 0.71 0.70 107  accuracy 0.59 165  macro avg 0.37 0.36 0.37 165 weighted avg 0.60 0.59 0.59 165
,


---

# GeneLocus.TCR, TargetObsColumnEnum.age_group_pediatric_healthy_only trained on train_smaller set

## Specimen predictions on validation set

Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes,Accuracy per fold with abstention,MCC per fold with abstention,Unknown/abstention proportion per fold with abstention,ROC-AUC (weighted OvO) per fold with abstention,ROC-AUC (macro OvO) per fold with abstention,au-PRC (weighted OvO) per fold with abstention,au-PRC (macro OvO) per fold with abstention,Accuracy global with abstention,MCC global with abstention,Unknown/abstention proportion global with abstention,Abstention label global with abstention
linearsvm_ovr,0.954 +/- 0.024 (in 3 folds),0.954 +/- 0.024 (in 3 folds),0.885 +/- 0.042 (in 3 folds),0.885 +/- 0.042 (in 3 folds),0.948 +/- 0.044 (in 3 folds),0.825 +/- 0.113 (in 3 folds),0.947,0.81,114.0,1.0,115.0,0.008696,False,0.940 +/- 0.039 (in 3 folds),0.790 +/- 0.102 (in 3 folds),0.026 +/- 0.000 (in 1 folds),0.939 +/- 0.002 (in 2 folds),0.939 +/- 0.002 (in 2 folds),0.865 +/- 0.034 (in 2 folds),0.865 +/- 0.034 (in 2 folds),0.939,0.78,0.009,Unknown
lasso_multiclass,0.953 +/- 0.041 (in 3 folds),0.953 +/- 0.041 (in 3 folds),0.898 +/- 0.097 (in 3 folds),0.898 +/- 0.097 (in 3 folds),0.939 +/- 0.058 (in 3 folds),0.796 +/- 0.162 (in 3 folds),0.938,0.775,113.0,2.0,115.0,0.017391,False,0.923 +/- 0.051 (in 3 folds),0.736 +/- 0.148 (in 3 folds),0.051 +/- 0.000 (in 1 folds),0.930 +/- 0.011 (in 2 folds),0.930 +/- 0.011 (in 2 folds),0.847 +/- 0.059 (in 2 folds),0.847 +/- 0.059 (in 2 folds),0.922,0.719,0.017,Unknown
xgboost,0.939 +/- 0.032 (in 3 folds),0.939 +/- 0.032 (in 3 folds),0.832 +/- 0.078 (in 3 folds),0.832 +/- 0.078 (in 3 folds),0.939 +/- 0.059 (in 3 folds),0.796 +/- 0.162 (in 3 folds),0.939,0.776,114.0,1.0,115.0,0.008696,False,0.931 +/- 0.053 (in 3 folds),0.762 +/- 0.145 (in 3 folds),0.026 +/- 0.000 (in 1 folds),0.921 +/- 0.007 (in 2 folds),0.921 +/- 0.007 (in 2 folds),0.802 +/- 0.082 (in 2 folds),0.802 +/- 0.082 (in 2 folds),0.93,0.746,0.009,Unknown
lasso_cv,0.936 +/- 0.006 (in 3 folds),0.936 +/- 0.006 (in 3 folds),0.863 +/- 0.024 (in 3 folds),0.863 +/- 0.024 (in 3 folds),0.826 +/- 0.052 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.826,0.0,115.0,0.0,115.0,0.0,True,,,,,,,,,,,
elasticnet_cv,0.936 +/- 0.006 (in 3 folds),0.936 +/- 0.006 (in 3 folds),0.863 +/- 0.024 (in 3 folds),0.863 +/- 0.024 (in 3 folds),0.826 +/- 0.052 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.826,0.0,115.0,0.0,115.0,0.0,True,,,,,,,,,,,
ridge_cv,0.895 +/- 0.077 (in 3 folds),0.895 +/- 0.077 (in 3 folds),0.790 +/- 0.131 (in 3 folds),0.790 +/- 0.131 (in 3 folds),0.826 +/- 0.052 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.826,0.0,115.0,0.0,115.0,0.0,True,,,,,,,,,,,
rf_multiclass,0.877 +/- 0.052 (in 3 folds),0.877 +/- 0.052 (in 3 folds),0.786 +/- 0.100 (in 3 folds),0.786 +/- 0.100 (in 3 folds),0.939 +/- 0.059 (in 3 folds),0.796 +/- 0.162 (in 3 folds),0.939,0.776,114.0,1.0,115.0,0.008696,False,0.931 +/- 0.053 (in 3 folds),0.762 +/- 0.145 (in 3 folds),0.026 +/- 0.000 (in 1 folds),0.866 +/- 0.068 (in 2 folds),0.866 +/- 0.068 (in 2 folds),0.766 +/- 0.133 (in 2 folds),0.766 +/- 0.133 (in 2 folds),0.93,0.746,0.009,Unknown
dummy_most_frequent,0.500 +/- 0.000 (in 3 folds),0.500 +/- 0.000 (in 3 folds),0.174 +/- 0.052 (in 3 folds),0.174 +/- 0.052 (in 3 folds),0.826 +/- 0.052 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.826,0.0,115.0,0.0,115.0,0.0,True,,,,,,,,,,,
dummy_stratified,0.425 +/- 0.106 (in 3 folds),0.425 +/- 0.106 (in 3 folds),0.171 +/- 0.046 (in 3 folds),0.171 +/- 0.046 (in 3 folds),0.633 +/- 0.115 (in 3 folds),-0.127 +/- 0.165 (in 3 folds),0.635,-0.138,115.0,0.0,115.0,0.0,False,,,,,,,,,,,
"All results, sorted",,,,,,,,,,,,,,,,,,,,,,,,

Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes,Accuracy per fold with abstention,MCC per fold with abstention,Unknown/abstention proportion per fold with abstention,ROC-AUC (weighted OvO) per fold with abstention,ROC-AUC (macro OvO) per fold with abstention,au-PRC (weighted OvO) per fold with abstention,au-PRC (macro OvO) per fold with abstention,Accuracy global with abstention,MCC global with abstention,Unknown/abstention proportion global with abstention,Abstention label global with abstention
linearsvm_ovr,0.954 +/- 0.024 (in 3 folds),0.954 +/- 0.024 (in 3 folds),0.885 +/- 0.042 (in 3 folds),0.885 +/- 0.042 (in 3 folds),0.948 +/- 0.044 (in 3 folds),0.825 +/- 0.113 (in 3 folds),0.947,0.81,114,1,115,0.008696,False,0.940 +/- 0.039 (in 3 folds),0.790 +/- 0.102 (in 3 folds),0.026 +/- 0.000 (in 1 folds),0.939 +/- 0.002 (in 2 folds),0.939 +/- 0.002 (in 2 folds),0.865 +/- 0.034 (in 2 folds),0.865 +/- 0.034 (in 2 folds),0.939,0.78,0.009,Unknown
lasso_multiclass,0.953 +/- 0.041 (in 3 folds),0.953 +/- 0.041 (in 3 folds),0.898 +/- 0.097 (in 3 folds),0.898 +/- 0.097 (in 3 folds),0.939 +/- 0.058 (in 3 folds),0.796 +/- 0.162 (in 3 folds),0.938,0.775,113,2,115,0.017391,False,0.923 +/- 0.051 (in 3 folds),0.736 +/- 0.148 (in 3 folds),0.051 +/- 0.000 (in 1 folds),0.930 +/- 0.011 (in 2 folds),0.930 +/- 0.011 (in 2 folds),0.847 +/- 0.059 (in 2 folds),0.847 +/- 0.059 (in 2 folds),0.922,0.719,0.017,Unknown
xgboost,0.939 +/- 0.032 (in 3 folds),0.939 +/- 0.032 (in 3 folds),0.832 +/- 0.078 (in 3 folds),0.832 +/- 0.078 (in 3 folds),0.939 +/- 0.059 (in 3 folds),0.796 +/- 0.162 (in 3 folds),0.939,0.776,114,1,115,0.008696,False,0.931 +/- 0.053 (in 3 folds),0.762 +/- 0.145 (in 3 folds),0.026 +/- 0.000 (in 1 folds),0.921 +/- 0.007 (in 2 folds),0.921 +/- 0.007 (in 2 folds),0.802 +/- 0.082 (in 2 folds),0.802 +/- 0.082 (in 2 folds),0.93,0.746,0.009,Unknown
lasso_cv,0.936 +/- 0.006 (in 3 folds),0.936 +/- 0.006 (in 3 folds),0.863 +/- 0.024 (in 3 folds),0.863 +/- 0.024 (in 3 folds),0.826 +/- 0.052 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.826,0.0,115,0,115,0.0,True,,,,,,,,,,,
elasticnet_cv,0.936 +/- 0.006 (in 3 folds),0.936 +/- 0.006 (in 3 folds),0.863 +/- 0.024 (in 3 folds),0.863 +/- 0.024 (in 3 folds),0.826 +/- 0.052 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.826,0.0,115,0,115,0.0,True,,,,,,,,,,,
ridge_cv,0.895 +/- 0.077 (in 3 folds),0.895 +/- 0.077 (in 3 folds),0.790 +/- 0.131 (in 3 folds),0.790 +/- 0.131 (in 3 folds),0.826 +/- 0.052 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.826,0.0,115,0,115,0.0,True,,,,,,,,,,,
rf_multiclass,0.877 +/- 0.052 (in 3 folds),0.877 +/- 0.052 (in 3 folds),0.786 +/- 0.100 (in 3 folds),0.786 +/- 0.100 (in 3 folds),0.939 +/- 0.059 (in 3 folds),0.796 +/- 0.162 (in 3 folds),0.939,0.776,114,1,115,0.008696,False,0.931 +/- 0.053 (in 3 folds),0.762 +/- 0.145 (in 3 folds),0.026 +/- 0.000 (in 1 folds),0.866 +/- 0.068 (in 2 folds),0.866 +/- 0.068 (in 2 folds),0.766 +/- 0.133 (in 2 folds),0.766 +/- 0.133 (in 2 folds),0.93,0.746,0.009,Unknown
dummy_most_frequent,0.500 +/- 0.000 (in 3 folds),0.500 +/- 0.000 (in 3 folds),0.174 +/- 0.052 (in 3 folds),0.174 +/- 0.052 (in 3 folds),0.826 +/- 0.052 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.826,0.0,115,0,115,0.0,True,,,,,,,,,,,
dummy_stratified,0.425 +/- 0.106 (in 3 folds),0.425 +/- 0.106 (in 3 folds),0.171 +/- 0.046 (in 3 folds),0.171 +/- 0.046 (in 3 folds),0.633 +/- 0.115 (in 3 folds),-0.127 +/- 0.165 (in 3 folds),0.635,-0.138,115,0,115,0.0,False,,,,,,,,,,,


linearsvm_ovr,lasso_multiclass,xgboost,lasso_cv
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.954 +/- 0.024 (in 3 folds) ROC-AUC (macro OvO): 0.954 +/- 0.024 (in 3 folds) au-PRC (weighted OvO): 0.885 +/- 0.042 (in 3 folds) au-PRC (macro OvO): 0.885 +/- 0.042 (in 3 folds) Accuracy: 0.948 +/- 0.044 (in 3 folds) MCC: 0.825 +/- 0.113 (in 3 folds) Global scores without abstention: Accuracy: 0.947 MCC: 0.810 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.940 +/- 0.039 (in 3 folds) MCC: 0.790 +/- 0.102 (in 3 folds) Unknown/abstention proportion: 0.026 +/- 0.000 (in 1 folds) ROC-AUC (weighted OvO): 0.939 +/- 0.002 (in 2 folds) ROC-AUC (macro OvO): 0.939 +/- 0.002 (in 2 folds) au-PRC (weighted OvO): 0.865 +/- 0.034 (in 2 folds) au-PRC (macro OvO): 0.865 +/- 0.034 (in 2 folds) Global scores with abstention: Accuracy: 0.939 MCC: 0.780 Unknown/abstention proportion: 0.009 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  18+ 0.95 0.98 0.96 95  Unknown 0.00 0.00 0.00 0  under 18 0.94 0.75 0.83 20  accuracy 0.94 115  macro avg 0.63 0.58 0.60 115 weighted avg 0.95 0.94 0.94 115,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.953 +/- 0.041 (in 3 folds) ROC-AUC (macro OvO): 0.953 +/- 0.041 (in 3 folds) au-PRC (weighted OvO): 0.898 +/- 0.097 (in 3 folds) au-PRC (macro OvO): 0.898 +/- 0.097 (in 3 folds) Accuracy: 0.939 +/- 0.058 (in 3 folds) MCC: 0.796 +/- 0.162 (in 3 folds) Global scores without abstention: Accuracy: 0.938 MCC: 0.775 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.923 +/- 0.051 (in 3 folds) MCC: 0.736 +/- 0.148 (in 3 folds) Unknown/abstention proportion: 0.051 +/- 0.000 (in 1 folds) ROC-AUC (weighted OvO): 0.930 +/- 0.011 (in 2 folds) ROC-AUC (macro OvO): 0.930 +/- 0.011 (in 2 folds) au-PRC (weighted OvO): 0.847 +/- 0.059 (in 2 folds) au-PRC (macro OvO): 0.847 +/- 0.059 (in 2 folds) Global scores with 
abstention: Accuracy: 0.922 MCC: 0.719 Unknown/abstention proportion: 0.017 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  18+ 0.94 0.97 0.95 95  Unknown 0.00 0.00 0.00 0  under 18 0.93 0.70 0.80 20  accuracy 0.92 115  macro avg 0.62 0.56 0.58 115 weighted avg 0.94 0.92 0.93 115,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.939 +/- 0.032 (in 3 folds) ROC-AUC (macro OvO): 0.939 +/- 0.032 (in 3 folds) au-PRC (weighted OvO): 0.832 +/- 0.078 (in 3 folds) au-PRC (macro OvO): 0.832 +/- 0.078 (in 3 folds) Accuracy: 0.939 +/- 0.059 (in 3 folds) MCC: 0.796 +/- 0.162 (in 3 folds) Global scores without abstention: Accuracy: 0.939 MCC: 0.776 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.931 +/- 0.053 (in 3 folds) MCC: 0.762 +/- 0.145 (in 3 folds) Unknown/abstention proportion: 0.026 +/- 0.000 (in 1 folds) ROC-AUC (weighted OvO): 0.921 +/- 0.007 (in 2 folds) ROC-AUC (macro OvO): 0.921 +/- 0.007 (in 2 folds) au-PRC (weighted OvO): 0.802 +/- 0.082 (in 2 folds) au-PRC (macro OvO): 0.802 +/- 0.082 (in 2 folds) Global scores with abstention: Accuracy: 0.930 MCC: 0.746 Unknown/abstention proportion: 0.009 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  18+ 0.94 0.98 0.96 95  Unknown 0.00 0.00 0.00 0  under 18 0.93 0.70 0.80 20  accuracy 0.93 115  macro avg 0.62 0.56 0.59 115 weighted avg 0.94 0.93 0.93 115,Per-fold scores: ROC-AUC (weighted OvO): 0.936 +/- 0.006 (in 3 folds) ROC-AUC (macro OvO): 0.936 +/- 0.006 (in 3 folds) au-PRC (weighted OvO): 0.863 +/- 0.024 (in 3 folds) au-PRC (macro OvO): 0.863 +/- 0.024 (in 3 folds) Accuracy: 0.826 +/- 0.052 (in 3 folds) MCC: 0.000 +/- 0.000 (in 3 folds) Global scores: Accuracy: 0.826 MCC: 0.000 Global classification report:  precision recall f1-score support  18+ 0.83 1.00 0.90 95  under 18 0.00 0.00 0.00 20  accuracy 0.83 115  macro avg 0.41 
0.50 0.45 115 weighted avg 0.68 0.83 0.75 115
,,,


elasticnet_cv,ridge_cv,rf_multiclass,dummy_most_frequent
Per-fold scores: ROC-AUC (weighted OvO): 0.936 +/- 0.006 (in 3 folds) ROC-AUC (macro OvO): 0.936 +/- 0.006 (in 3 folds) au-PRC (weighted OvO): 0.863 +/- 0.024 (in 3 folds) au-PRC (macro OvO): 0.863 +/- 0.024 (in 3 folds) Accuracy: 0.826 +/- 0.052 (in 3 folds) MCC: 0.000 +/- 0.000 (in 3 folds) Global scores: Accuracy: 0.826 MCC: 0.000 Global classification report:  precision recall f1-score support  18+ 0.83 1.00 0.90 95  under 18 0.00 0.00 0.00 20  accuracy 0.83 115  macro avg 0.41 0.50 0.45 115 weighted avg 0.68 0.83 0.75 115,Per-fold scores: ROC-AUC (weighted OvO): 0.895 +/- 0.077 (in 3 folds) ROC-AUC (macro OvO): 0.895 +/- 0.077 (in 3 folds) au-PRC (weighted OvO): 0.790 +/- 0.131 (in 3 folds) au-PRC (macro OvO): 0.790 +/- 0.131 (in 3 folds) Accuracy: 0.826 +/- 0.052 (in 3 folds) MCC: 0.000 +/- 0.000 (in 3 folds) Global scores: Accuracy: 0.826 MCC: 0.000 Global classification report:  precision recall f1-score support  18+ 0.83 1.00 0.90 95  under 18 0.00 0.00 0.00 20  accuracy 0.83 115  macro avg 0.41 0.50 0.45 115 weighted avg 0.68 0.83 0.75 115,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.877 +/- 0.052 (in 3 folds) ROC-AUC (macro OvO): 0.877 +/- 0.052 (in 3 folds) au-PRC (weighted OvO): 0.786 +/- 0.100 (in 3 folds) au-PRC (macro OvO): 0.786 +/- 0.100 (in 3 folds) Accuracy: 0.939 +/- 0.059 (in 3 folds) MCC: 0.796 +/- 0.162 (in 3 folds) Global scores without abstention: Accuracy: 0.939 MCC: 0.776 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.931 +/- 0.053 (in 3 folds) MCC: 0.762 +/- 0.145 (in 3 folds) Unknown/abstention proportion: 0.026 +/- 0.000 (in 1 folds) ROC-AUC (weighted OvO): 0.866 +/- 0.068 (in 2 folds) ROC-AUC (macro OvO): 0.866 +/- 0.068 (in 2 folds) au-PRC (weighted OvO): 0.766 +/- 0.133 (in 2 folds) au-PRC (macro OvO): 0.766 +/- 0.133 (in 2 folds) Global scores with abstention: Accuracy: 0.930 MCC: 0.746 Unknown/abstention proportion: 0.009 Abstention label: Unknown 
Global classification report with abstention:  precision recall f1-score support  18+ 0.94 0.98 0.96 95  Unknown 0.00 0.00 0.00 0  under 18 0.93 0.70 0.80 20  accuracy 0.93 115  macro avg 0.62 0.56 0.59 115 weighted avg 0.94 0.93 0.93 115,Per-fold scores: ROC-AUC (weighted OvO): 0.500 +/- 0.000 (in 3 folds) ROC-AUC (macro OvO): 0.500 +/- 0.000 (in 3 folds) au-PRC (weighted OvO): 0.174 +/- 0.052 (in 3 folds) au-PRC (macro OvO): 0.174 +/- 0.052 (in 3 folds) Accuracy: 0.826 +/- 0.052 (in 3 folds) MCC: 0.000 +/- 0.000 (in 3 folds) Global scores: Accuracy: 0.826 MCC: 0.000 Global classification report:  precision recall f1-score support  18+ 0.83 1.00 0.90 95  under 18 0.00 0.00 0.00 20  accuracy 0.83 115  macro avg 0.41 0.50 0.45 115 weighted avg 0.68 0.83 0.75 115
,,,


dummy_stratified
Per-fold scores: ROC-AUC (weighted OvO): 0.425 +/- 0.106 (in 3 folds) ROC-AUC (macro OvO): 0.425 +/- 0.106 (in 3 folds) au-PRC (weighted OvO): 0.171 +/- 0.046 (in 3 folds) au-PRC (macro OvO): 0.171 +/- 0.046 (in 3 folds) Accuracy: 0.633 +/- 0.115 (in 3 folds) MCC: -0.127 +/- 0.165 (in 3 folds) Global scores: Accuracy: 0.635 MCC: -0.138 Global classification report:  precision recall f1-score support  18+ 0.80 0.75 0.77 95  under 18 0.08 0.10 0.09 20  accuracy 0.63 115  macro avg 0.44 0.42 0.43 115 weighted avg 0.67 0.63 0.65 115


## Apply train-smaller model -- Test set performance - With and without tuning on validation set



---

# GeneLocus.TCR, TargetObsColumnEnum.sex_healthy_only trained on train_smaller set

## Specimen predictions on validation set

Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,Accuracy per fold with abstention,MCC per fold with abstention,Unknown/abstention proportion per fold with abstention,Accuracy global with abstention,MCC global with abstention,Unknown/abstention proportion global with abstention,Abstention label global with abstention,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes,ROC-AUC (weighted OvO) per fold with abstention,ROC-AUC (macro OvO) per fold with abstention,au-PRC (weighted OvO) per fold with abstention,au-PRC (macro OvO) per fold with abstention
linearsvm_ovr,0.598 +/- 0.035 (in 3 folds),0.598 +/- 0.035 (in 3 folds),0.591 +/- 0.133 (in 3 folds),0.591 +/- 0.133 (in 3 folds),0.576 +/- 0.132 (in 3 folds),0.192 +/- 0.117 (in 3 folds),0.577,0.162,0.556 +/- 0.129 (in 3 folds),0.179 +/- 0.102 (in 3 folds),0.035 +/- 0.016 (in 3 folds),0.557,0.149,0.035,Unknown,111.0,4.0,115.0,0.034783,False,,,,
dummy_stratified,0.598 +/- 0.029 (in 3 folds),0.598 +/- 0.029 (in 3 folds),0.565 +/- 0.170 (in 3 folds),0.565 +/- 0.170 (in 3 folds),0.575 +/- 0.051 (in 3 folds),0.191 +/- 0.064 (in 3 folds),0.574,0.149,0.540 +/- 0.054 (in 3 folds),0.169 +/- 0.059 (in 3 folds),0.061 +/- 0.014 (in 3 folds),0.539,0.133,0.061,Unknown,108.0,7.0,115.0,0.06087,False,,,,
lasso_multiclass,0.594 +/- 0.052 (in 3 folds),0.594 +/- 0.052 (in 3 folds),0.602 +/- 0.132 (in 3 folds),0.602 +/- 0.132 (in 3 folds),0.543 +/- 0.085 (in 3 folds),0.160 +/- 0.070 (in 3 folds),0.541,0.078,0.514 +/- 0.068 (in 3 folds),0.145 +/- 0.050 (in 3 folds),0.052 +/- 0.026 (in 3 folds),0.513,0.07,0.052,Unknown,109.0,6.0,115.0,0.052174,False,,,,
ridge_cv,0.587 +/- 0.064 (in 3 folds),0.587 +/- 0.064 (in 3 folds),0.638 +/- 0.099 (in 3 folds),0.638 +/- 0.099 (in 3 folds),0.393 +/- 0.084 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.393,-0.234,0.384 +/- 0.092 (in 3 folds),0.046 +/- 0.041 (in 3 folds),0.038 +/- 0.018 (in 2 folds),0.383,-0.224,0.026,Unknown,112.0,3.0,115.0,0.026087,False,0.567 +/- 0.000 (in 1 folds),0.567 +/- 0.000 (in 1 folds),0.630 +/- 0.000 (in 1 folds),0.630 +/- 0.000 (in 1 folds)
lasso_cv,0.533 +/- 0.044 (in 3 folds),0.533 +/- 0.044 (in 3 folds),0.551 +/- 0.186 (in 3 folds),0.551 +/- 0.186 (in 3 folds),0.523 +/- 0.015 (in 3 folds),0.176 +/- 0.111 (in 3 folds),0.523,0.045,0.495 +/- 0.015 (in 3 folds),0.144 +/- 0.117 (in 3 folds),0.052 +/- 0.002 (in 3 folds),0.496,0.038,0.052,Unknown,109.0,6.0,115.0,0.052174,False,,,,
rf_multiclass,0.524 +/- 0.035 (in 3 folds),0.524 +/- 0.035 (in 3 folds),0.540 +/- 0.143 (in 3 folds),0.540 +/- 0.143 (in 3 folds),0.528 +/- 0.078 (in 3 folds),0.148 +/- 0.066 (in 3 folds),0.548,0.101,0.401 +/- 0.199 (in 3 folds),0.112 +/- 0.088 (in 3 folds),0.268 +/- 0.290 (in 3 folds),0.4,0.059,0.27,Unknown,84.0,31.0,115.0,0.269565,False,,,,
elasticnet_cv,0.516 +/- 0.040 (in 3 folds),0.516 +/- 0.040 (in 3 folds),0.557 +/- 0.172 (in 3 folds),0.557 +/- 0.172 (in 3 folds),0.537 +/- 0.066 (in 3 folds),0.096 +/- 0.111 (in 3 folds),0.536,0.071,0.513 +/- 0.045 (in 3 folds),0.084 +/- 0.096 (in 3 folds),0.064 +/- 0.018 (in 2 folds),0.513,0.062,0.043,Unknown,110.0,5.0,115.0,0.043478,False,0.480 +/- 0.000 (in 1 folds),0.480 +/- 0.000 (in 1 folds),0.510 +/- 0.000 (in 1 folds),0.510 +/- 0.000 (in 1 folds)
xgboost,0.514 +/- 0.035 (in 3 folds),0.514 +/- 0.035 (in 3 folds),0.530 +/- 0.154 (in 3 folds),0.530 +/- 0.154 (in 3 folds),0.547 +/- 0.035 (in 3 folds),0.109 +/- 0.033 (in 3 folds),0.546,0.091,0.513 +/- 0.026 (in 3 folds),0.094 +/- 0.029 (in 3 folds),0.061 +/- 0.014 (in 3 folds),0.513,0.079,0.061,Unknown,108.0,7.0,115.0,0.06087,False,,,,
dummy_most_frequent,0.500 +/- 0.000 (in 3 folds),0.500 +/- 0.000 (in 3 folds),0.510 +/- 0.155 (in 3 folds),0.510 +/- 0.155 (in 3 folds),0.393 +/- 0.084 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.393,-0.234,0.384 +/- 0.092 (in 3 folds),0.046 +/- 0.041 (in 3 folds),0.038 +/- 0.018 (in 2 folds),0.383,-0.224,0.026,Unknown,112.0,3.0,115.0,0.026087,False,0.500 +/- 0.000 (in 1 folds),0.500 +/- 0.000 (in 1 folds),0.486 +/- 0.000 (in 1 folds),0.486 +/- 0.000 (in 1 folds)
"All results, sorted",,,,,,,,,,,,,,,,,,,,,,,,

Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,Accuracy per fold with abstention,MCC per fold with abstention,Unknown/abstention proportion per fold with abstention,Accuracy global with abstention,MCC global with abstention,Unknown/abstention proportion global with abstention,Abstention label global with abstention,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes,ROC-AUC (weighted OvO) per fold with abstention,ROC-AUC (macro OvO) per fold with abstention,au-PRC (weighted OvO) per fold with abstention,au-PRC (macro OvO) per fold with abstention
linearsvm_ovr,0.598 +/- 0.035 (in 3 folds),0.598 +/- 0.035 (in 3 folds),0.591 +/- 0.133 (in 3 folds),0.591 +/- 0.133 (in 3 folds),0.576 +/- 0.132 (in 3 folds),0.192 +/- 0.117 (in 3 folds),0.577,0.162,0.556 +/- 0.129 (in 3 folds),0.179 +/- 0.102 (in 3 folds),0.035 +/- 0.016 (in 3 folds),0.557,0.149,0.035,Unknown,111,4,115,0.034783,False,,,,
dummy_stratified,0.598 +/- 0.029 (in 3 folds),0.598 +/- 0.029 (in 3 folds),0.565 +/- 0.170 (in 3 folds),0.565 +/- 0.170 (in 3 folds),0.575 +/- 0.051 (in 3 folds),0.191 +/- 0.064 (in 3 folds),0.574,0.149,0.540 +/- 0.054 (in 3 folds),0.169 +/- 0.059 (in 3 folds),0.061 +/- 0.014 (in 3 folds),0.539,0.133,0.061,Unknown,108,7,115,0.06087,False,,,,
lasso_multiclass,0.594 +/- 0.052 (in 3 folds),0.594 +/- 0.052 (in 3 folds),0.602 +/- 0.132 (in 3 folds),0.602 +/- 0.132 (in 3 folds),0.543 +/- 0.085 (in 3 folds),0.160 +/- 0.070 (in 3 folds),0.541,0.078,0.514 +/- 0.068 (in 3 folds),0.145 +/- 0.050 (in 3 folds),0.052 +/- 0.026 (in 3 folds),0.513,0.07,0.052,Unknown,109,6,115,0.052174,False,,,,
ridge_cv,0.587 +/- 0.064 (in 3 folds),0.587 +/- 0.064 (in 3 folds),0.638 +/- 0.099 (in 3 folds),0.638 +/- 0.099 (in 3 folds),0.393 +/- 0.084 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.393,-0.234,0.384 +/- 0.092 (in 3 folds),0.046 +/- 0.041 (in 3 folds),0.038 +/- 0.018 (in 2 folds),0.383,-0.224,0.026,Unknown,112,3,115,0.026087,False,0.567 +/- 0.000 (in 1 folds),0.567 +/- 0.000 (in 1 folds),0.630 +/- 0.000 (in 1 folds),0.630 +/- 0.000 (in 1 folds)
lasso_cv,0.533 +/- 0.044 (in 3 folds),0.533 +/- 0.044 (in 3 folds),0.551 +/- 0.186 (in 3 folds),0.551 +/- 0.186 (in 3 folds),0.523 +/- 0.015 (in 3 folds),0.176 +/- 0.111 (in 3 folds),0.523,0.045,0.495 +/- 0.015 (in 3 folds),0.144 +/- 0.117 (in 3 folds),0.052 +/- 0.002 (in 3 folds),0.496,0.038,0.052,Unknown,109,6,115,0.052174,False,,,,
rf_multiclass,0.524 +/- 0.035 (in 3 folds),0.524 +/- 0.035 (in 3 folds),0.540 +/- 0.143 (in 3 folds),0.540 +/- 0.143 (in 3 folds),0.528 +/- 0.078 (in 3 folds),0.148 +/- 0.066 (in 3 folds),0.548,0.101,0.401 +/- 0.199 (in 3 folds),0.112 +/- 0.088 (in 3 folds),0.268 +/- 0.290 (in 3 folds),0.4,0.059,0.27,Unknown,84,31,115,0.269565,False,,,,
elasticnet_cv,0.516 +/- 0.040 (in 3 folds),0.516 +/- 0.040 (in 3 folds),0.557 +/- 0.172 (in 3 folds),0.557 +/- 0.172 (in 3 folds),0.537 +/- 0.066 (in 3 folds),0.096 +/- 0.111 (in 3 folds),0.536,0.071,0.513 +/- 0.045 (in 3 folds),0.084 +/- 0.096 (in 3 folds),0.064 +/- 0.018 (in 2 folds),0.513,0.062,0.043,Unknown,110,5,115,0.043478,False,0.480 +/- 0.000 (in 1 folds),0.480 +/- 0.000 (in 1 folds),0.510 +/- 0.000 (in 1 folds),0.510 +/- 0.000 (in 1 folds)
xgboost,0.514 +/- 0.035 (in 3 folds),0.514 +/- 0.035 (in 3 folds),0.530 +/- 0.154 (in 3 folds),0.530 +/- 0.154 (in 3 folds),0.547 +/- 0.035 (in 3 folds),0.109 +/- 0.033 (in 3 folds),0.546,0.091,0.513 +/- 0.026 (in 3 folds),0.094 +/- 0.029 (in 3 folds),0.061 +/- 0.014 (in 3 folds),0.513,0.079,0.061,Unknown,108,7,115,0.06087,False,,,,
dummy_most_frequent,0.500 +/- 0.000 (in 3 folds),0.500 +/- 0.000 (in 3 folds),0.510 +/- 0.155 (in 3 folds),0.510 +/- 0.155 (in 3 folds),0.393 +/- 0.084 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.393,-0.234,0.384 +/- 0.092 (in 3 folds),0.046 +/- 0.041 (in 3 folds),0.038 +/- 0.018 (in 2 folds),0.383,-0.224,0.026,Unknown,112,3,115,0.026087,False,0.500 +/- 0.000 (in 1 folds),0.500 +/- 0.000 (in 1 folds),0.486 +/- 0.000 (in 1 folds),0.486 +/- 0.000 (in 1 folds)


linearsvm_ovr,dummy_stratified,lasso_multiclass,ridge_cv
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.598 +/- 0.035 (in 3 folds) ROC-AUC (macro OvO): 0.598 +/- 0.035 (in 3 folds) au-PRC (weighted OvO): 0.591 +/- 0.133 (in 3 folds) au-PRC (macro OvO): 0.591 +/- 0.133 (in 3 folds) Accuracy: 0.576 +/- 0.132 (in 3 folds) MCC: 0.192 +/- 0.117 (in 3 folds) Global scores without abstention: Accuracy: 0.577 MCC: 0.162 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.556 +/- 0.129 (in 3 folds) MCC: 0.179 +/- 0.102 (in 3 folds) Unknown/abstention proportion: 0.035 +/- 0.016 (in 3 folds) Global scores with abstention: Accuracy: 0.557 MCC: 0.149 Unknown/abstention proportion: 0.035 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  F 0.63 0.30 0.41 56  M 0.56 0.80 0.66 59  Unknown 0.00 0.00 0.00 0  accuracy 0.56 115  macro avg 0.40 0.37 0.36 115 weighted avg 0.59 0.56 0.54 115,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.598 +/- 0.029 (in 3 folds) ROC-AUC (macro OvO): 0.598 +/- 0.029 (in 3 folds) au-PRC (weighted OvO): 0.565 +/- 0.170 (in 3 folds) au-PRC (macro OvO): 0.565 +/- 0.170 (in 3 folds) Accuracy: 0.575 +/- 0.051 (in 3 folds) MCC: 0.191 +/- 0.064 (in 3 folds) Global scores without abstention: Accuracy: 0.574 MCC: 0.149 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.540 +/- 0.054 (in 3 folds) MCC: 0.169 +/- 0.059 (in 3 folds) Unknown/abstention proportion: 0.061 +/- 0.014 (in 3 folds) Global scores with abstention: Accuracy: 0.539 MCC: 0.133 Unknown/abstention proportion: 0.061 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  F 0.56 0.55 0.56 56  M 0.58 0.53 0.55 59  Unknown 0.00 0.00 0.00 0  accuracy 0.54 115  macro avg 0.38 0.36 0.37 115 weighted avg 0.57 0.54 0.56 115,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.594 +/- 0.052 (in 3 
folds) ROC-AUC (macro OvO): 0.594 +/- 0.052 (in 3 folds) au-PRC (weighted OvO): 0.602 +/- 0.132 (in 3 folds) au-PRC (macro OvO): 0.602 +/- 0.132 (in 3 folds) Accuracy: 0.543 +/- 0.085 (in 3 folds) MCC: 0.160 +/- 0.070 (in 3 folds) Global scores without abstention: Accuracy: 0.541 MCC: 0.078 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.514 +/- 0.068 (in 3 folds) MCC: 0.145 +/- 0.050 (in 3 folds) Unknown/abstention proportion: 0.052 +/- 0.026 (in 3 folds) Global scores with abstention: Accuracy: 0.513 MCC: 0.070 Unknown/abstention proportion: 0.052 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  F 0.55 0.32 0.40 56  M 0.54 0.69 0.61 59  Unknown 0.00 0.00 0.00 0  accuracy 0.51 115  macro avg 0.36 0.34 0.34 115 weighted avg 0.54 0.51 0.51 115,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.587 +/- 0.064 (in 3 folds) ROC-AUC (macro OvO): 0.587 +/- 0.064 (in 3 folds) au-PRC (weighted OvO): 0.638 +/- 0.099 (in 3 folds) au-PRC (macro OvO): 0.638 +/- 0.099 (in 3 folds) Accuracy: 0.393 +/- 0.084 (in 3 folds) MCC: 0.000 +/- 0.000 (in 3 folds) Global scores without abstention: Accuracy: 0.393 MCC: -0.234 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.384 +/- 0.092 (in 3 folds) MCC: 0.046 +/- 0.041 (in 3 folds) Unknown/abstention proportion: 0.038 +/- 0.018 (in 2 folds) ROC-AUC (weighted OvO): 0.567 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.567 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.630 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.630 +/- 0.000 (in 1 folds) Global scores with abstention: Accuracy: 0.383 MCC: -0.224 Unknown/abstention proportion: 0.026 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  F 0.32 0.21 0.26 56  M 0.43 0.54 0.48 59  Unknown 0.00 0.00 0.00 0  accuracy 0.38 115  macro avg 0.25 0.25 0.25 
115 weighted avg 0.38 0.38 0.37 115
,,,


lasso_cv,rf_multiclass,elasticnet_cv,xgboost
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.533 +/- 0.044 (in 3 folds) ROC-AUC (macro OvO): 0.533 +/- 0.044 (in 3 folds) au-PRC (weighted OvO): 0.551 +/- 0.186 (in 3 folds) au-PRC (macro OvO): 0.551 +/- 0.186 (in 3 folds) Accuracy: 0.523 +/- 0.015 (in 3 folds) MCC: 0.176 +/- 0.111 (in 3 folds) Global scores without abstention: Accuracy: 0.523 MCC: 0.045 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.495 +/- 0.015 (in 3 folds) MCC: 0.144 +/- 0.117 (in 3 folds) Unknown/abstention proportion: 0.052 +/- 0.002 (in 3 folds) Global scores with abstention: Accuracy: 0.496 MCC: 0.038 Unknown/abstention proportion: 0.052 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  F 0.52 0.41 0.46 56  M 0.52 0.58 0.55 59  Unknown 0.00 0.00 0.00 0  accuracy 0.50 115  macro avg 0.35 0.33 0.34 115 weighted avg 0.52 0.50 0.51 115,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.524 +/- 0.035 (in 3 folds) ROC-AUC (macro OvO): 0.524 +/- 0.035 (in 3 folds) au-PRC (weighted OvO): 0.540 +/- 0.143 (in 3 folds) au-PRC (macro OvO): 0.540 +/- 0.143 (in 3 folds) Accuracy: 0.528 +/- 0.078 (in 3 folds) MCC: 0.148 +/- 0.066 (in 3 folds) Global scores without abstention: Accuracy: 0.548 MCC: 0.101 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.401 +/- 0.199 (in 3 folds) MCC: 0.112 +/- 0.088 (in 3 folds) Unknown/abstention proportion: 0.268 +/- 0.290 (in 3 folds) Global scores with abstention: Accuracy: 0.400 MCC: 0.059 Unknown/abstention proportion: 0.270 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  F 0.59 0.41 0.48 56  M 0.51 0.39 0.44 59  Unknown 0.00 0.00 0.00 0  accuracy 0.40 115  macro avg 0.37 0.27 0.31 115 weighted avg 0.55 0.40 0.46 115,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.516 +/- 0.040 (in 3 
folds) ROC-AUC (macro OvO): 0.516 +/- 0.040 (in 3 folds) au-PRC (weighted OvO): 0.557 +/- 0.172 (in 3 folds) au-PRC (macro OvO): 0.557 +/- 0.172 (in 3 folds) Accuracy: 0.537 +/- 0.066 (in 3 folds) MCC: 0.096 +/- 0.111 (in 3 folds) Global scores without abstention: Accuracy: 0.536 MCC: 0.071 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.513 +/- 0.045 (in 3 folds) MCC: 0.084 +/- 0.096 (in 3 folds) Unknown/abstention proportion: 0.064 +/- 0.018 (in 2 folds) ROC-AUC (weighted OvO): 0.480 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.480 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.510 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.510 +/- 0.000 (in 1 folds) Global scores with abstention: Accuracy: 0.513 MCC: 0.062 Unknown/abstention proportion: 0.043 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  F 0.55 0.32 0.40 56  M 0.53 0.69 0.60 59  Unknown 0.00 0.00 0.00 0  accuracy 0.51 115  macro avg 0.36 0.34 0.34 115 weighted avg 0.54 0.51 0.51 115,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.514 +/- 0.035 (in 3 folds) ROC-AUC (macro OvO): 0.514 +/- 0.035 (in 3 folds) au-PRC (weighted OvO): 0.530 +/- 0.154 (in 3 folds) au-PRC (macro OvO): 0.530 +/- 0.154 (in 3 folds) Accuracy: 0.547 +/- 0.035 (in 3 folds) MCC: 0.109 +/- 0.033 (in 3 folds) Global scores without abstention: Accuracy: 0.546 MCC: 0.091 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.513 +/- 0.026 (in 3 folds) MCC: 0.094 +/- 0.029 (in 3 folds) Unknown/abstention proportion: 0.061 +/- 0.014 (in 3 folds) Global scores with abstention: Accuracy: 0.513 MCC: 0.079 Unknown/abstention proportion: 0.061 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  F 0.55 0.39 0.46 56  M 0.54 0.63 0.58 59  Unknown 0.00 0.00 0.00 0  accuracy 0.51 115  macro avg 0.36 0.34 0.35 
115 weighted avg 0.55 0.51 0.52 115
,,,


dummy_most_frequent
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.500 +/- 0.000 (in 3 folds) ROC-AUC (macro OvO): 0.500 +/- 0.000 (in 3 folds) au-PRC (weighted OvO): 0.510 +/- 0.155 (in 3 folds) au-PRC (macro OvO): 0.510 +/- 0.155 (in 3 folds) Accuracy: 0.393 +/- 0.084 (in 3 folds) MCC: 0.000 +/- 0.000 (in 3 folds) Global scores without abstention: Accuracy: 0.393 MCC: -0.234 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.384 +/- 0.092 (in 3 folds) MCC: 0.046 +/- 0.041 (in 3 folds) Unknown/abstention proportion: 0.038 +/- 0.018 (in 2 folds) ROC-AUC (weighted OvO): 0.500 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.500 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.486 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.486 +/- 0.000 (in 1 folds) Global scores with abstention: Accuracy: 0.383 MCC: -0.224 Unknown/abstention proportion: 0.026 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  F 0.32 0.21 0.26 56  M 0.43 0.54 0.48 59  Unknown 0.00 0.00 0.00 0  accuracy 0.38 115  macro avg 0.25 0.25 0.25 115 weighted avg 0.38 0.38 0.37 115


## Apply train-smaller model -- Test set performance - With and without tuning on validation set

Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,Accuracy per fold with abstention,MCC per fold with abstention,Unknown/abstention proportion per fold with abstention,ROC-AUC (weighted OvO) per fold with abstention,ROC-AUC (macro OvO) per fold with abstention,au-PRC (weighted OvO) per fold with abstention,au-PRC (macro OvO) per fold with abstention,Accuracy global with abstention,MCC global with abstention,Unknown/abstention proportion global with abstention,Abstention label global with abstention,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
ridge_cv,0.590 +/- 0.065 (in 3 folds),0.590 +/- 0.065 (in 3 folds),0.630 +/- 0.092 (in 3 folds),0.630 +/- 0.092 (in 3 folds),0.549 +/- 0.062 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.547,0.071,0.537 +/- 0.075 (in 3 folds),0.001 +/- 0.001 (in 3 folds),0.068 +/- 0.000 (in 1 folds),0.621 +/- 0.050 (in 2 folds),0.621 +/- 0.050 (in 2 folds),0.683 +/- 0.015 (in 2 folds),0.683 +/- 0.015 (in 2 folds),0.533,0.068,0.024,Unknown,161.0,4.0,165.0,0.024242,False
ridge_cv.decision_thresholds_tuned,0.590 +/- 0.065 (in 3 folds),0.590 +/- 0.065 (in 3 folds),0.630 +/- 0.092 (in 3 folds),0.630 +/- 0.092 (in 3 folds),0.531 +/- 0.077 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.528,0.033,0.520 +/- 0.088 (in 3 folds),-0.001 +/- 0.001 (in 3 folds),0.068 +/- 0.000 (in 1 folds),0.621 +/- 0.050 (in 2 folds),0.621 +/- 0.050 (in 2 folds),0.683 +/- 0.015 (in 2 folds),0.683 +/- 0.015 (in 2 folds),0.515,0.032,0.024,Unknown,161.0,4.0,165.0,0.024242,False
linearsvm_ovr,0.548 +/- 0.095 (in 3 folds),0.548 +/- 0.095 (in 3 folds),0.614 +/- 0.067 (in 3 folds),0.614 +/- 0.067 (in 3 folds),0.594 +/- 0.085 (in 3 folds),0.154 +/- 0.158 (in 3 folds),0.593,0.158,0.585 +/- 0.099 (in 3 folds),0.162 +/- 0.144 (in 3 folds),0.054 +/- 0.000 (in 1 folds),0.602 +/- 0.019 (in 2 folds),0.602 +/- 0.019 (in 2 folds),0.643 +/- 0.065 (in 2 folds),0.643 +/- 0.065 (in 2 folds),0.582,0.161,0.018,Unknown,162.0,3.0,165.0,0.018182,False
linearsvm_ovr.decision_thresholds_tuned,0.548 +/- 0.095 (in 3 folds),0.548 +/- 0.095 (in 3 folds),0.614 +/- 0.067 (in 3 folds),0.614 +/- 0.067 (in 3 folds),0.592 +/- 0.051 (in 3 folds),0.177 +/- 0.133 (in 3 folds),0.593,0.16,0.580 +/- 0.035 (in 3 folds),0.176 +/- 0.131 (in 3 folds),0.054 +/- 0.000 (in 1 folds),0.602 +/- 0.019 (in 2 folds),0.602 +/- 0.019 (in 2 folds),0.643 +/- 0.065 (in 2 folds),0.643 +/- 0.065 (in 2 folds),0.582,0.161,0.018,Unknown,162.0,3.0,165.0,0.018182,False
lasso_multiclass,0.510 +/- 0.074 (in 3 folds),0.510 +/- 0.074 (in 3 folds),0.587 +/- 0.095 (in 3 folds),0.587 +/- 0.095 (in 3 folds),0.546 +/- 0.064 (in 3 folds),0.025 +/- 0.047 (in 3 folds),0.545,0.055,0.520 +/- 0.088 (in 3 folds),0.030 +/- 0.037 (in 3 folds),0.078 +/- 0.034 (in 2 folds),0.587 +/- 0.000 (in 1 folds),0.587 +/- 0.000 (in 1 folds),0.693 +/- 0.000 (in 1 folds),0.693 +/- 0.000 (in 1 folds),0.515,0.06,0.055,Unknown,156.0,9.0,165.0,0.054545,False
lasso_multiclass.decision_thresholds_tuned,0.510 +/- 0.074 (in 3 folds),0.510 +/- 0.074 (in 3 folds),0.587 +/- 0.095 (in 3 folds),0.587 +/- 0.095 (in 3 folds),0.590 +/- 0.048 (in 3 folds),0.217 +/- 0.071 (in 3 folds),0.59,0.14,0.560 +/- 0.060 (in 3 folds),0.196 +/- 0.083 (in 3 folds),0.078 +/- 0.034 (in 2 folds),0.587 +/- 0.000 (in 1 folds),0.587 +/- 0.000 (in 1 folds),0.693 +/- 0.000 (in 1 folds),0.693 +/- 0.000 (in 1 folds),0.558,0.142,0.055,Unknown,156.0,9.0,165.0,0.054545,False
elasticnet_cv,0.505 +/- 0.087 (in 3 folds),0.505 +/- 0.087 (in 3 folds),0.604 +/- 0.101 (in 3 folds),0.604 +/- 0.101 (in 3 folds),0.498 +/- 0.027 (in 3 folds),-0.016 +/- 0.049 (in 3 folds),0.5,-0.028,0.472 +/- 0.041 (in 3 folds),-0.017 +/- 0.041 (in 3 folds),0.081 +/- 0.029 (in 2 folds),0.601 +/- 0.000 (in 1 folds),0.601 +/- 0.000 (in 1 folds),0.706 +/- 0.000 (in 1 folds),0.706 +/- 0.000 (in 1 folds),0.473,-0.022,0.055,Unknown,156.0,9.0,165.0,0.054545,False
elasticnet_cv.decision_thresholds_tuned,0.505 +/- 0.087 (in 3 folds),0.505 +/- 0.087 (in 3 folds),0.604 +/- 0.101 (in 3 folds),0.604 +/- 0.101 (in 3 folds),0.520 +/- 0.017 (in 3 folds),-0.053 +/- 0.169 (in 3 folds),0.519,-0.096,0.492 +/- 0.015 (in 3 folds),-0.057 +/- 0.136 (in 3 folds),0.081 +/- 0.029 (in 2 folds),0.601 +/- 0.000 (in 1 folds),0.601 +/- 0.000 (in 1 folds),0.706 +/- 0.000 (in 1 folds),0.706 +/- 0.000 (in 1 folds),0.491,-0.05,0.055,Unknown,156.0,9.0,165.0,0.054545,False
lasso_cv,0.477 +/- 0.056 (in 3 folds),0.477 +/- 0.056 (in 3 folds),0.563 +/- 0.036 (in 3 folds),0.563 +/- 0.036 (in 3 folds),0.526 +/- 0.051 (in 3 folds),0.034 +/- 0.114 (in 3 folds),0.529,0.05,0.494 +/- 0.047 (in 3 folds),0.055 +/- 0.103 (in 3 folds),0.060 +/- 0.007 (in 3 folds),,,,,0.497,0.046,0.061,Unknown,155.0,10.0,165.0,0.060606,False
lasso_cv.decision_thresholds_tuned,0.477 +/- 0.056 (in 3 folds),0.477 +/- 0.056 (in 3 folds),0.563 +/- 0.036 (in 3 folds),0.563 +/- 0.036 (in 3 folds),0.551 +/- 0.078 (in 3 folds),0.108 +/- 0.160 (in 3 folds),0.555,0.112,0.518 +/- 0.075 (in 3 folds),0.102 +/- 0.155 (in 3 folds),0.060 +/- 0.007 (in 3 folds),,,,,0.521,0.099,0.061,Unknown,155.0,10.0,165.0,0.060606,False

Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,Accuracy per fold with abstention,MCC per fold with abstention,Unknown/abstention proportion per fold with abstention,ROC-AUC (weighted OvO) per fold with abstention,ROC-AUC (macro OvO) per fold with abstention,au-PRC (weighted OvO) per fold with abstention,au-PRC (macro OvO) per fold with abstention,Accuracy global with abstention,MCC global with abstention,Unknown/abstention proportion global with abstention,Abstention label global with abstention,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
ridge_cv,0.590 +/- 0.065 (in 3 folds),0.590 +/- 0.065 (in 3 folds),0.630 +/- 0.092 (in 3 folds),0.630 +/- 0.092 (in 3 folds),0.549 +/- 0.062 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.547,0.071,0.537 +/- 0.075 (in 3 folds),0.001 +/- 0.001 (in 3 folds),0.068 +/- 0.000 (in 1 folds),0.621 +/- 0.050 (in 2 folds),0.621 +/- 0.050 (in 2 folds),0.683 +/- 0.015 (in 2 folds),0.683 +/- 0.015 (in 2 folds),0.533,0.068,0.024,Unknown,161,4,165,0.024242,False
ridge_cv.decision_thresholds_tuned,0.590 +/- 0.065 (in 3 folds),0.590 +/- 0.065 (in 3 folds),0.630 +/- 0.092 (in 3 folds),0.630 +/- 0.092 (in 3 folds),0.531 +/- 0.077 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.528,0.033,0.520 +/- 0.088 (in 3 folds),-0.001 +/- 0.001 (in 3 folds),0.068 +/- 0.000 (in 1 folds),0.621 +/- 0.050 (in 2 folds),0.621 +/- 0.050 (in 2 folds),0.683 +/- 0.015 (in 2 folds),0.683 +/- 0.015 (in 2 folds),0.515,0.032,0.024,Unknown,161,4,165,0.024242,False
linearsvm_ovr,0.548 +/- 0.095 (in 3 folds),0.548 +/- 0.095 (in 3 folds),0.614 +/- 0.067 (in 3 folds),0.614 +/- 0.067 (in 3 folds),0.594 +/- 0.085 (in 3 folds),0.154 +/- 0.158 (in 3 folds),0.593,0.158,0.585 +/- 0.099 (in 3 folds),0.162 +/- 0.144 (in 3 folds),0.054 +/- 0.000 (in 1 folds),0.602 +/- 0.019 (in 2 folds),0.602 +/- 0.019 (in 2 folds),0.643 +/- 0.065 (in 2 folds),0.643 +/- 0.065 (in 2 folds),0.582,0.161,0.018,Unknown,162,3,165,0.018182,False
linearsvm_ovr.decision_thresholds_tuned,0.548 +/- 0.095 (in 3 folds),0.548 +/- 0.095 (in 3 folds),0.614 +/- 0.067 (in 3 folds),0.614 +/- 0.067 (in 3 folds),0.592 +/- 0.051 (in 3 folds),0.177 +/- 0.133 (in 3 folds),0.593,0.16,0.580 +/- 0.035 (in 3 folds),0.176 +/- 0.131 (in 3 folds),0.054 +/- 0.000 (in 1 folds),0.602 +/- 0.019 (in 2 folds),0.602 +/- 0.019 (in 2 folds),0.643 +/- 0.065 (in 2 folds),0.643 +/- 0.065 (in 2 folds),0.582,0.161,0.018,Unknown,162,3,165,0.018182,False
lasso_multiclass,0.510 +/- 0.074 (in 3 folds),0.510 +/- 0.074 (in 3 folds),0.587 +/- 0.095 (in 3 folds),0.587 +/- 0.095 (in 3 folds),0.546 +/- 0.064 (in 3 folds),0.025 +/- 0.047 (in 3 folds),0.545,0.055,0.520 +/- 0.088 (in 3 folds),0.030 +/- 0.037 (in 3 folds),0.078 +/- 0.034 (in 2 folds),0.587 +/- 0.000 (in 1 folds),0.587 +/- 0.000 (in 1 folds),0.693 +/- 0.000 (in 1 folds),0.693 +/- 0.000 (in 1 folds),0.515,0.06,0.055,Unknown,156,9,165,0.054545,False
lasso_multiclass.decision_thresholds_tuned,0.510 +/- 0.074 (in 3 folds),0.510 +/- 0.074 (in 3 folds),0.587 +/- 0.095 (in 3 folds),0.587 +/- 0.095 (in 3 folds),0.590 +/- 0.048 (in 3 folds),0.217 +/- 0.071 (in 3 folds),0.59,0.14,0.560 +/- 0.060 (in 3 folds),0.196 +/- 0.083 (in 3 folds),0.078 +/- 0.034 (in 2 folds),0.587 +/- 0.000 (in 1 folds),0.587 +/- 0.000 (in 1 folds),0.693 +/- 0.000 (in 1 folds),0.693 +/- 0.000 (in 1 folds),0.558,0.142,0.055,Unknown,156,9,165,0.054545,False
elasticnet_cv,0.505 +/- 0.087 (in 3 folds),0.505 +/- 0.087 (in 3 folds),0.604 +/- 0.101 (in 3 folds),0.604 +/- 0.101 (in 3 folds),0.498 +/- 0.027 (in 3 folds),-0.016 +/- 0.049 (in 3 folds),0.5,-0.028,0.472 +/- 0.041 (in 3 folds),-0.017 +/- 0.041 (in 3 folds),0.081 +/- 0.029 (in 2 folds),0.601 +/- 0.000 (in 1 folds),0.601 +/- 0.000 (in 1 folds),0.706 +/- 0.000 (in 1 folds),0.706 +/- 0.000 (in 1 folds),0.473,-0.022,0.055,Unknown,156,9,165,0.054545,False
elasticnet_cv.decision_thresholds_tuned,0.505 +/- 0.087 (in 3 folds),0.505 +/- 0.087 (in 3 folds),0.604 +/- 0.101 (in 3 folds),0.604 +/- 0.101 (in 3 folds),0.520 +/- 0.017 (in 3 folds),-0.053 +/- 0.169 (in 3 folds),0.519,-0.096,0.492 +/- 0.015 (in 3 folds),-0.057 +/- 0.136 (in 3 folds),0.081 +/- 0.029 (in 2 folds),0.601 +/- 0.000 (in 1 folds),0.601 +/- 0.000 (in 1 folds),0.706 +/- 0.000 (in 1 folds),0.706 +/- 0.000 (in 1 folds),0.491,-0.05,0.055,Unknown,156,9,165,0.054545,False
lasso_cv,0.477 +/- 0.056 (in 3 folds),0.477 +/- 0.056 (in 3 folds),0.563 +/- 0.036 (in 3 folds),0.563 +/- 0.036 (in 3 folds),0.526 +/- 0.051 (in 3 folds),0.034 +/- 0.114 (in 3 folds),0.529,0.05,0.494 +/- 0.047 (in 3 folds),0.055 +/- 0.103 (in 3 folds),0.060 +/- 0.007 (in 3 folds),,,,,0.497,0.046,0.061,Unknown,155,10,165,0.060606,False
lasso_cv.decision_thresholds_tuned,0.477 +/- 0.056 (in 3 folds),0.477 +/- 0.056 (in 3 folds),0.563 +/- 0.036 (in 3 folds),0.563 +/- 0.036 (in 3 folds),0.551 +/- 0.078 (in 3 folds),0.108 +/- 0.160 (in 3 folds),0.555,0.112,0.518 +/- 0.075 (in 3 folds),0.102 +/- 0.155 (in 3 folds),0.060 +/- 0.007 (in 3 folds),,,,,0.521,0.099,0.061,Unknown,155,10,165,0.060606,False


ridge_cv,ridge_cv.decision_thresholds_tuned,linearsvm_ovr,linearsvm_ovr.decision_thresholds_tuned
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.590 +/- 0.065 (in 3 folds) ROC-AUC (macro OvO): 0.590 +/- 0.065 (in 3 folds) au-PRC (weighted OvO): 0.630 +/- 0.092 (in 3 folds) au-PRC (macro OvO): 0.630 +/- 0.092 (in 3 folds) Accuracy: 0.549 +/- 0.062 (in 3 folds) MCC: 0.000 +/- 0.000 (in 3 folds) Global scores without abstention: Accuracy: 0.547 MCC: 0.071 Per-fold scores with abstention (note that abstentions not included in probability-based scores): ROC-AUC (weighted OvO): 0.621 +/- 0.050 (in 2 folds) ROC-AUC (macro OvO): 0.621 +/- 0.050 (in 2 folds) au-PRC (weighted OvO): 0.683 +/- 0.015 (in 2 folds) au-PRC (macro OvO): 0.683 +/- 0.015 (in 2 folds) Accuracy: 0.537 +/- 0.075 (in 3 folds) MCC: 0.001 +/- 0.001 (in 3 folds) Unknown/abstention proportion: 0.068 +/- 0.000 (in 1 folds) Global scores with abstention: Accuracy: 0.533 MCC: 0.068 Unknown/abstention proportion: 0.024 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  F 0.51 0.37 0.43 76  M 0.57 0.67 0.62 89  Unknown 0.00 0.00 0.00 0  accuracy 0.53 165  macro avg 0.36 0.35 0.35 165 weighted avg 0.54 0.53 0.53 165,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.590 +/- 0.065 (in 3 folds) ROC-AUC (macro OvO): 0.590 +/- 0.065 (in 3 folds) au-PRC (weighted OvO): 0.630 +/- 0.092 (in 3 folds) au-PRC (macro OvO): 0.630 +/- 0.092 (in 3 folds) Accuracy: 0.531 +/- 0.077 (in 3 folds) MCC: 0.000 +/- 0.000 (in 3 folds) Global scores without abstention: Accuracy: 0.528 MCC: 0.033 Per-fold scores with abstention (note that abstentions not included in probability-based scores): ROC-AUC (weighted OvO): 0.621 +/- 0.050 (in 2 folds) ROC-AUC (macro OvO): 0.621 +/- 0.050 (in 2 folds) au-PRC (weighted OvO): 0.683 +/- 0.015 (in 2 folds) au-PRC (macro OvO): 0.683 +/- 0.015 (in 2 folds) Accuracy: 0.520 +/- 0.088 (in 3 folds) MCC: -0.001 +/- 0.001 (in 3 folds) Unknown/abstention proportion: 0.068 +/- 0.000 (in 1 folds) Global scores with 
abstention: Accuracy: 0.515 MCC: 0.032 Unknown/abstention proportion: 0.024 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  F 0.48 0.36 0.41 76  M 0.55 0.65 0.60 89  Unknown 0.00 0.00 0.00 0  accuracy 0.52 165  macro avg 0.34 0.34 0.34 165 weighted avg 0.52 0.52 0.51 165,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.548 +/- 0.095 (in 3 folds) ROC-AUC (macro OvO): 0.548 +/- 0.095 (in 3 folds) au-PRC (weighted OvO): 0.614 +/- 0.067 (in 3 folds) au-PRC (macro OvO): 0.614 +/- 0.067 (in 3 folds) Accuracy: 0.594 +/- 0.085 (in 3 folds) MCC: 0.154 +/- 0.158 (in 3 folds) Global scores without abstention: Accuracy: 0.593 MCC: 0.158 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.585 +/- 0.099 (in 3 folds) MCC: 0.162 +/- 0.144 (in 3 folds) Unknown/abstention proportion: 0.054 +/- 0.000 (in 1 folds) ROC-AUC (weighted OvO): 0.602 +/- 0.019 (in 2 folds) ROC-AUC (macro OvO): 0.602 +/- 0.019 (in 2 folds) au-PRC (weighted OvO): 0.643 +/- 0.065 (in 2 folds) au-PRC (macro OvO): 0.643 +/- 0.065 (in 2 folds) Global scores with abstention: Accuracy: 0.582 MCC: 0.161 Unknown/abstention proportion: 0.018 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  F 0.58 0.34 0.43 76  M 0.60 0.79 0.68 89  Unknown 0.00 0.00 0.00 0  accuracy 0.58 165  macro avg 0.39 0.38 0.37 165 weighted avg 0.59 0.58 0.56 165,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.548 +/- 0.095 (in 3 folds) ROC-AUC (macro OvO): 0.548 +/- 0.095 (in 3 folds) au-PRC (weighted OvO): 0.614 +/- 0.067 (in 3 folds) au-PRC (macro OvO): 0.614 +/- 0.067 (in 3 folds) Accuracy: 0.592 +/- 0.051 (in 3 folds) MCC: 0.177 +/- 0.133 (in 3 folds) Global scores without abstention: Accuracy: 0.593 MCC: 0.160 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.580 +/- 0.035 (in 3 
folds) MCC: 0.176 +/- 0.131 (in 3 folds) Unknown/abstention proportion: 0.054 +/- 0.000 (in 1 folds) ROC-AUC (weighted OvO): 0.602 +/- 0.019 (in 2 folds) ROC-AUC (macro OvO): 0.602 +/- 0.019 (in 2 folds) au-PRC (weighted OvO): 0.643 +/- 0.065 (in 2 folds) au-PRC (macro OvO): 0.643 +/- 0.065 (in 2 folds) Global scores with abstention: Accuracy: 0.582 MCC: 0.161 Unknown/abstention proportion: 0.018 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  F 0.57 0.37 0.45 76  M 0.60 0.76 0.67 89  Unknown 0.00 0.00 0.00 0  accuracy 0.58 165  macro avg 0.39 0.38 0.37 165 weighted avg 0.59 0.58 0.57 165
,,,


lasso_multiclass,lasso_multiclass.decision_thresholds_tuned,elasticnet_cv,elasticnet_cv.decision_thresholds_tuned
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.510 +/- 0.074 (in 3 folds) ROC-AUC (macro OvO): 0.510 +/- 0.074 (in 3 folds) au-PRC (weighted OvO): 0.587 +/- 0.095 (in 3 folds) au-PRC (macro OvO): 0.587 +/- 0.095 (in 3 folds) Accuracy: 0.546 +/- 0.064 (in 3 folds) MCC: 0.025 +/- 0.047 (in 3 folds) Global scores without abstention: Accuracy: 0.545 MCC: 0.055 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.520 +/- 0.088 (in 3 folds) MCC: 0.030 +/- 0.037 (in 3 folds) Unknown/abstention proportion: 0.078 +/- 0.034 (in 2 folds) ROC-AUC (weighted OvO): 0.587 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.587 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.693 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.693 +/- 0.000 (in 1 folds) Global scores with abstention: Accuracy: 0.515 MCC: 0.060 Unknown/abstention proportion: 0.055 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  F 0.48 0.33 0.39 76  M 0.58 0.67 0.62 89  Unknown 0.00 0.00 0.00 0  accuracy 0.52 165  macro avg 0.35 0.33 0.34 165 weighted avg 0.53 0.52 0.52 165,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.510 +/- 0.074 (in 3 folds) ROC-AUC (macro OvO): 0.510 +/- 0.074 (in 3 folds) au-PRC (weighted OvO): 0.587 +/- 0.095 (in 3 folds) au-PRC (macro OvO): 0.587 +/- 0.095 (in 3 folds) Accuracy: 0.590 +/- 0.048 (in 3 folds) MCC: 0.217 +/- 0.071 (in 3 folds) Global scores without abstention: Accuracy: 0.590 MCC: 0.140 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.560 +/- 0.060 (in 3 folds) MCC: 0.196 +/- 0.083 (in 3 folds) Unknown/abstention proportion: 0.078 +/- 0.034 (in 2 folds) ROC-AUC (weighted OvO): 0.587 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.587 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.693 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.693 +/- 0.000 (in 1 folds) Global scores with abstention: 
Accuracy: 0.558 MCC: 0.142 Unknown/abstention proportion: 0.055 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  F 0.57 0.26 0.36 76  M 0.60 0.81 0.69 89  Unknown 0.00 0.00 0.00 0  accuracy 0.56 165  macro avg 0.39 0.36 0.35 165 weighted avg 0.58 0.56 0.54 165,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.505 +/- 0.087 (in 3 folds) ROC-AUC (macro OvO): 0.505 +/- 0.087 (in 3 folds) au-PRC (weighted OvO): 0.604 +/- 0.101 (in 3 folds) au-PRC (macro OvO): 0.604 +/- 0.101 (in 3 folds) Accuracy: 0.498 +/- 0.027 (in 3 folds) MCC: -0.016 +/- 0.049 (in 3 folds) Global scores without abstention: Accuracy: 0.500 MCC: -0.028 Per-fold scores with abstention (note that abstentions not included in probability-based scores): ROC-AUC (weighted OvO): 0.601 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.601 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.706 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.706 +/- 0.000 (in 1 folds) Accuracy: 0.472 +/- 0.041 (in 3 folds) MCC: -0.017 +/- 0.041 (in 3 folds) Unknown/abstention proportion: 0.081 +/- 0.029 (in 2 folds) Global scores with abstention: Accuracy: 0.473 MCC: -0.022 Unknown/abstention proportion: 0.055 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  F 0.44 0.32 0.37 76  M 0.53 0.61 0.57 89  Unknown 0.00 0.00 0.00 0  accuracy 0.47 165  macro avg 0.32 0.31 0.31 165 weighted avg 0.49 0.47 0.48 165,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.505 +/- 0.087 (in 3 folds) ROC-AUC (macro OvO): 0.505 +/- 0.087 (in 3 folds) au-PRC (weighted OvO): 0.604 +/- 0.101 (in 3 folds) au-PRC (macro OvO): 0.604 +/- 0.101 (in 3 folds) Accuracy: 0.520 +/- 0.017 (in 3 folds) MCC: -0.053 +/- 0.169 (in 3 folds) Global scores without abstention: Accuracy: 0.519 MCC: -0.096 Per-fold scores with abstention (note that abstentions not included in probability-based scores): ROC-AUC (weighted OvO): 0.601 +/- 0.000 
(in 1 folds) ROC-AUC (macro OvO): 0.601 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.706 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.706 +/- 0.000 (in 1 folds) Accuracy: 0.492 +/- 0.015 (in 3 folds) MCC: -0.057 +/- 0.136 (in 3 folds) Unknown/abstention proportion: 0.081 +/- 0.029 (in 2 folds) Global scores with abstention: Accuracy: 0.491 MCC: -0.050 Unknown/abstention proportion: 0.055 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  F 0.25 0.03 0.05 76  M 0.53 0.89 0.67 89  Unknown 0.00 0.00 0.00 0  accuracy 0.49 165  macro avg 0.26 0.30 0.24 165 weighted avg 0.40 0.49 0.38 165
,,,


lasso_cv,lasso_cv.decision_thresholds_tuned,xgboost,xgboost.decision_thresholds_tuned
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.477 +/- 0.056 (in 3 folds) ROC-AUC (macro OvO): 0.477 +/- 0.056 (in 3 folds) au-PRC (weighted OvO): 0.563 +/- 0.036 (in 3 folds) au-PRC (macro OvO): 0.563 +/- 0.036 (in 3 folds) Accuracy: 0.526 +/- 0.051 (in 3 folds) MCC: 0.034 +/- 0.114 (in 3 folds) Global scores without abstention: Accuracy: 0.529 MCC: 0.050 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.494 +/- 0.047 (in 3 folds) MCC: 0.055 +/- 0.103 (in 3 folds) Unknown/abstention proportion: 0.060 +/- 0.007 (in 3 folds) Global scores with abstention: Accuracy: 0.497 MCC: 0.046 Unknown/abstention proportion: 0.061 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  F 0.48 0.45 0.46 76  M 0.57 0.54 0.55 89  Unknown 0.00 0.00 0.00 0  accuracy 0.50 165  macro avg 0.35 0.33 0.34 165 weighted avg 0.53 0.50 0.51 165,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.477 +/- 0.056 (in 3 folds) ROC-AUC (macro OvO): 0.477 +/- 0.056 (in 3 folds) au-PRC (weighted OvO): 0.563 +/- 0.036 (in 3 folds) au-PRC (macro OvO): 0.563 +/- 0.036 (in 3 folds) Accuracy: 0.551 +/- 0.078 (in 3 folds) MCC: 0.108 +/- 0.160 (in 3 folds) Global scores without abstention: Accuracy: 0.555 MCC: 0.112 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.518 +/- 0.075 (in 3 folds) MCC: 0.102 +/- 0.155 (in 3 folds) Unknown/abstention proportion: 0.060 +/- 0.007 (in 3 folds) Global scores with abstention: Accuracy: 0.521 MCC: 0.099 Unknown/abstention proportion: 0.061 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  F 0.51 0.53 0.52 76  M 0.61 0.52 0.56 89  Unknown 0.00 0.00 0.00 0  accuracy 0.52 165  macro avg 0.37 0.35 0.36 165 weighted avg 0.56 0.52 0.54 165,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.475 +/- 0.069 (in 3 
folds) ROC-AUC (macro OvO): 0.475 +/- 0.069 (in 3 folds) au-PRC (weighted OvO): 0.545 +/- 0.073 (in 3 folds) au-PRC (macro OvO): 0.545 +/- 0.073 (in 3 folds) Accuracy: 0.539 +/- 0.073 (in 3 folds) MCC: 0.055 +/- 0.137 (in 3 folds) Global scores without abstention: Accuracy: 0.536 MCC: 0.048 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.501 +/- 0.078 (in 3 folds) MCC: 0.060 +/- 0.116 (in 3 folds) Unknown/abstention proportion: 0.072 +/- 0.026 (in 3 folds) Global scores with abstention: Accuracy: 0.497 MCC: 0.048 Unknown/abstention proportion: 0.073 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  F 0.47 0.37 0.41 76  M 0.57 0.61 0.59 89  Unknown 0.00 0.00 0.00 0  accuracy 0.50 165  macro avg 0.35 0.33 0.33 165 weighted avg 0.53 0.50 0.51 165,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.475 +/- 0.069 (in 3 folds) ROC-AUC (macro OvO): 0.475 +/- 0.069 (in 3 folds) au-PRC (weighted OvO): 0.545 +/- 0.073 (in 3 folds) au-PRC (macro OvO): 0.545 +/- 0.073 (in 3 folds) Accuracy: 0.570 +/- 0.055 (in 3 folds) MCC: 0.125 +/- 0.094 (in 3 folds) Global scores without abstention: Accuracy: 0.569 MCC: 0.117 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.530 +/- 0.064 (in 3 folds) MCC: 0.122 +/- 0.095 (in 3 folds) Unknown/abstention proportion: 0.072 +/- 0.026 (in 3 folds) Global scores with abstention: Accuracy: 0.527 MCC: 0.107 Unknown/abstention proportion: 0.073 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  F 0.52 0.41 0.46 76  M 0.60 0.63 0.62 89  Unknown 0.00 0.00 0.00 0  accuracy 0.53 165  macro avg 0.37 0.35 0.36 165 weighted avg 0.56 0.53 0.54 165
,,,


rf_multiclass,rf_multiclass.decision_thresholds_tuned
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.429 +/- 0.022 (in 3 folds) ROC-AUC (macro OvO): 0.429 +/- 0.022 (in 3 folds) au-PRC (weighted OvO): 0.573 +/- 0.126 (in 3 folds) au-PRC (macro OvO): 0.573 +/- 0.126 (in 3 folds) Accuracy: 0.435 +/- 0.130 (in 3 folds) MCC: -0.079 +/- 0.108 (in 3 folds) Global scores without abstention: Accuracy: 0.481 MCC: -0.078 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.321 +/- 0.231 (in 3 folds) MCC: -0.064 +/- 0.056 (in 3 folds) Unknown/abstention proportion: 0.506 +/- 0.363 (in 2 folds) ROC-AUC (weighted OvO): 0.410 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.410 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.585 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.585 +/- 0.000 (in 1 folds) Global scores with abstention: Accuracy: 0.309 MCC: -0.032 Unknown/abstention proportion: 0.358 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  F 0.38 0.20 0.26 76  M 0.55 0.40 0.46 89  Unknown 0.00 0.00 0.00 0  accuracy 0.31 165  macro avg 0.31 0.20 0.24 165 weighted avg 0.47 0.31 0.37 165,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.429 +/- 0.022 (in 3 folds) ROC-AUC (macro OvO): 0.429 +/- 0.022 (in 3 folds) au-PRC (weighted OvO): 0.573 +/- 0.126 (in 3 folds) au-PRC (macro OvO): 0.573 +/- 0.126 (in 3 folds) Accuracy: 0.435 +/- 0.130 (in 3 folds) MCC: -0.079 +/- 0.108 (in 3 folds) Global scores without abstention: Accuracy: 0.481 MCC: -0.078 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.321 +/- 0.231 (in 3 folds) MCC: -0.064 +/- 0.056 (in 3 folds) Unknown/abstention proportion: 0.506 +/- 0.363 (in 2 folds) ROC-AUC (weighted OvO): 0.410 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.410 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.585 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.585 +/- 0.000 (in 1 folds) Global scores with 
abstention: Accuracy: 0.309 MCC: -0.032 Unknown/abstention proportion: 0.358 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support  F 0.38 0.20 0.26 76  M 0.55 0.40 0.46 89  Unknown 0.00 0.00 0.00 0  accuracy 0.31 165  macro avg 0.31 0.20 0.24 165 weighted avg 0.47 0.31 0.37 165
,


---

# GeneLocus.TCR, TargetObsColumnEnum.covid_vs_healthy trained on train_smaller set

## Specimen predictions on validation set

Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
linearsvm_ovr,0.964 +/- 0.039 (in 3 folds),0.964 +/- 0.039 (in 3 folds),0.991 +/- 0.010 (in 3 folds),0.991 +/- 0.010 (in 3 folds),0.911 +/- 0.063 (in 3 folds),0.791 +/- 0.107 (in 3 folds),0.911,0.772,168.0,0.0,168.0,0.0,False
lasso_multiclass,0.964 +/- 0.039 (in 3 folds),0.964 +/- 0.039 (in 3 folds),0.990 +/- 0.010 (in 3 folds),0.990 +/- 0.010 (in 3 folds),0.923 +/- 0.044 (in 3 folds),0.799 +/- 0.095 (in 3 folds),0.923,0.791,168.0,0.0,168.0,0.0,False
lasso_cv,0.962 +/- 0.040 (in 3 folds),0.962 +/- 0.040 (in 3 folds),0.990 +/- 0.010 (in 3 folds),0.990 +/- 0.010 (in 3 folds),0.815 +/- 0.028 (in 3 folds),0.382 +/- 0.148 (in 3 folds),0.815,0.385,168.0,0.0,168.0,0.0,False
xgboost,0.962 +/- 0.029 (in 3 folds),0.962 +/- 0.029 (in 3 folds),0.987 +/- 0.008 (in 3 folds),0.987 +/- 0.008 (in 3 folds),0.905 +/- 0.019 (in 3 folds),0.736 +/- 0.046 (in 3 folds),0.905,0.719,168.0,0.0,168.0,0.0,False
elasticnet_cv,0.960 +/- 0.040 (in 3 folds),0.960 +/- 0.040 (in 3 folds),0.990 +/- 0.010 (in 3 folds),0.990 +/- 0.010 (in 3 folds),0.815 +/- 0.041 (in 3 folds),0.328 +/- 0.288 (in 3 folds),0.815,0.385,168.0,0.0,168.0,0.0,False
ridge_cv,0.947 +/- 0.052 (in 3 folds),0.947 +/- 0.052 (in 3 folds),0.987 +/- 0.014 (in 3 folds),0.987 +/- 0.014 (in 3 folds),0.774 +/- 0.007 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.774,0.0,168.0,0.0,168.0,0.0,True
rf_multiclass,0.943 +/- 0.049 (in 3 folds),0.943 +/- 0.049 (in 3 folds),0.975 +/- 0.021 (in 3 folds),0.975 +/- 0.021 (in 3 folds),0.911 +/- 0.030 (in 3 folds),0.756 +/- 0.076 (in 3 folds),0.911,0.735,168.0,0.0,168.0,0.0,False
dummy_most_frequent,0.500 +/- 0.000 (in 3 folds),0.500 +/- 0.000 (in 3 folds),0.774 +/- 0.007 (in 3 folds),0.774 +/- 0.007 (in 3 folds),0.774 +/- 0.007 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.774,0.0,168.0,0.0,168.0,0.0,True
dummy_stratified,0.411 +/- 0.029 (in 3 folds),0.411 +/- 0.029 (in 3 folds),0.744 +/- 0.017 (in 3 folds),0.744 +/- 0.017 (in 3 folds),0.578 +/- 0.023 (in 3 folds),-0.174 +/- 0.060 (in 3 folds),0.577,-0.175,168.0,0.0,168.0,0.0,False
"All results, sorted",,,,,,,,,,,,,

Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
linearsvm_ovr,0.964 +/- 0.039 (in 3 folds),0.964 +/- 0.039 (in 3 folds),0.991 +/- 0.010 (in 3 folds),0.991 +/- 0.010 (in 3 folds),0.911 +/- 0.063 (in 3 folds),0.791 +/- 0.107 (in 3 folds),0.911,0.772,168,0,168,0.0,False
lasso_multiclass,0.964 +/- 0.039 (in 3 folds),0.964 +/- 0.039 (in 3 folds),0.990 +/- 0.010 (in 3 folds),0.990 +/- 0.010 (in 3 folds),0.923 +/- 0.044 (in 3 folds),0.799 +/- 0.095 (in 3 folds),0.923,0.791,168,0,168,0.0,False
lasso_cv,0.962 +/- 0.040 (in 3 folds),0.962 +/- 0.040 (in 3 folds),0.990 +/- 0.010 (in 3 folds),0.990 +/- 0.010 (in 3 folds),0.815 +/- 0.028 (in 3 folds),0.382 +/- 0.148 (in 3 folds),0.815,0.385,168,0,168,0.0,False
xgboost,0.962 +/- 0.029 (in 3 folds),0.962 +/- 0.029 (in 3 folds),0.987 +/- 0.008 (in 3 folds),0.987 +/- 0.008 (in 3 folds),0.905 +/- 0.019 (in 3 folds),0.736 +/- 0.046 (in 3 folds),0.905,0.719,168,0,168,0.0,False
elasticnet_cv,0.960 +/- 0.040 (in 3 folds),0.960 +/- 0.040 (in 3 folds),0.990 +/- 0.010 (in 3 folds),0.990 +/- 0.010 (in 3 folds),0.815 +/- 0.041 (in 3 folds),0.328 +/- 0.288 (in 3 folds),0.815,0.385,168,0,168,0.0,False
ridge_cv,0.947 +/- 0.052 (in 3 folds),0.947 +/- 0.052 (in 3 folds),0.987 +/- 0.014 (in 3 folds),0.987 +/- 0.014 (in 3 folds),0.774 +/- 0.007 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.774,0.0,168,0,168,0.0,True
rf_multiclass,0.943 +/- 0.049 (in 3 folds),0.943 +/- 0.049 (in 3 folds),0.975 +/- 0.021 (in 3 folds),0.975 +/- 0.021 (in 3 folds),0.911 +/- 0.030 (in 3 folds),0.756 +/- 0.076 (in 3 folds),0.911,0.735,168,0,168,0.0,False
dummy_most_frequent,0.500 +/- 0.000 (in 3 folds),0.500 +/- 0.000 (in 3 folds),0.774 +/- 0.007 (in 3 folds),0.774 +/- 0.007 (in 3 folds),0.774 +/- 0.007 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.774,0.0,168,0,168,0.0,True
dummy_stratified,0.411 +/- 0.029 (in 3 folds),0.411 +/- 0.029 (in 3 folds),0.744 +/- 0.017 (in 3 folds),0.744 +/- 0.017 (in 3 folds),0.578 +/- 0.023 (in 3 folds),-0.174 +/- 0.060 (in 3 folds),0.577,-0.175,168,0,168,0.0,False


linearsvm_ovr,lasso_multiclass,lasso_cv,xgboost
Per-fold scores: ROC-AUC (weighted OvO): 0.964 +/- 0.039 (in 3 folds) ROC-AUC (macro OvO): 0.964 +/- 0.039 (in 3 folds) au-PRC (weighted OvO): 0.991 +/- 0.010 (in 3 folds) au-PRC (macro OvO): 0.991 +/- 0.010 (in 3 folds) Accuracy: 0.911 +/- 0.063 (in 3 folds) MCC: 0.791 +/- 0.107 (in 3 folds) Global scores: Accuracy: 0.911 MCC: 0.772 Global classification report:  precision recall f1-score support  Covid19 0.74 0.92 0.82 38 Healthy/Background 0.98 0.91 0.94 130  accuracy 0.91 168  macro avg 0.86 0.91 0.88 168  weighted avg 0.92 0.91 0.91 168,Per-fold scores: ROC-AUC (weighted OvO): 0.964 +/- 0.039 (in 3 folds) ROC-AUC (macro OvO): 0.964 +/- 0.039 (in 3 folds) au-PRC (weighted OvO): 0.990 +/- 0.010 (in 3 folds) au-PRC (macro OvO): 0.990 +/- 0.010 (in 3 folds) Accuracy: 0.923 +/- 0.044 (in 3 folds) MCC: 0.799 +/- 0.095 (in 3 folds) Global scores: Accuracy: 0.923 MCC: 0.791 Global classification report:  precision recall f1-score support  Covid19 0.79 0.89 0.84 38 Healthy/Background 0.97 0.93 0.95 130  accuracy 0.92 168  macro avg 0.88 0.91 0.89 168  weighted avg 0.93 0.92 0.92 168,Per-fold scores: ROC-AUC (weighted OvO): 0.962 +/- 0.040 (in 3 folds) ROC-AUC (macro OvO): 0.962 +/- 0.040 (in 3 folds) au-PRC (weighted OvO): 0.990 +/- 0.010 (in 3 folds) au-PRC (macro OvO): 0.990 +/- 0.010 (in 3 folds) Accuracy: 0.815 +/- 0.028 (in 3 folds) MCC: 0.382 +/- 0.148 (in 3 folds) Global scores: Accuracy: 0.815 MCC: 0.385 Global classification report:  precision recall f1-score support  Covid19 0.71 0.32 0.44 38 Healthy/Background 0.83 0.96 0.89 130  accuracy 0.82 168  macro avg 0.77 0.64 0.66 168  weighted avg 0.80 0.82 0.79 168,Per-fold scores: ROC-AUC (weighted OvO): 0.962 +/- 0.029 (in 3 folds) ROC-AUC (macro OvO): 0.962 +/- 0.029 (in 3 folds) au-PRC (weighted OvO): 0.987 +/- 0.008 (in 3 folds) au-PRC (macro OvO): 0.987 +/- 0.008 (in 3 folds) Accuracy: 0.905 +/- 0.019 (in 3 folds) MCC: 0.736 +/- 0.046 (in 3 folds) Global scores: Accuracy: 0.905 MCC: 0.719 Global 
classification report:  precision recall f1-score support  Covid19 0.82 0.74 0.78 38 Healthy/Background 0.93 0.95 0.94 130  accuracy 0.90 168  macro avg 0.87 0.85 0.86 168  weighted avg 0.90 0.90 0.90 168
,,,


elasticnet_cv,ridge_cv,rf_multiclass,dummy_most_frequent
Per-fold scores: ROC-AUC (weighted OvO): 0.960 +/- 0.040 (in 3 folds) ROC-AUC (macro OvO): 0.960 +/- 0.040 (in 3 folds) au-PRC (weighted OvO): 0.990 +/- 0.010 (in 3 folds) au-PRC (macro OvO): 0.990 +/- 0.010 (in 3 folds) Accuracy: 0.815 +/- 0.041 (in 3 folds) MCC: 0.328 +/- 0.288 (in 3 folds) Global scores: Accuracy: 0.815 MCC: 0.385 Global classification report:  precision recall f1-score support  Covid19 0.71 0.32 0.44 38 Healthy/Background 0.83 0.96 0.89 130  accuracy 0.82 168  macro avg 0.77 0.64 0.66 168  weighted avg 0.80 0.82 0.79 168,Per-fold scores: ROC-AUC (weighted OvO): 0.947 +/- 0.052 (in 3 folds) ROC-AUC (macro OvO): 0.947 +/- 0.052 (in 3 folds) au-PRC (weighted OvO): 0.987 +/- 0.014 (in 3 folds) au-PRC (macro OvO): 0.987 +/- 0.014 (in 3 folds) Accuracy: 0.774 +/- 0.007 (in 3 folds) MCC: 0.000 +/- 0.000 (in 3 folds) Global scores: Accuracy: 0.774 MCC: 0.000 Global classification report:  precision recall f1-score support  Covid19 0.00 0.00 0.00 38 Healthy/Background 0.77 1.00 0.87 130  accuracy 0.77 168  macro avg 0.39 0.50 0.44 168  weighted avg 0.60 0.77 0.68 168,Per-fold scores: ROC-AUC (weighted OvO): 0.943 +/- 0.049 (in 3 folds) ROC-AUC (macro OvO): 0.943 +/- 0.049 (in 3 folds) au-PRC (weighted OvO): 0.975 +/- 0.021 (in 3 folds) au-PRC (macro OvO): 0.975 +/- 0.021 (in 3 folds) Accuracy: 0.911 +/- 0.030 (in 3 folds) MCC: 0.756 +/- 0.076 (in 3 folds) Global scores: Accuracy: 0.911 MCC: 0.735 Global classification report:  precision recall f1-score support  Covid19 0.85 0.74 0.79 38 Healthy/Background 0.93 0.96 0.94 130  accuracy 0.91 168  macro avg 0.89 0.85 0.87 168  weighted avg 0.91 0.91 0.91 168,Per-fold scores: ROC-AUC (weighted OvO): 0.500 +/- 0.000 (in 3 folds) ROC-AUC (macro OvO): 0.500 +/- 0.000 (in 3 folds) au-PRC (weighted OvO): 0.774 +/- 0.007 (in 3 folds) au-PRC (macro OvO): 0.774 +/- 0.007 (in 3 folds) Accuracy: 0.774 +/- 0.007 (in 3 folds) MCC: 0.000 +/- 0.000 (in 3 folds) Global scores: Accuracy: 0.774 MCC: 0.000 Global 
classification report:  precision recall f1-score support  Covid19 0.00 0.00 0.00 38 Healthy/Background 0.77 1.00 0.87 130  accuracy 0.77 168  macro avg 0.39 0.50 0.44 168  weighted avg 0.60 0.77 0.68 168
,,,


dummy_stratified
Per-fold scores: ROC-AUC (weighted OvO): 0.411 +/- 0.029 (in 3 folds) ROC-AUC (macro OvO): 0.411 +/- 0.029 (in 3 folds) au-PRC (weighted OvO): 0.744 +/- 0.017 (in 3 folds) au-PRC (macro OvO): 0.744 +/- 0.017 (in 3 folds) Accuracy: 0.578 +/- 0.023 (in 3 folds) MCC: -0.174 +/- 0.060 (in 3 folds) Global scores: Accuracy: 0.577 MCC: -0.175 Global classification report:  precision recall f1-score support  Covid19 0.10 0.11 0.10 38 Healthy/Background 0.73 0.72 0.72 130  accuracy 0.58 168  macro avg 0.41 0.41 0.41 168  weighted avg 0.59 0.58 0.58 168


## Apply train-smaller model -- Test set performance - With and without tuning on validation set

Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,Global evaluation column name global,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
lasso_multiclass,0.955 +/- 0.002 (in 3 folds),0.955 +/- 0.002 (in 3 folds),0.987 +/- 0.001 (in 3 folds),0.987 +/- 0.001 (in 3 folds),0.893 +/- 0.013 (in 3 folds),0.729 +/- 0.048 (in 3 folds),0.893,0.726,disease.separate_past_exposures,252.0,0.0,252.0,0.0,False
lasso_multiclass.decision_thresholds_tuned,0.955 +/- 0.002 (in 3 folds),0.955 +/- 0.002 (in 3 folds),0.987 +/- 0.001 (in 3 folds),0.987 +/- 0.001 (in 3 folds),0.897 +/- 0.008 (in 3 folds),0.759 +/- 0.009 (in 3 folds),0.897,0.755,disease.separate_past_exposures,252.0,0.0,252.0,0.0,False
linearsvm_ovr,0.955 +/- 0.001 (in 3 folds),0.955 +/- 0.001 (in 3 folds),0.988 +/- 0.001 (in 3 folds),0.988 +/- 0.001 (in 3 folds),0.881 +/- 0.025 (in 3 folds),0.720 +/- 0.025 (in 3 folds),0.881,0.715,disease.separate_past_exposures,252.0,0.0,252.0,0.0,False
linearsvm_ovr.decision_thresholds_tuned,0.955 +/- 0.001 (in 3 folds),0.955 +/- 0.001 (in 3 folds),0.988 +/- 0.001 (in 3 folds),0.988 +/- 0.001 (in 3 folds),0.889 +/- 0.015 (in 3 folds),0.720 +/- 0.031 (in 3 folds),0.889,0.718,disease.separate_past_exposures,252.0,0.0,252.0,0.0,False
xgboost,0.953 +/- 0.009 (in 3 folds),0.953 +/- 0.009 (in 3 folds),0.985 +/- 0.003 (in 3 folds),0.985 +/- 0.003 (in 3 folds),0.889 +/- 0.029 (in 3 folds),0.675 +/- 0.085 (in 3 folds),0.889,0.674,disease.separate_past_exposures,252.0,0.0,252.0,0.0,False
xgboost.decision_thresholds_tuned,0.953 +/- 0.009 (in 3 folds),0.953 +/- 0.009 (in 3 folds),0.985 +/- 0.003 (in 3 folds),0.985 +/- 0.003 (in 3 folds),0.877 +/- 0.017 (in 3 folds),0.671 +/- 0.075 (in 3 folds),0.877,0.669,disease.separate_past_exposures,252.0,0.0,252.0,0.0,False
ridge_cv,0.952 +/- 0.012 (in 3 folds),0.952 +/- 0.012 (in 3 folds),0.987 +/- 0.003 (in 3 folds),0.987 +/- 0.003 (in 3 folds),0.770 +/- 0.005 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.77,0.0,disease.separate_past_exposures,252.0,0.0,252.0,0.0,True
ridge_cv.decision_thresholds_tuned,0.952 +/- 0.012 (in 3 folds),0.952 +/- 0.012 (in 3 folds),0.987 +/- 0.003 (in 3 folds),0.987 +/- 0.003 (in 3 folds),0.825 +/- 0.091 (in 3 folds),0.274 +/- 0.475 (in 3 folds),0.825,0.433,disease.separate_past_exposures,252.0,0.0,252.0,0.0,False
lasso_cv,0.951 +/- 0.013 (in 3 folds),0.951 +/- 0.013 (in 3 folds),0.987 +/- 0.003 (in 3 folds),0.987 +/- 0.003 (in 3 folds),0.826 +/- 0.057 (in 3 folds),0.411 +/- 0.244 (in 3 folds),0.825,0.434,disease.separate_past_exposures,252.0,0.0,252.0,0.0,False
lasso_cv.decision_thresholds_tuned,0.951 +/- 0.013 (in 3 folds),0.951 +/- 0.013 (in 3 folds),0.987 +/- 0.003 (in 3 folds),0.987 +/- 0.003 (in 3 folds),0.909 +/- 0.019 (in 3 folds),0.791 +/- 0.030 (in 3 folds),0.909,0.789,disease.separate_past_exposures,252.0,0.0,252.0,0.0,False

Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,Global evaluation column name global,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
lasso_multiclass,0.955 +/- 0.002 (in 3 folds),0.955 +/- 0.002 (in 3 folds),0.987 +/- 0.001 (in 3 folds),0.987 +/- 0.001 (in 3 folds),0.893 +/- 0.013 (in 3 folds),0.729 +/- 0.048 (in 3 folds),0.893,0.726,disease.separate_past_exposures,252,0,252,0.0,False
lasso_multiclass.decision_thresholds_tuned,0.955 +/- 0.002 (in 3 folds),0.955 +/- 0.002 (in 3 folds),0.987 +/- 0.001 (in 3 folds),0.987 +/- 0.001 (in 3 folds),0.897 +/- 0.008 (in 3 folds),0.759 +/- 0.009 (in 3 folds),0.897,0.755,disease.separate_past_exposures,252,0,252,0.0,False
linearsvm_ovr,0.955 +/- 0.001 (in 3 folds),0.955 +/- 0.001 (in 3 folds),0.988 +/- 0.001 (in 3 folds),0.988 +/- 0.001 (in 3 folds),0.881 +/- 0.025 (in 3 folds),0.720 +/- 0.025 (in 3 folds),0.881,0.715,disease.separate_past_exposures,252,0,252,0.0,False
linearsvm_ovr.decision_thresholds_tuned,0.955 +/- 0.001 (in 3 folds),0.955 +/- 0.001 (in 3 folds),0.988 +/- 0.001 (in 3 folds),0.988 +/- 0.001 (in 3 folds),0.889 +/- 0.015 (in 3 folds),0.720 +/- 0.031 (in 3 folds),0.889,0.718,disease.separate_past_exposures,252,0,252,0.0,False
xgboost,0.953 +/- 0.009 (in 3 folds),0.953 +/- 0.009 (in 3 folds),0.985 +/- 0.003 (in 3 folds),0.985 +/- 0.003 (in 3 folds),0.889 +/- 0.029 (in 3 folds),0.675 +/- 0.085 (in 3 folds),0.889,0.674,disease.separate_past_exposures,252,0,252,0.0,False
xgboost.decision_thresholds_tuned,0.953 +/- 0.009 (in 3 folds),0.953 +/- 0.009 (in 3 folds),0.985 +/- 0.003 (in 3 folds),0.985 +/- 0.003 (in 3 folds),0.877 +/- 0.017 (in 3 folds),0.671 +/- 0.075 (in 3 folds),0.877,0.669,disease.separate_past_exposures,252,0,252,0.0,False
ridge_cv,0.952 +/- 0.012 (in 3 folds),0.952 +/- 0.012 (in 3 folds),0.987 +/- 0.003 (in 3 folds),0.987 +/- 0.003 (in 3 folds),0.770 +/- 0.005 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.77,0.0,disease.separate_past_exposures,252,0,252,0.0,True
ridge_cv.decision_thresholds_tuned,0.952 +/- 0.012 (in 3 folds),0.952 +/- 0.012 (in 3 folds),0.987 +/- 0.003 (in 3 folds),0.987 +/- 0.003 (in 3 folds),0.825 +/- 0.091 (in 3 folds),0.274 +/- 0.475 (in 3 folds),0.825,0.433,disease.separate_past_exposures,252,0,252,0.0,False
lasso_cv,0.951 +/- 0.013 (in 3 folds),0.951 +/- 0.013 (in 3 folds),0.987 +/- 0.003 (in 3 folds),0.987 +/- 0.003 (in 3 folds),0.826 +/- 0.057 (in 3 folds),0.411 +/- 0.244 (in 3 folds),0.825,0.434,disease.separate_past_exposures,252,0,252,0.0,False
lasso_cv.decision_thresholds_tuned,0.951 +/- 0.013 (in 3 folds),0.951 +/- 0.013 (in 3 folds),0.987 +/- 0.003 (in 3 folds),0.987 +/- 0.003 (in 3 folds),0.909 +/- 0.019 (in 3 folds),0.791 +/- 0.030 (in 3 folds),0.909,0.789,disease.separate_past_exposures,252,0,252,0.0,False


lasso_multiclass,lasso_multiclass.decision_thresholds_tuned,linearsvm_ovr,linearsvm_ovr.decision_thresholds_tuned
Per-fold scores: ROC-AUC (weighted OvO): 0.955 +/- 0.002 (in 3 folds) ROC-AUC (macro OvO): 0.955 +/- 0.002 (in 3 folds) au-PRC (weighted OvO): 0.987 +/- 0.001 (in 3 folds) au-PRC (macro OvO): 0.987 +/- 0.001 (in 3 folds) Accuracy: 0.893 +/- 0.013 (in 3 folds) MCC: 0.729 +/- 0.048 (in 3 folds) Global scores using column name disease.separate_past_exposures: Accuracy: 0.893 MCC: 0.726 Global evaluation column name: disease.separate_past_exposures Global classification report using column name disease.separate_past_exposures:  precision recall f1-score support  Covid19 0.72 0.88 0.79 58 Healthy/Background 0.96 0.90 0.93 194  accuracy 0.89 252  macro avg 0.84 0.89 0.86 252  weighted avg 0.91 0.89 0.90 252,Per-fold scores: ROC-AUC (weighted OvO): 0.955 +/- 0.002 (in 3 folds) ROC-AUC (macro OvO): 0.955 +/- 0.002 (in 3 folds) au-PRC (weighted OvO): 0.987 +/- 0.001 (in 3 folds) au-PRC (macro OvO): 0.987 +/- 0.001 (in 3 folds) Accuracy: 0.897 +/- 0.008 (in 3 folds) MCC: 0.759 +/- 0.009 (in 3 folds) Global scores using column name disease.separate_past_exposures: Accuracy: 0.897 MCC: 0.755 Global evaluation column name: disease.separate_past_exposures Global classification report using column name disease.separate_past_exposures:  precision recall f1-score support  Covid19 0.71 0.95 0.81 58 Healthy/Background 0.98 0.88 0.93 194  accuracy 0.90 252  macro avg 0.84 0.91 0.87 252  weighted avg 0.92 0.90 0.90 252,Per-fold scores: ROC-AUC (weighted OvO): 0.955 +/- 0.001 (in 3 folds) ROC-AUC (macro OvO): 0.955 +/- 0.001 (in 3 folds) au-PRC (weighted OvO): 0.988 +/- 0.001 (in 3 folds) au-PRC (macro OvO): 0.988 +/- 0.001 (in 3 folds) Accuracy: 0.881 +/- 0.025 (in 3 folds) MCC: 0.720 +/- 0.025 (in 3 folds) Global scores using column name disease.separate_past_exposures: Accuracy: 0.881 MCC: 0.715 Global evaluation column name: disease.separate_past_exposures Global classification report using column name disease.separate_past_exposures:  precision recall f1-score support  Covid19 0.68 
0.91 0.78 58 Healthy/Background 0.97 0.87 0.92 194  accuracy 0.88 252  macro avg 0.83 0.89 0.85 252  weighted avg 0.90 0.88 0.89 252,Per-fold scores: ROC-AUC (weighted OvO): 0.955 +/- 0.001 (in 3 folds) ROC-AUC (macro OvO): 0.955 +/- 0.001 (in 3 folds) au-PRC (weighted OvO): 0.988 +/- 0.001 (in 3 folds) au-PRC (macro OvO): 0.988 +/- 0.001 (in 3 folds) Accuracy: 0.889 +/- 0.015 (in 3 folds) MCC: 0.720 +/- 0.031 (in 3 folds) Global scores using column name disease.separate_past_exposures: Accuracy: 0.889 MCC: 0.718 Global evaluation column name: disease.separate_past_exposures Global classification report using column name disease.separate_past_exposures:  precision recall f1-score support  Covid19 0.71 0.88 0.78 58 Healthy/Background 0.96 0.89 0.93 194  accuracy 0.89 252  macro avg 0.83 0.89 0.85 252  weighted avg 0.90 0.89 0.89 252
,,,


xgboost,xgboost.decision_thresholds_tuned,ridge_cv,ridge_cv.decision_thresholds_tuned
Per-fold scores: ROC-AUC (weighted OvO): 0.953 +/- 0.009 (in 3 folds) ROC-AUC (macro OvO): 0.953 +/- 0.009 (in 3 folds) au-PRC (weighted OvO): 0.985 +/- 0.003 (in 3 folds) au-PRC (macro OvO): 0.985 +/- 0.003 (in 3 folds) Accuracy: 0.889 +/- 0.029 (in 3 folds) MCC: 0.675 +/- 0.085 (in 3 folds) Global scores using column name disease.separate_past_exposures: Accuracy: 0.889 MCC: 0.674 Global evaluation column name: disease.separate_past_exposures Global classification report using column name disease.separate_past_exposures:  precision recall f1-score support  Covid19 0.80 0.69 0.74 58 Healthy/Background 0.91 0.95 0.93 194  accuracy 0.89 252  macro avg 0.86 0.82 0.84 252  weighted avg 0.89 0.89 0.89 252,Per-fold scores: ROC-AUC (weighted OvO): 0.953 +/- 0.009 (in 3 folds) ROC-AUC (macro OvO): 0.953 +/- 0.009 (in 3 folds) au-PRC (weighted OvO): 0.985 +/- 0.003 (in 3 folds) au-PRC (macro OvO): 0.985 +/- 0.003 (in 3 folds) Accuracy: 0.877 +/- 0.017 (in 3 folds) MCC: 0.671 +/- 0.075 (in 3 folds) Global scores using column name disease.separate_past_exposures: Accuracy: 0.877 MCC: 0.669 Global evaluation column name: disease.separate_past_exposures Global classification report using column name disease.separate_past_exposures:  precision recall f1-score support  Covid19 0.71 0.79 0.75 58 Healthy/Background 0.94 0.90 0.92 194  accuracy 0.88 252  macro avg 0.82 0.85 0.83 252  weighted avg 0.88 0.88 0.88 252,Per-fold scores: ROC-AUC (weighted OvO): 0.952 +/- 0.012 (in 3 folds) ROC-AUC (macro OvO): 0.952 +/- 0.012 (in 3 folds) au-PRC (weighted OvO): 0.987 +/- 0.003 (in 3 folds) au-PRC (macro OvO): 0.987 +/- 0.003 (in 3 folds) Accuracy: 0.770 +/- 0.005 (in 3 folds) MCC: 0.000 +/- 0.000 (in 3 folds) Global scores using column name disease.separate_past_exposures: Accuracy: 0.770 MCC: 0.000 Global evaluation column name: disease.separate_past_exposures Global classification report using column name disease.separate_past_exposures:  precision recall f1-score support  Covid19 0.00 
0.00 0.00 58 Healthy/Background 0.77 1.00 0.87 194  accuracy 0.77 252  macro avg 0.38 0.50 0.43 252  weighted avg 0.59 0.77 0.67 252,Per-fold scores: ROC-AUC (weighted OvO): 0.952 +/- 0.012 (in 3 folds) ROC-AUC (macro OvO): 0.952 +/- 0.012 (in 3 folds) au-PRC (weighted OvO): 0.987 +/- 0.003 (in 3 folds) au-PRC (macro OvO): 0.987 +/- 0.003 (in 3 folds) Accuracy: 0.825 +/- 0.091 (in 3 folds) MCC: 0.274 +/- 0.475 (in 3 folds) Global scores using column name disease.separate_past_exposures: Accuracy: 0.825 MCC: 0.433 Global evaluation column name: disease.separate_past_exposures Global classification report using column name disease.separate_past_exposures:  precision recall f1-score support  Covid19 0.79 0.33 0.46 58 Healthy/Background 0.83 0.97 0.90 194  accuracy 0.83 252  macro avg 0.81 0.65 0.68 252  weighted avg 0.82 0.83 0.80 252
,,,


lasso_cv,lasso_cv.decision_thresholds_tuned,elasticnet_cv,elasticnet_cv.decision_thresholds_tuned
Per-fold scores: ROC-AUC (weighted OvO): 0.951 +/- 0.013 (in 3 folds) ROC-AUC (macro OvO): 0.951 +/- 0.013 (in 3 folds) au-PRC (weighted OvO): 0.987 +/- 0.003 (in 3 folds) au-PRC (macro OvO): 0.987 +/- 0.003 (in 3 folds) Accuracy: 0.826 +/- 0.057 (in 3 folds) MCC: 0.411 +/- 0.244 (in 3 folds) Global scores using column name disease.separate_past_exposures: Accuracy: 0.825 MCC: 0.434 Global evaluation column name: disease.separate_past_exposures Global classification report using column name disease.separate_past_exposures:  precision recall f1-score support  Covid19 0.77 0.34 0.48 58 Healthy/Background 0.83 0.97 0.90 194  accuracy 0.83 252  macro avg 0.80 0.66 0.69 252  weighted avg 0.82 0.83 0.80 252,Per-fold scores: ROC-AUC (weighted OvO): 0.951 +/- 0.013 (in 3 folds) ROC-AUC (macro OvO): 0.951 +/- 0.013 (in 3 folds) au-PRC (weighted OvO): 0.987 +/- 0.003 (in 3 folds) au-PRC (macro OvO): 0.987 +/- 0.003 (in 3 folds) Accuracy: 0.909 +/- 0.019 (in 3 folds) MCC: 0.791 +/- 0.030 (in 3 folds) Global scores using column name disease.separate_past_exposures: Accuracy: 0.909 MCC: 0.789 Global evaluation column name: disease.separate_past_exposures Global classification report using column name disease.separate_past_exposures:  precision recall f1-score support  Covid19 0.72 0.98 0.83 58 Healthy/Background 0.99 0.89 0.94 194  accuracy 0.91 252  macro avg 0.86 0.93 0.88 252  weighted avg 0.93 0.91 0.91 252,Per-fold scores: ROC-AUC (weighted OvO): 0.951 +/- 0.011 (in 3 folds) ROC-AUC (macro OvO): 0.951 +/- 0.011 (in 3 folds) au-PRC (weighted OvO): 0.987 +/- 0.002 (in 3 folds) au-PRC (macro OvO): 0.987 +/- 0.002 (in 3 folds) Accuracy: 0.822 +/- 0.062 (in 3 folds) MCC: 0.343 +/- 0.339 (in 3 folds) Global scores using column name disease.separate_past_exposures: Accuracy: 0.821 MCC: 0.418 Global evaluation column name: disease.separate_past_exposures Global classification report using column name disease.separate_past_exposures:  precision recall f1-score support  Covid19 0.76 
0.33 0.46 58 Healthy/Background 0.83 0.97 0.89 194  accuracy 0.82 252  macro avg 0.79 0.65 0.68 252  weighted avg 0.81 0.82 0.79 252,Per-fold scores: ROC-AUC (weighted OvO): 0.951 +/- 0.011 (in 3 folds) ROC-AUC (macro OvO): 0.951 +/- 0.011 (in 3 folds) au-PRC (weighted OvO): 0.987 +/- 0.002 (in 3 folds) au-PRC (macro OvO): 0.987 +/- 0.002 (in 3 folds) Accuracy: 0.909 +/- 0.019 (in 3 folds) MCC: 0.791 +/- 0.030 (in 3 folds) Global scores using column name disease.separate_past_exposures: Accuracy: 0.909 MCC: 0.789 Global evaluation column name: disease.separate_past_exposures Global classification report using column name disease.separate_past_exposures:  precision recall f1-score support  Covid19 0.72 0.98 0.83 58 Healthy/Background 0.99 0.89 0.94 194  accuracy 0.91 252  macro avg 0.86 0.93 0.88 252  weighted avg 0.93 0.91 0.91 252
,,,


rf_multiclass,rf_multiclass.decision_thresholds_tuned
Per-fold scores: ROC-AUC (weighted OvO): 0.933 +/- 0.045 (in 3 folds) ROC-AUC (macro OvO): 0.933 +/- 0.045 (in 3 folds) au-PRC (weighted OvO): 0.973 +/- 0.026 (in 3 folds) au-PRC (macro OvO): 0.973 +/- 0.026 (in 3 folds) Accuracy: 0.869 +/- 0.021 (in 3 folds) MCC: 0.623 +/- 0.050 (in 3 folds) Global scores using column name disease.separate_past_exposures: Accuracy: 0.869 MCC: 0.620 Global evaluation column name: disease.separate_past_exposures Global classification report using column name disease.separate_past_exposures:  precision recall f1-score support  Covid19 0.74 0.67 0.70 58 Healthy/Background 0.90 0.93 0.92 194  accuracy 0.87 252  macro avg 0.82 0.80 0.81 252  weighted avg 0.87 0.87 0.87 252,Per-fold scores: ROC-AUC (weighted OvO): 0.933 +/- 0.045 (in 3 folds) ROC-AUC (macro OvO): 0.933 +/- 0.045 (in 3 folds) au-PRC (weighted OvO): 0.973 +/- 0.026 (in 3 folds) au-PRC (macro OvO): 0.973 +/- 0.026 (in 3 folds) Accuracy: 0.881 +/- 0.025 (in 3 folds) MCC: 0.694 +/- 0.083 (in 3 folds) Global scores using column name disease.separate_past_exposures: Accuracy: 0.881 MCC: 0.692 Global evaluation column name: disease.separate_past_exposures Global classification report using column name disease.separate_past_exposures:  precision recall f1-score support  Covid19 0.70 0.84 0.77 58 Healthy/Background 0.95 0.89 0.92 194  accuracy 0.88 252  macro avg 0.83 0.87 0.84 252  weighted avg 0.89 0.88 0.88 252
,


---

# GeneLocus.TCR, TargetObsColumnEnum.hiv_vs_healthy trained on train_smaller set

## Specimen predictions on validation set

Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
linearsvm_ovr,0.881 +/- 0.023 (in 3 folds),0.881 +/- 0.023 (in 3 folds),0.942 +/- 0.009 (in 3 folds),0.942 +/- 0.009 (in 3 folds),0.783 +/- 0.017 (in 3 folds),0.529 +/- 0.028 (in 3 folds),0.784,0.5,194.0,0.0,194.0,0.0,False
lasso_multiclass,0.873 +/- 0.023 (in 3 folds),0.873 +/- 0.023 (in 3 folds),0.939 +/- 0.007 (in 3 folds),0.939 +/- 0.007 (in 3 folds),0.768 +/- 0.017 (in 3 folds),0.511 +/- 0.015 (in 3 folds),0.768,0.506,194.0,0.0,194.0,0.0,False
lasso_cv,0.857 +/- 0.011 (in 3 folds),0.857 +/- 0.011 (in 3 folds),0.934 +/- 0.004 (in 3 folds),0.934 +/- 0.004 (in 3 folds),0.773 +/- 0.017 (in 3 folds),0.465 +/- 0.061 (in 3 folds),0.773,0.462,194.0,0.0,194.0,0.0,False
elasticnet_cv,0.854 +/- 0.012 (in 3 folds),0.854 +/- 0.012 (in 3 folds),0.933 +/- 0.005 (in 3 folds),0.933 +/- 0.005 (in 3 folds),0.768 +/- 0.016 (in 3 folds),0.451 +/- 0.051 (in 3 folds),0.768,0.448,194.0,0.0,194.0,0.0,False
ridge_cv,0.853 +/- 0.045 (in 3 folds),0.853 +/- 0.045 (in 3 folds),0.930 +/- 0.016 (in 3 folds),0.930 +/- 0.016 (in 3 folds),0.696 +/- 0.047 (in 3 folds),0.132 +/- 0.228 (in 3 folds),0.696,0.217,194.0,0.0,194.0,0.0,False
xgboost,0.853 +/- 0.013 (in 3 folds),0.853 +/- 0.013 (in 3 folds),0.924 +/- 0.008 (in 3 folds),0.924 +/- 0.008 (in 3 folds),0.778 +/- 0.022 (in 3 folds),0.500 +/- 0.071 (in 3 folds),0.778,0.497,194.0,0.0,194.0,0.0,False
rf_multiclass,0.839 +/- 0.004 (in 3 folds),0.839 +/- 0.004 (in 3 folds),0.904 +/- 0.011 (in 3 folds),0.904 +/- 0.011 (in 3 folds),0.778 +/- 0.016 (in 3 folds),0.523 +/- 0.076 (in 3 folds),0.778,0.519,194.0,0.0,194.0,0.0,False
dummy_most_frequent,0.500 +/- 0.000 (in 3 folds),0.500 +/- 0.000 (in 3 folds),0.670 +/- 0.008 (in 3 folds),0.670 +/- 0.008 (in 3 folds),0.670 +/- 0.008 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.67,0.0,194.0,0.0,194.0,0.0,True
dummy_stratified,0.467 +/- 0.016 (in 3 folds),0.467 +/- 0.016 (in 3 folds),0.656 +/- 0.003 (in 3 folds),0.656 +/- 0.003 (in 3 folds),0.541 +/- 0.012 (in 3 folds),-0.068 +/- 0.032 (in 3 folds),0.541,-0.067,194.0,0.0,194.0,0.0,False
"All results, sorted",,,,,,,,,,,,,

Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
linearsvm_ovr,0.881 +/- 0.023 (in 3 folds),0.881 +/- 0.023 (in 3 folds),0.942 +/- 0.009 (in 3 folds),0.942 +/- 0.009 (in 3 folds),0.783 +/- 0.017 (in 3 folds),0.529 +/- 0.028 (in 3 folds),0.784,0.5,194,0,194,0.0,False
lasso_multiclass,0.873 +/- 0.023 (in 3 folds),0.873 +/- 0.023 (in 3 folds),0.939 +/- 0.007 (in 3 folds),0.939 +/- 0.007 (in 3 folds),0.768 +/- 0.017 (in 3 folds),0.511 +/- 0.015 (in 3 folds),0.768,0.506,194,0,194,0.0,False
lasso_cv,0.857 +/- 0.011 (in 3 folds),0.857 +/- 0.011 (in 3 folds),0.934 +/- 0.004 (in 3 folds),0.934 +/- 0.004 (in 3 folds),0.773 +/- 0.017 (in 3 folds),0.465 +/- 0.061 (in 3 folds),0.773,0.462,194,0,194,0.0,False
elasticnet_cv,0.854 +/- 0.012 (in 3 folds),0.854 +/- 0.012 (in 3 folds),0.933 +/- 0.005 (in 3 folds),0.933 +/- 0.005 (in 3 folds),0.768 +/- 0.016 (in 3 folds),0.451 +/- 0.051 (in 3 folds),0.768,0.448,194,0,194,0.0,False
ridge_cv,0.853 +/- 0.045 (in 3 folds),0.853 +/- 0.045 (in 3 folds),0.930 +/- 0.016 (in 3 folds),0.930 +/- 0.016 (in 3 folds),0.696 +/- 0.047 (in 3 folds),0.132 +/- 0.228 (in 3 folds),0.696,0.217,194,0,194,0.0,False
xgboost,0.853 +/- 0.013 (in 3 folds),0.853 +/- 0.013 (in 3 folds),0.924 +/- 0.008 (in 3 folds),0.924 +/- 0.008 (in 3 folds),0.778 +/- 0.022 (in 3 folds),0.500 +/- 0.071 (in 3 folds),0.778,0.497,194,0,194,0.0,False
rf_multiclass,0.839 +/- 0.004 (in 3 folds),0.839 +/- 0.004 (in 3 folds),0.904 +/- 0.011 (in 3 folds),0.904 +/- 0.011 (in 3 folds),0.778 +/- 0.016 (in 3 folds),0.523 +/- 0.076 (in 3 folds),0.778,0.519,194,0,194,0.0,False
dummy_most_frequent,0.500 +/- 0.000 (in 3 folds),0.500 +/- 0.000 (in 3 folds),0.670 +/- 0.008 (in 3 folds),0.670 +/- 0.008 (in 3 folds),0.670 +/- 0.008 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.67,0.0,194,0,194,0.0,True
dummy_stratified,0.467 +/- 0.016 (in 3 folds),0.467 +/- 0.016 (in 3 folds),0.656 +/- 0.003 (in 3 folds),0.656 +/- 0.003 (in 3 folds),0.541 +/- 0.012 (in 3 folds),-0.068 +/- 0.032 (in 3 folds),0.541,-0.067,194,0,194,0.0,False


linearsvm_ovr,lasso_multiclass,lasso_cv,elasticnet_cv
Per-fold scores: ROC-AUC (weighted OvO): 0.881 +/- 0.023 (in 3 folds) ROC-AUC (macro OvO): 0.881 +/- 0.023 (in 3 folds) au-PRC (weighted OvO): 0.942 +/- 0.009 (in 3 folds) au-PRC (macro OvO): 0.942 +/- 0.009 (in 3 folds) Accuracy: 0.783 +/- 0.017 (in 3 folds) MCC: 0.529 +/- 0.028 (in 3 folds) Global scores: Accuracy: 0.784 MCC: 0.500 Global classification report:  precision recall f1-score support  HIV 0.69 0.62 0.66 64 Healthy/Background 0.82 0.86 0.84 130  accuracy 0.78 194  macro avg 0.76 0.74 0.75 194  weighted avg 0.78 0.78 0.78 194,Per-fold scores: ROC-AUC (weighted OvO): 0.873 +/- 0.023 (in 3 folds) ROC-AUC (macro OvO): 0.873 +/- 0.023 (in 3 folds) au-PRC (weighted OvO): 0.939 +/- 0.007 (in 3 folds) au-PRC (macro OvO): 0.939 +/- 0.007 (in 3 folds) Accuracy: 0.768 +/- 0.017 (in 3 folds) MCC: 0.511 +/- 0.015 (in 3 folds) Global scores: Accuracy: 0.768 MCC: 0.506 Global classification report:  precision recall f1-score support  HIV 0.62 0.75 0.68 64 Healthy/Background 0.86 0.78 0.82 130  accuracy 0.77 194  macro avg 0.74 0.76 0.75 194  weighted avg 0.78 0.77 0.77 194,Per-fold scores: ROC-AUC (weighted OvO): 0.857 +/- 0.011 (in 3 folds) ROC-AUC (macro OvO): 0.857 +/- 0.011 (in 3 folds) au-PRC (weighted OvO): 0.934 +/- 0.004 (in 3 folds) au-PRC (macro OvO): 0.934 +/- 0.004 (in 3 folds) Accuracy: 0.773 +/- 0.017 (in 3 folds) MCC: 0.465 +/- 0.061 (in 3 folds) Global scores: Accuracy: 0.773 MCC: 0.462 Global classification report:  precision recall f1-score support  HIV 0.71 0.53 0.61 64 Healthy/Background 0.79 0.89 0.84 130  accuracy 0.77 194  macro avg 0.75 0.71 0.72 194  weighted avg 0.77 0.77 0.76 194,Per-fold scores: ROC-AUC (weighted OvO): 0.854 +/- 0.012 (in 3 folds) ROC-AUC (macro OvO): 0.854 +/- 0.012 (in 3 folds) au-PRC (weighted OvO): 0.933 +/- 0.005 (in 3 folds) au-PRC (macro OvO): 0.933 +/- 0.005 (in 3 folds) Accuracy: 0.768 +/- 0.016 (in 3 folds) MCC: 0.451 +/- 0.051 (in 3 folds) Global scores: Accuracy: 0.768 MCC: 0.448 Global classification report:  
precision recall f1-score support  HIV 0.70 0.52 0.59 64 Healthy/Background 0.79 0.89 0.84 130  accuracy 0.77 194  macro avg 0.75 0.70 0.72 194  weighted avg 0.76 0.77 0.76 194
,,,


ridge_cv,xgboost,rf_multiclass,dummy_most_frequent
Per-fold scores: ROC-AUC (weighted OvO): 0.853 +/- 0.045 (in 3 folds) ROC-AUC (macro OvO): 0.853 +/- 0.045 (in 3 folds) au-PRC (weighted OvO): 0.930 +/- 0.016 (in 3 folds) au-PRC (macro OvO): 0.930 +/- 0.016 (in 3 folds) Accuracy: 0.696 +/- 0.047 (in 3 folds) MCC: 0.132 +/- 0.228 (in 3 folds) Global scores: Accuracy: 0.696 MCC: 0.217 Global classification report:  precision recall f1-score support  HIV 0.86 0.09 0.17 64 Healthy/Background 0.69 0.99 0.81 130  accuracy 0.70 194  macro avg 0.77 0.54 0.49 194  weighted avg 0.75 0.70 0.60 194,Per-fold scores: ROC-AUC (weighted OvO): 0.853 +/- 0.013 (in 3 folds) ROC-AUC (macro OvO): 0.853 +/- 0.013 (in 3 folds) au-PRC (weighted OvO): 0.924 +/- 0.008 (in 3 folds) au-PRC (macro OvO): 0.924 +/- 0.008 (in 3 folds) Accuracy: 0.778 +/- 0.022 (in 3 folds) MCC: 0.500 +/- 0.071 (in 3 folds) Global scores: Accuracy: 0.778 MCC: 0.497 Global classification report:  precision recall f1-score support  HIV 0.67 0.66 0.66 64 Healthy/Background 0.83 0.84 0.84 130  accuracy 0.78 194  macro avg 0.75 0.75 0.75 194  weighted avg 0.78 0.78 0.78 194,Per-fold scores: ROC-AUC (weighted OvO): 0.839 +/- 0.004 (in 3 folds) ROC-AUC (macro OvO): 0.839 +/- 0.004 (in 3 folds) au-PRC (weighted OvO): 0.904 +/- 0.011 (in 3 folds) au-PRC (macro OvO): 0.904 +/- 0.011 (in 3 folds) Accuracy: 0.778 +/- 0.016 (in 3 folds) MCC: 0.523 +/- 0.076 (in 3 folds) Global scores: Accuracy: 0.778 MCC: 0.519 Global classification report:  precision recall f1-score support  HIV 0.64 0.73 0.69 64 Healthy/Background 0.86 0.80 0.83 130  accuracy 0.78 194  macro avg 0.75 0.77 0.76 194  weighted avg 0.79 0.78 0.78 194,Per-fold scores: ROC-AUC (weighted OvO): 0.500 +/- 0.000 (in 3 folds) ROC-AUC (macro OvO): 0.500 +/- 0.000 (in 3 folds) au-PRC (weighted OvO): 0.670 +/- 0.008 (in 3 folds) au-PRC (macro OvO): 0.670 +/- 0.008 (in 3 folds) Accuracy: 0.670 +/- 0.008 (in 3 folds) MCC: 0.000 +/- 0.000 (in 3 folds) Global scores: Accuracy: 0.670 MCC: 0.000 Global classification report:  
precision recall f1-score support  HIV 0.00 0.00 0.00 64 Healthy/Background 0.67 1.00 0.80 130  accuracy 0.67 194  macro avg 0.34 0.50 0.40 194  weighted avg 0.45 0.67 0.54 194
,,,


dummy_stratified
Per-fold scores: ROC-AUC (weighted OvO): 0.467 +/- 0.016 (in 3 folds) ROC-AUC (macro OvO): 0.467 +/- 0.016 (in 3 folds) au-PRC (weighted OvO): 0.656 +/- 0.003 (in 3 folds) au-PRC (macro OvO): 0.656 +/- 0.003 (in 3 folds) Accuracy: 0.541 +/- 0.012 (in 3 folds) MCC: -0.068 +/- 0.032 (in 3 folds) Global scores: Accuracy: 0.541 MCC: -0.067 Global classification report:  precision recall f1-score support  HIV 0.28 0.25 0.26 64 Healthy/Background 0.65 0.68 0.67 130  accuracy 0.54 194  macro avg 0.47 0.47 0.47 194  weighted avg 0.53 0.54 0.53 194


## Apply train-smaller model -- Test set performance - With and without tuning on validation set

Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,Global evaluation column name global,Accuracy per fold with abstention,MCC per fold with abstention,Unknown/abstention proportion per fold with abstention,ROC-AUC (weighted OvO) per fold with abstention,ROC-AUC (macro OvO) per fold with abstention,au-PRC (weighted OvO) per fold with abstention,au-PRC (macro OvO) per fold with abstention,Accuracy global with abstention,MCC global with abstention,Unknown/abstention proportion global with abstention,Abstention label global with abstention,Global evaluation column name global with abstention,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
linearsvm_ovr,0.894 +/- 0.048 (in 3 folds),0.894 +/- 0.048 (in 3 folds),0.953 +/- 0.021 (in 3 folds),0.953 +/- 0.021 (in 3 folds),0.780 +/- 0.017 (in 3 folds),0.518 +/- 0.070 (in 3 folds),0.78,0.488,disease.separate_past_exposures,0.777 +/- 0.015 (in 3 folds),0.513 +/- 0.063 (in 3 folds),0.010 +/- 0.000 (in 1 folds),0.915 +/- 0.046 (in 2 folds),0.915 +/- 0.046 (in 2 folds),0.962 +/- 0.019 (in 2 folds),0.962 +/- 0.019 (in 2 folds),0.777,0.485,0.003,Unknown,disease.separate_past_exposures,291.0,1.0,292.0,0.003425,False
linearsvm_ovr.decision_thresholds_tuned,0.894 +/- 0.048 (in 3 folds),0.894 +/- 0.048 (in 3 folds),0.953 +/- 0.021 (in 3 folds),0.953 +/- 0.021 (in 3 folds),0.787 +/- 0.071 (in 3 folds),0.611 +/- 0.067 (in 3 folds),0.787,0.585,disease.separate_past_exposures,0.785 +/- 0.072 (in 3 folds),0.606 +/- 0.071 (in 3 folds),0.010 +/- 0.000 (in 1 folds),0.915 +/- 0.046 (in 2 folds),0.915 +/- 0.046 (in 2 folds),0.962 +/- 0.019 (in 2 folds),0.962 +/- 0.019 (in 2 folds),0.784,0.58,0.003,Unknown,disease.separate_past_exposures,291.0,1.0,292.0,0.003425,False
lasso_cv,0.890 +/- 0.031 (in 3 folds),0.890 +/- 0.031 (in 3 folds),0.950 +/- 0.014 (in 3 folds),0.950 +/- 0.014 (in 3 folds),0.774 +/- 0.039 (in 3 folds),0.468 +/- 0.102 (in 3 folds),0.774,0.466,disease.separate_past_exposures,,,,,,,,,,,,,292.0,0.0,292.0,0.0,False
lasso_cv.decision_thresholds_tuned,0.890 +/- 0.031 (in 3 folds),0.890 +/- 0.031 (in 3 folds),0.950 +/- 0.014 (in 3 folds),0.950 +/- 0.014 (in 3 folds),0.785 +/- 0.091 (in 3 folds),0.591 +/- 0.121 (in 3 folds),0.784,0.565,disease.separate_past_exposures,,,,,,,,,,,,,292.0,0.0,292.0,0.0,False
elasticnet_cv,0.887 +/- 0.035 (in 3 folds),0.887 +/- 0.035 (in 3 folds),0.949 +/- 0.016 (in 3 folds),0.949 +/- 0.016 (in 3 folds),0.781 +/- 0.041 (in 3 folds),0.482 +/- 0.109 (in 3 folds),0.781,0.483,disease.separate_past_exposures,,,,,,,,,,,,,292.0,0.0,292.0,0.0,False
elasticnet_cv.decision_thresholds_tuned,0.887 +/- 0.035 (in 3 folds),0.887 +/- 0.035 (in 3 folds),0.949 +/- 0.016 (in 3 folds),0.949 +/- 0.016 (in 3 folds),0.785 +/- 0.086 (in 3 folds),0.586 +/- 0.129 (in 3 folds),0.784,0.561,disease.separate_past_exposures,,,,,,,,,,,,,292.0,0.0,292.0,0.0,False
lasso_multiclass,0.883 +/- 0.026 (in 3 folds),0.883 +/- 0.026 (in 3 folds),0.949 +/- 0.015 (in 3 folds),0.949 +/- 0.015 (in 3 folds),0.790 +/- 0.042 (in 3 folds),0.541 +/- 0.051 (in 3 folds),0.791,0.528,disease.separate_past_exposures,0.778 +/- 0.064 (in 3 folds),0.525 +/- 0.078 (in 3 folds),0.051 +/- 0.000 (in 1 folds),0.895 +/- 0.018 (in 2 folds),0.895 +/- 0.018 (in 2 folds),0.956 +/- 0.011 (in 2 folds),0.956 +/- 0.011 (in 2 folds),0.777,0.51,0.017,Unknown,disease.separate_past_exposures,287.0,5.0,292.0,0.017123,False
lasso_multiclass.decision_thresholds_tuned,0.883 +/- 0.026 (in 3 folds),0.883 +/- 0.026 (in 3 folds),0.949 +/- 0.015 (in 3 folds),0.949 +/- 0.015 (in 3 folds),0.784 +/- 0.046 (in 3 folds),0.548 +/- 0.111 (in 3 folds),0.784,0.543,disease.separate_past_exposures,0.771 +/- 0.065 (in 3 folds),0.535 +/- 0.133 (in 3 folds),0.051 +/- 0.000 (in 1 folds),0.895 +/- 0.018 (in 2 folds),0.895 +/- 0.018 (in 2 folds),0.956 +/- 0.011 (in 2 folds),0.956 +/- 0.011 (in 2 folds),0.771,0.524,0.017,Unknown,disease.separate_past_exposures,287.0,5.0,292.0,0.017123,False
ridge_cv,0.848 +/- 0.065 (in 3 folds),0.848 +/- 0.065 (in 3 folds),0.930 +/- 0.030 (in 3 folds),0.930 +/- 0.030 (in 3 folds),0.677 +/- 0.019 (in 3 folds),0.075 +/- 0.129 (in 3 folds),0.677,0.117,disease.separate_past_exposures,0.661 +/- 0.007 (in 3 folds),0.078 +/- 0.115 (in 3 folds),0.036 +/- 0.022 (in 2 folds),0.918 +/- 0.000 (in 1 folds),0.918 +/- 0.000 (in 1 folds),0.962 +/- 0.000 (in 1 folds),0.962 +/- 0.000 (in 1 folds),0.661,0.115,0.024,Unknown,disease.separate_past_exposures,285.0,7.0,292.0,0.023973,False
ridge_cv.decision_thresholds_tuned,0.848 +/- 0.065 (in 3 folds),0.848 +/- 0.065 (in 3 folds),0.930 +/- 0.030 (in 3 folds),0.930 +/- 0.030 (in 3 folds),0.685 +/- 0.031 (in 3 folds),0.132 +/- 0.229 (in 3 folds),0.684,0.183,disease.separate_past_exposures,0.668 +/- 0.015 (in 3 folds),0.128 +/- 0.201 (in 3 folds),0.036 +/- 0.022 (in 2 folds),0.918 +/- 0.000 (in 1 folds),0.918 +/- 0.000 (in 1 folds),0.962 +/- 0.000 (in 1 folds),0.962 +/- 0.000 (in 1 folds),0.668,0.177,0.024,Unknown,disease.separate_past_exposures,285.0,7.0,292.0,0.023973,False

Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,Global evaluation column name global,Accuracy per fold with abstention,MCC per fold with abstention,Unknown/abstention proportion per fold with abstention,ROC-AUC (weighted OvO) per fold with abstention,ROC-AUC (macro OvO) per fold with abstention,au-PRC (weighted OvO) per fold with abstention,au-PRC (macro OvO) per fold with abstention,Accuracy global with abstention,MCC global with abstention,Unknown/abstention proportion global with abstention,Abstention label global with abstention,Global evaluation column name global with abstention,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
linearsvm_ovr,0.894 +/- 0.048 (in 3 folds),0.894 +/- 0.048 (in 3 folds),0.953 +/- 0.021 (in 3 folds),0.953 +/- 0.021 (in 3 folds),0.780 +/- 0.017 (in 3 folds),0.518 +/- 0.070 (in 3 folds),0.78,0.488,disease.separate_past_exposures,0.777 +/- 0.015 (in 3 folds),0.513 +/- 0.063 (in 3 folds),0.010 +/- 0.000 (in 1 folds),0.915 +/- 0.046 (in 2 folds),0.915 +/- 0.046 (in 2 folds),0.962 +/- 0.019 (in 2 folds),0.962 +/- 0.019 (in 2 folds),0.777,0.485,0.003,Unknown,disease.separate_past_exposures,291,1,292,0.003425,False
linearsvm_ovr.decision_thresholds_tuned,0.894 +/- 0.048 (in 3 folds),0.894 +/- 0.048 (in 3 folds),0.953 +/- 0.021 (in 3 folds),0.953 +/- 0.021 (in 3 folds),0.787 +/- 0.071 (in 3 folds),0.611 +/- 0.067 (in 3 folds),0.787,0.585,disease.separate_past_exposures,0.785 +/- 0.072 (in 3 folds),0.606 +/- 0.071 (in 3 folds),0.010 +/- 0.000 (in 1 folds),0.915 +/- 0.046 (in 2 folds),0.915 +/- 0.046 (in 2 folds),0.962 +/- 0.019 (in 2 folds),0.962 +/- 0.019 (in 2 folds),0.784,0.58,0.003,Unknown,disease.separate_past_exposures,291,1,292,0.003425,False
lasso_cv,0.890 +/- 0.031 (in 3 folds),0.890 +/- 0.031 (in 3 folds),0.950 +/- 0.014 (in 3 folds),0.950 +/- 0.014 (in 3 folds),0.774 +/- 0.039 (in 3 folds),0.468 +/- 0.102 (in 3 folds),0.774,0.466,disease.separate_past_exposures,,,,,,,,,,,,,292,0,292,0.0,False
lasso_cv.decision_thresholds_tuned,0.890 +/- 0.031 (in 3 folds),0.890 +/- 0.031 (in 3 folds),0.950 +/- 0.014 (in 3 folds),0.950 +/- 0.014 (in 3 folds),0.785 +/- 0.091 (in 3 folds),0.591 +/- 0.121 (in 3 folds),0.784,0.565,disease.separate_past_exposures,,,,,,,,,,,,,292,0,292,0.0,False
elasticnet_cv,0.887 +/- 0.035 (in 3 folds),0.887 +/- 0.035 (in 3 folds),0.949 +/- 0.016 (in 3 folds),0.949 +/- 0.016 (in 3 folds),0.781 +/- 0.041 (in 3 folds),0.482 +/- 0.109 (in 3 folds),0.781,0.483,disease.separate_past_exposures,,,,,,,,,,,,,292,0,292,0.0,False
elasticnet_cv.decision_thresholds_tuned,0.887 +/- 0.035 (in 3 folds),0.887 +/- 0.035 (in 3 folds),0.949 +/- 0.016 (in 3 folds),0.949 +/- 0.016 (in 3 folds),0.785 +/- 0.086 (in 3 folds),0.586 +/- 0.129 (in 3 folds),0.784,0.561,disease.separate_past_exposures,,,,,,,,,,,,,292,0,292,0.0,False
lasso_multiclass,0.883 +/- 0.026 (in 3 folds),0.883 +/- 0.026 (in 3 folds),0.949 +/- 0.015 (in 3 folds),0.949 +/- 0.015 (in 3 folds),0.790 +/- 0.042 (in 3 folds),0.541 +/- 0.051 (in 3 folds),0.791,0.528,disease.separate_past_exposures,0.778 +/- 0.064 (in 3 folds),0.525 +/- 0.078 (in 3 folds),0.051 +/- 0.000 (in 1 folds),0.895 +/- 0.018 (in 2 folds),0.895 +/- 0.018 (in 2 folds),0.956 +/- 0.011 (in 2 folds),0.956 +/- 0.011 (in 2 folds),0.777,0.51,0.017,Unknown,disease.separate_past_exposures,287,5,292,0.017123,False
lasso_multiclass.decision_thresholds_tuned,0.883 +/- 0.026 (in 3 folds),0.883 +/- 0.026 (in 3 folds),0.949 +/- 0.015 (in 3 folds),0.949 +/- 0.015 (in 3 folds),0.784 +/- 0.046 (in 3 folds),0.548 +/- 0.111 (in 3 folds),0.784,0.543,disease.separate_past_exposures,0.771 +/- 0.065 (in 3 folds),0.535 +/- 0.133 (in 3 folds),0.051 +/- 0.000 (in 1 folds),0.895 +/- 0.018 (in 2 folds),0.895 +/- 0.018 (in 2 folds),0.956 +/- 0.011 (in 2 folds),0.956 +/- 0.011 (in 2 folds),0.771,0.524,0.017,Unknown,disease.separate_past_exposures,287,5,292,0.017123,False
ridge_cv,0.848 +/- 0.065 (in 3 folds),0.848 +/- 0.065 (in 3 folds),0.930 +/- 0.030 (in 3 folds),0.930 +/- 0.030 (in 3 folds),0.677 +/- 0.019 (in 3 folds),0.075 +/- 0.129 (in 3 folds),0.677,0.117,disease.separate_past_exposures,0.661 +/- 0.007 (in 3 folds),0.078 +/- 0.115 (in 3 folds),0.036 +/- 0.022 (in 2 folds),0.918 +/- 0.000 (in 1 folds),0.918 +/- 0.000 (in 1 folds),0.962 +/- 0.000 (in 1 folds),0.962 +/- 0.000 (in 1 folds),0.661,0.115,0.024,Unknown,disease.separate_past_exposures,285,7,292,0.023973,False
ridge_cv.decision_thresholds_tuned,0.848 +/- 0.065 (in 3 folds),0.848 +/- 0.065 (in 3 folds),0.930 +/- 0.030 (in 3 folds),0.930 +/- 0.030 (in 3 folds),0.685 +/- 0.031 (in 3 folds),0.132 +/- 0.229 (in 3 folds),0.684,0.183,disease.separate_past_exposures,0.668 +/- 0.015 (in 3 folds),0.128 +/- 0.201 (in 3 folds),0.036 +/- 0.022 (in 2 folds),0.918 +/- 0.000 (in 1 folds),0.918 +/- 0.000 (in 1 folds),0.962 +/- 0.000 (in 1 folds),0.962 +/- 0.000 (in 1 folds),0.668,0.177,0.024,Unknown,disease.separate_past_exposures,285,7,292,0.023973,False


linearsvm_ovr,linearsvm_ovr.decision_thresholds_tuned,lasso_cv,lasso_cv.decision_thresholds_tuned
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.894 +/- 0.048 (in 3 folds) ROC-AUC (macro OvO): 0.894 +/- 0.048 (in 3 folds) au-PRC (weighted OvO): 0.953 +/- 0.021 (in 3 folds) au-PRC (macro OvO): 0.953 +/- 0.021 (in 3 folds) Accuracy: 0.780 +/- 0.017 (in 3 folds) MCC: 0.518 +/- 0.070 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.780 MCC: 0.488 Global evaluation column name: disease.separate_past_exposures Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.777 +/- 0.015 (in 3 folds) MCC: 0.513 +/- 0.063 (in 3 folds) Unknown/abstention proportion: 0.010 +/- 0.000 (in 1 folds) ROC-AUC (weighted OvO): 0.915 +/- 0.046 (in 2 folds) ROC-AUC (macro OvO): 0.915 +/- 0.046 (in 2 folds) au-PRC (weighted OvO): 0.962 +/- 0.019 (in 2 folds) au-PRC (macro OvO): 0.962 +/- 0.019 (in 2 folds) Global scores with abstention using column name disease.separate_past_exposures: Accuracy: 0.777 MCC: 0.485 Unknown/abstention proportion: 0.003 Abstention label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support  HIV 0.70 0.58 0.64 98 Healthy/Background 0.81 0.88 0.84 194  Unknown 0.00 0.00 0.00 0  accuracy 0.78 292  macro avg 0.50 0.49 0.49 292  weighted avg 0.77 0.78 0.77 292,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.894 +/- 0.048 (in 3 folds) ROC-AUC (macro OvO): 0.894 +/- 0.048 (in 3 folds) au-PRC (weighted OvO): 0.953 +/- 0.021 (in 3 folds) au-PRC (macro OvO): 0.953 +/- 0.021 (in 3 folds) Accuracy: 0.787 +/- 0.071 (in 3 folds) MCC: 0.611 +/- 0.067 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.787 MCC: 0.585 Global evaluation column name: disease.separate_past_exposures Per-fold scores with abstention (note that abstentions 
not included in probability-based scores): Accuracy: 0.785 +/- 0.072 (in 3 folds) MCC: 0.606 +/- 0.071 (in 3 folds) Unknown/abstention proportion: 0.010 +/- 0.000 (in 1 folds) ROC-AUC (weighted OvO): 0.915 +/- 0.046 (in 2 folds) ROC-AUC (macro OvO): 0.915 +/- 0.046 (in 2 folds) au-PRC (weighted OvO): 0.962 +/- 0.019 (in 2 folds) au-PRC (macro OvO): 0.962 +/- 0.019 (in 2 folds) Global scores with abstention using column name disease.separate_past_exposures: Accuracy: 0.784 MCC: 0.580 Unknown/abstention proportion: 0.003 Abstention label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support  HIV 0.63 0.87 0.73 98 Healthy/Background 0.92 0.74 0.82 194  Unknown 0.00 0.00 0.00 0  accuracy 0.78 292  macro avg 0.52 0.54 0.52 292  weighted avg 0.82 0.78 0.79 292,Per-fold scores: ROC-AUC (weighted OvO): 0.890 +/- 0.031 (in 3 folds) ROC-AUC (macro OvO): 0.890 +/- 0.031 (in 3 folds) au-PRC (weighted OvO): 0.950 +/- 0.014 (in 3 folds) au-PRC (macro OvO): 0.950 +/- 0.014 (in 3 folds) Accuracy: 0.774 +/- 0.039 (in 3 folds) MCC: 0.468 +/- 0.102 (in 3 folds) Global scores using column name disease.separate_past_exposures: Accuracy: 0.774 MCC: 0.466 Global evaluation column name: disease.separate_past_exposures Global classification report using column name disease.separate_past_exposures:  precision recall f1-score support  HIV 0.74 0.51 0.60 98 Healthy/Background 0.79 0.91 0.84 194  accuracy 0.77 292  macro avg 0.76 0.71 0.72 292  weighted avg 0.77 0.77 0.76 292,Per-fold scores: ROC-AUC (weighted OvO): 0.890 +/- 0.031 (in 3 folds) ROC-AUC (macro OvO): 0.890 +/- 0.031 (in 3 folds) au-PRC (weighted OvO): 0.950 +/- 0.014 (in 3 folds) au-PRC (macro OvO): 0.950 +/- 0.014 (in 3 folds) Accuracy: 0.785 +/- 0.091 (in 3 folds) MCC: 0.591 +/- 0.121 (in 3 folds) Global scores using column name disease.separate_past_exposures: Accuracy: 0.784 
MCC: 0.565 Global evaluation column name: disease.separate_past_exposures Global classification report using column name disease.separate_past_exposures:  precision recall f1-score support  HIV 0.64 0.84 0.72 98 Healthy/Background 0.90 0.76 0.82 194  accuracy 0.78 292  macro avg 0.77 0.80 0.77 292  weighted avg 0.81 0.78 0.79 292
,,,


elasticnet_cv,elasticnet_cv.decision_thresholds_tuned,lasso_multiclass,lasso_multiclass.decision_thresholds_tuned
Per-fold scores: ROC-AUC (weighted OvO): 0.887 +/- 0.035 (in 3 folds) ROC-AUC (macro OvO): 0.887 +/- 0.035 (in 3 folds) au-PRC (weighted OvO): 0.949 +/- 0.016 (in 3 folds) au-PRC (macro OvO): 0.949 +/- 0.016 (in 3 folds) Accuracy: 0.781 +/- 0.041 (in 3 folds) MCC: 0.482 +/- 0.109 (in 3 folds) Global scores using column name disease.separate_past_exposures: Accuracy: 0.781 MCC: 0.483 Global evaluation column name: disease.separate_past_exposures Global classification report using column name disease.separate_past_exposures:  precision recall f1-score support  HIV 0.76 0.51 0.61 98 Healthy/Background 0.79 0.92 0.85 194  accuracy 0.78 292  macro avg 0.77 0.71 0.73 292  weighted avg 0.78 0.78 0.77 292,Per-fold scores: ROC-AUC (weighted OvO): 0.887 +/- 0.035 (in 3 folds) ROC-AUC (macro OvO): 0.887 +/- 0.035 (in 3 folds) au-PRC (weighted OvO): 0.949 +/- 0.016 (in 3 folds) au-PRC (macro OvO): 0.949 +/- 0.016 (in 3 folds) Accuracy: 0.785 +/- 0.086 (in 3 folds) MCC: 0.586 +/- 0.129 (in 3 folds) Global scores using column name disease.separate_past_exposures: Accuracy: 0.784 MCC: 0.561 Global evaluation column name: disease.separate_past_exposures Global classification report using column name disease.separate_past_exposures:  precision recall f1-score support  HIV 0.64 0.83 0.72 98 Healthy/Background 0.90 0.76 0.82 194  accuracy 0.78 292  macro avg 0.77 0.79 0.77 292  weighted avg 0.81 0.78 0.79 292,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.883 +/- 0.026 (in 3 folds) ROC-AUC (macro OvO): 0.883 +/- 0.026 (in 3 folds) au-PRC (weighted OvO): 0.949 +/- 0.015 (in 3 folds) au-PRC (macro OvO): 0.949 +/- 0.015 (in 3 folds) Accuracy: 0.790 +/- 0.042 (in 3 folds) MCC: 0.541 +/- 0.051 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.791 MCC: 0.528 Global evaluation column name: disease.separate_past_exposures Per-fold scores with abstention (note that abstentions not included in probability-based scores): 
Accuracy: 0.778 +/- 0.064 (in 3 folds) MCC: 0.525 +/- 0.078 (in 3 folds) Unknown/abstention proportion: 0.051 +/- 0.000 (in 1 folds) ROC-AUC (weighted OvO): 0.895 +/- 0.018 (in 2 folds) ROC-AUC (macro OvO): 0.895 +/- 0.018 (in 2 folds) au-PRC (weighted OvO): 0.956 +/- 0.011 (in 2 folds) au-PRC (macro OvO): 0.956 +/- 0.011 (in 2 folds) Global scores with abstention using column name disease.separate_past_exposures: Accuracy: 0.777 MCC: 0.510 Unknown/abstention proportion: 0.017 Abstention label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support  HIV 0.68 0.66 0.67 98 Healthy/Background 0.84 0.84 0.84 194  Unknown 0.00 0.00 0.00 0  accuracy 0.78 292  macro avg 0.51 0.50 0.50 292  weighted avg 0.79 0.78 0.78 292,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.883 +/- 0.026 (in 3 folds) ROC-AUC (macro OvO): 0.883 +/- 0.026 (in 3 folds) au-PRC (weighted OvO): 0.949 +/- 0.015 (in 3 folds) au-PRC (macro OvO): 0.949 +/- 0.015 (in 3 folds) Accuracy: 0.784 +/- 0.046 (in 3 folds) MCC: 0.548 +/- 0.111 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.784 MCC: 0.543 Global evaluation column name: disease.separate_past_exposures Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.771 +/- 0.065 (in 3 folds) MCC: 0.535 +/- 0.133 (in 3 folds) Unknown/abstention proportion: 0.051 +/- 0.000 (in 1 folds) ROC-AUC (weighted OvO): 0.895 +/- 0.018 (in 2 folds) ROC-AUC (macro OvO): 0.895 +/- 0.018 (in 2 folds) au-PRC (weighted OvO): 0.956 +/- 0.011 (in 2 folds) au-PRC (macro OvO): 0.956 +/- 0.011 (in 2 folds) Global scores with abstention using column name disease.separate_past_exposures: Accuracy: 0.771 MCC: 0.524 Unknown/abstention proportion: 0.017 Abstention label: Unknown Global evaluation column name: 
disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support  HIV 0.64 0.76 0.69 98 Healthy/Background 0.88 0.78 0.83 194  Unknown 0.00 0.00 0.00 0  accuracy 0.77 292  macro avg 0.51 0.51 0.51 292  weighted avg 0.80 0.77 0.78 292
,,,


ridge_cv,ridge_cv.decision_thresholds_tuned,xgboost,xgboost.decision_thresholds_tuned
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.848 +/- 0.065 (in 3 folds) ROC-AUC (macro OvO): 0.848 +/- 0.065 (in 3 folds) au-PRC (weighted OvO): 0.930 +/- 0.030 (in 3 folds) au-PRC (macro OvO): 0.930 +/- 0.030 (in 3 folds) Accuracy: 0.677 +/- 0.019 (in 3 folds) MCC: 0.075 +/- 0.129 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.677 MCC: 0.117 Global evaluation column name: disease.separate_past_exposures Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.661 +/- 0.007 (in 3 folds) MCC: 0.078 +/- 0.115 (in 3 folds) Unknown/abstention proportion: 0.036 +/- 0.022 (in 2 folds) ROC-AUC (weighted OvO): 0.918 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.918 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.962 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.962 +/- 0.000 (in 1 folds) Global scores with abstention using column name disease.separate_past_exposures: Accuracy: 0.661 MCC: 0.115 Unknown/abstention proportion: 0.024 Abstention label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support  HIV 0.57 0.08 0.14 98 Healthy/Background 0.68 0.95 0.80 194  Unknown 0.00 0.00 0.00 0  accuracy 0.66 292  macro avg 0.42 0.35 0.31 292  weighted avg 0.65 0.66 0.58 292,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.848 +/- 0.065 (in 3 folds) ROC-AUC (macro OvO): 0.848 +/- 0.065 (in 3 folds) au-PRC (weighted OvO): 0.930 +/- 0.030 (in 3 folds) au-PRC (macro OvO): 0.930 +/- 0.030 (in 3 folds) Accuracy: 0.685 +/- 0.031 (in 3 folds) MCC: 0.132 +/- 0.229 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.684 MCC: 0.183 Global evaluation column name: disease.separate_past_exposures Per-fold scores with abstention (note that abstentions 
not included in probability-based scores): Accuracy: 0.668 +/- 0.015 (in 3 folds) MCC: 0.128 +/- 0.201 (in 3 folds) Unknown/abstention proportion: 0.036 +/- 0.022 (in 2 folds) ROC-AUC (weighted OvO): 0.918 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.918 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.962 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.962 +/- 0.000 (in 1 folds) Global scores with abstention using column name disease.separate_past_exposures: Accuracy: 0.668 MCC: 0.177 Unknown/abstention proportion: 0.024 Abstention label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support  HIV 0.56 0.20 0.30 98 Healthy/Background 0.70 0.90 0.79 194  Unknown 0.00 0.00 0.00 0  accuracy 0.67 292  macro avg 0.42 0.37 0.36 292  weighted avg 0.65 0.67 0.63 292,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.837 +/- 0.014 (in 3 folds) ROC-AUC (macro OvO): 0.837 +/- 0.014 (in 3 folds) au-PRC (weighted OvO): 0.923 +/- 0.005 (in 3 folds) au-PRC (macro OvO): 0.923 +/- 0.005 (in 3 folds) Accuracy: 0.739 +/- 0.030 (in 3 folds) MCC: 0.411 +/- 0.099 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.739 MCC: 0.409 Global evaluation column name: disease.separate_past_exposures Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.736 +/- 0.025 (in 3 folds) MCC: 0.407 +/- 0.093 (in 3 folds) Unknown/abstention proportion: 0.010 +/- 0.000 (in 1 folds) ROC-AUC (weighted OvO): 0.829 +/- 0.009 (in 2 folds) ROC-AUC (macro OvO): 0.829 +/- 0.009 (in 2 folds) au-PRC (weighted OvO): 0.921 +/- 0.002 (in 2 folds) au-PRC (macro OvO): 0.921 +/- 0.002 (in 2 folds) Global scores with abstention using column name disease.separate_past_exposures: Accuracy: 0.736 MCC: 0.407 Unknown/abstention proportion: 0.003 Abstention label: 
Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support  HIV 0.61 0.59 0.60 98 Healthy/Background 0.80 0.81 0.81 194  Unknown 0.00 0.00 0.00 0  accuracy 0.74 292  macro avg 0.47 0.47 0.47 292  weighted avg 0.74 0.74 0.74 292,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.837 +/- 0.014 (in 3 folds) ROC-AUC (macro OvO): 0.837 +/- 0.014 (in 3 folds) au-PRC (weighted OvO): 0.923 +/- 0.005 (in 3 folds) au-PRC (macro OvO): 0.923 +/- 0.005 (in 3 folds) Accuracy: 0.732 +/- 0.036 (in 3 folds) MCC: 0.408 +/- 0.113 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.732 MCC: 0.407 Global evaluation column name: disease.separate_past_exposures Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.729 +/- 0.032 (in 3 folds) MCC: 0.404 +/- 0.106 (in 3 folds) Unknown/abstention proportion: 0.010 +/- 0.000 (in 1 folds) ROC-AUC (weighted OvO): 0.829 +/- 0.009 (in 2 folds) ROC-AUC (macro OvO): 0.829 +/- 0.009 (in 2 folds) au-PRC (weighted OvO): 0.921 +/- 0.002 (in 2 folds) au-PRC (macro OvO): 0.921 +/- 0.002 (in 2 folds) Global scores with abstention using column name disease.separate_past_exposures: Accuracy: 0.729 MCC: 0.404 Unknown/abstention proportion: 0.003 Abstention label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support  HIV 0.59 0.62 0.61 98 Healthy/Background 0.81 0.78 0.80 194  Unknown 0.00 0.00 0.00 0  accuracy 0.73 292  macro avg 0.47 0.47 0.47 292  weighted avg 0.74 0.73 0.73 292
,,,


rf_multiclass,rf_multiclass.decision_thresholds_tuned
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.825 +/- 0.007 (in 3 folds) ROC-AUC (macro OvO): 0.825 +/- 0.007 (in 3 folds) au-PRC (weighted OvO): 0.904 +/- 0.005 (in 3 folds) au-PRC (macro OvO): 0.904 +/- 0.005 (in 3 folds) Accuracy: 0.761 +/- 0.021 (in 3 folds) MCC: 0.464 +/- 0.070 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.761 MCC: 0.455 Global evaluation column name: disease.separate_past_exposures Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.754 +/- 0.028 (in 3 folds) MCC: 0.454 +/- 0.075 (in 3 folds) Unknown/abstention proportion: 0.015 +/- 0.007 (in 2 folds) ROC-AUC (weighted OvO): 0.831 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.831 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.902 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.902 +/- 0.000 (in 1 folds) Global scores with abstention using column name disease.separate_past_exposures: Accuracy: 0.753 MCC: 0.446 Unknown/abstention proportion: 0.010 Abstention label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support  HIV 0.65 0.60 0.62 98 Healthy/Background 0.81 0.83 0.82 194  Unknown 0.00 0.00 0.00 0  accuracy 0.75 292  macro avg 0.49 0.48 0.48 292  weighted avg 0.76 0.75 0.76 292,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.825 +/- 0.007 (in 3 folds) ROC-AUC (macro OvO): 0.825 +/- 0.007 (in 3 folds) au-PRC (weighted OvO): 0.904 +/- 0.005 (in 3 folds) au-PRC (macro OvO): 0.904 +/- 0.005 (in 3 folds) Accuracy: 0.723 +/- 0.040 (in 3 folds) MCC: 0.474 +/- 0.051 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.723 MCC: 0.473 Global evaluation column name: disease.separate_past_exposures Per-fold scores with abstention (note that abstentions 
not included in probability-based scores): Accuracy: 0.716 +/- 0.046 (in 3 folds) MCC: 0.464 +/- 0.058 (in 3 folds) Unknown/abstention proportion: 0.015 +/- 0.007 (in 2 folds) ROC-AUC (weighted OvO): 0.831 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.831 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.902 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.902 +/- 0.000 (in 1 folds) Global scores with abstention using column name disease.separate_past_exposures: Accuracy: 0.716 MCC: 0.462 Unknown/abstention proportion: 0.010 Abstention label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support  HIV 0.56 0.82 0.66 98 Healthy/Background 0.89 0.66 0.76 194  Unknown 0.00 0.00 0.00 0  accuracy 0.72 292  macro avg 0.48 0.49 0.47 292  weighted avg 0.78 0.72 0.73 292
,


---

# GeneLocus.TCR, TargetObsColumnEnum.lupus_vs_healthy trained on train_smaller set

## Specimen predictions on validation set

Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,Accuracy per fold with abstention,MCC per fold with abstention,Unknown/abstention proportion per fold with abstention,ROC-AUC (weighted OvO) per fold with abstention,ROC-AUC (macro OvO) per fold with abstention,au-PRC (weighted OvO) per fold with abstention,au-PRC (macro OvO) per fold with abstention,Accuracy global with abstention,MCC global with abstention,Unknown/abstention proportion global with abstention,Abstention label global with abstention,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
elasticnet_cv,0.951 +/- 0.033 (in 3 folds),0.951 +/- 0.033 (in 3 folds),0.892 +/- 0.058 (in 3 folds),0.892 +/- 0.058 (in 3 folds),0.788 +/- 0.020 (in 3 folds),0.249 +/- 0.219 (in 3 folds),0.788,0.309,0.779 +/- 0.021 (in 3 folds),0.264 +/- 0.127 (in 3 folds),0.017 +/- 0.000 (in 2 folds),0.913 +/- 0.000 (in 1 folds),0.913 +/- 0.000 (in 1 folds),0.825 +/- 0.000 (in 1 folds),0.825 +/- 0.000 (in 1 folds),0.779,0.275,0.012,Unknown,170.0,2.0,172.0,0.011628,False
ridge_cv,0.945 +/- 0.029 (in 3 folds),0.945 +/- 0.029 (in 3 folds),0.875 +/- 0.054 (in 3 folds),0.875 +/- 0.054 (in 3 folds),0.759 +/- 0.008 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.759,0.0,0.750 +/- 0.008 (in 3 folds),0.027 +/- 0.081 (in 3 folds),0.017 +/- 0.000 (in 2 folds),0.913 +/- 0.000 (in 1 folds),0.913 +/- 0.000 (in 1 folds),0.824 +/- 0.000 (in 1 folds),0.824 +/- 0.000 (in 1 folds),0.75,0.032,0.012,Unknown,170.0,2.0,172.0,0.011628,True
linearsvm_ovr,0.925 +/- 0.080 (in 3 folds),0.925 +/- 0.080 (in 3 folds),0.862 +/- 0.117 (in 3 folds),0.862 +/- 0.117 (in 3 folds),0.898 +/- 0.047 (in 3 folds),0.724 +/- 0.122 (in 3 folds),0.899,0.72,0.878 +/- 0.053 (in 3 folds),0.681 +/- 0.125 (in 3 folds),0.023 +/- 0.010 (in 3 folds),,,,,0.878,0.675,0.023,Unknown,168.0,4.0,172.0,0.023256,False
lasso_multiclass,0.925 +/- 0.080 (in 3 folds),0.925 +/- 0.080 (in 3 folds),0.862 +/- 0.117 (in 3 folds),0.862 +/- 0.117 (in 3 folds),0.892 +/- 0.038 (in 3 folds),0.708 +/- 0.096 (in 3 folds),0.893,0.701,0.872 +/- 0.045 (in 3 folds),0.665 +/- 0.100 (in 3 folds),0.023 +/- 0.010 (in 3 folds),,,,,0.872,0.657,0.023,Unknown,168.0,4.0,172.0,0.023256,False
lasso_cv,0.919 +/- 0.021 (in 3 folds),0.919 +/- 0.021 (in 3 folds),0.825 +/- 0.047 (in 3 folds),0.825 +/- 0.047 (in 3 folds),0.840 +/- 0.061 (in 3 folds),0.507 +/- 0.220 (in 3 folds),0.84,0.531,0.825 +/- 0.048 (in 3 folds),0.474 +/- 0.170 (in 3 folds),0.026 +/- 0.012 (in 2 folds),0.908 +/- 0.000 (in 1 folds),0.908 +/- 0.000 (in 1 folds),0.803 +/- 0.000 (in 1 folds),0.803 +/- 0.000 (in 1 folds),0.826,0.482,0.017,Unknown,169.0,3.0,172.0,0.017442,False
xgboost,0.918 +/- 0.033 (in 3 folds),0.918 +/- 0.033 (in 3 folds),0.829 +/- 0.051 (in 3 folds),0.829 +/- 0.051 (in 3 folds),0.887 +/- 0.027 (in 3 folds),0.684 +/- 0.067 (in 3 folds),0.887,0.68,0.866 +/- 0.021 (in 3 folds),0.639 +/- 0.044 (in 3 folds),0.023 +/- 0.010 (in 3 folds),,,,,0.866,0.635,0.023,Unknown,168.0,4.0,172.0,0.023256,False
rf_multiclass,0.909 +/- 0.055 (in 3 folds),0.909 +/- 0.055 (in 3 folds),0.827 +/- 0.096 (in 3 folds),0.827 +/- 0.096 (in 3 folds),0.869 +/- 0.041 (in 3 folds),0.646 +/- 0.086 (in 3 folds),0.869,0.63,0.849 +/- 0.037 (in 3 folds),0.605 +/- 0.072 (in 3 folds),0.023 +/- 0.010 (in 3 folds),,,,,0.849,0.589,0.023,Unknown,168.0,4.0,172.0,0.023256,False
dummy_stratified,0.509 +/- 0.080 (in 3 folds),0.509 +/- 0.080 (in 3 folds),0.311 +/- 0.082 (in 3 folds),0.311 +/- 0.082 (in 3 folds),0.586 +/- 0.025 (in 3 folds),0.016 +/- 0.155 (in 3 folds),0.581,-0.001,0.418 +/- 0.121 (in 3 folds),-0.031 +/- 0.092 (in 3 folds),0.280 +/- 0.233 (in 3 folds),,,,,0.419,-0.028,0.279,Unknown,124.0,48.0,172.0,0.27907,False
dummy_most_frequent,0.500 +/- 0.000 (in 3 folds),0.500 +/- 0.000 (in 3 folds),0.241 +/- 0.008 (in 3 folds),0.241 +/- 0.008 (in 3 folds),0.759 +/- 0.008 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.759,0.0,0.750 +/- 0.008 (in 3 folds),0.027 +/- 0.081 (in 3 folds),0.017 +/- 0.000 (in 2 folds),0.500 +/- 0.000 (in 1 folds),0.500 +/- 0.000 (in 1 folds),0.246 +/- 0.000 (in 1 folds),0.246 +/- 0.000 (in 1 folds),0.75,0.032,0.012,Unknown,170.0,2.0,172.0,0.011628,True
"All results, sorted",,,,,,,,,,,,,,,,,,,,,,,,

Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,Accuracy per fold with abstention,MCC per fold with abstention,Unknown/abstention proportion per fold with abstention,ROC-AUC (weighted OvO) per fold with abstention,ROC-AUC (macro OvO) per fold with abstention,au-PRC (weighted OvO) per fold with abstention,au-PRC (macro OvO) per fold with abstention,Accuracy global with abstention,MCC global with abstention,Unknown/abstention proportion global with abstention,Abstention label global with abstention,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes
elasticnet_cv,0.951 +/- 0.033 (in 3 folds),0.951 +/- 0.033 (in 3 folds),0.892 +/- 0.058 (in 3 folds),0.892 +/- 0.058 (in 3 folds),0.788 +/- 0.020 (in 3 folds),0.249 +/- 0.219 (in 3 folds),0.788,0.309,0.779 +/- 0.021 (in 3 folds),0.264 +/- 0.127 (in 3 folds),0.017 +/- 0.000 (in 2 folds),0.913 +/- 0.000 (in 1 folds),0.913 +/- 0.000 (in 1 folds),0.825 +/- 0.000 (in 1 folds),0.825 +/- 0.000 (in 1 folds),0.779,0.275,0.012,Unknown,170,2,172,0.011628,False
ridge_cv,0.945 +/- 0.029 (in 3 folds),0.945 +/- 0.029 (in 3 folds),0.875 +/- 0.054 (in 3 folds),0.875 +/- 0.054 (in 3 folds),0.759 +/- 0.008 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.759,0.0,0.750 +/- 0.008 (in 3 folds),0.027 +/- 0.081 (in 3 folds),0.017 +/- 0.000 (in 2 folds),0.913 +/- 0.000 (in 1 folds),0.913 +/- 0.000 (in 1 folds),0.824 +/- 0.000 (in 1 folds),0.824 +/- 0.000 (in 1 folds),0.75,0.032,0.012,Unknown,170,2,172,0.011628,True
linearsvm_ovr,0.925 +/- 0.080 (in 3 folds),0.925 +/- 0.080 (in 3 folds),0.862 +/- 0.117 (in 3 folds),0.862 +/- 0.117 (in 3 folds),0.898 +/- 0.047 (in 3 folds),0.724 +/- 0.122 (in 3 folds),0.899,0.72,0.878 +/- 0.053 (in 3 folds),0.681 +/- 0.125 (in 3 folds),0.023 +/- 0.010 (in 3 folds),,,,,0.878,0.675,0.023,Unknown,168,4,172,0.023256,False
lasso_multiclass,0.925 +/- 0.080 (in 3 folds),0.925 +/- 0.080 (in 3 folds),0.862 +/- 0.117 (in 3 folds),0.862 +/- 0.117 (in 3 folds),0.892 +/- 0.038 (in 3 folds),0.708 +/- 0.096 (in 3 folds),0.893,0.701,0.872 +/- 0.045 (in 3 folds),0.665 +/- 0.100 (in 3 folds),0.023 +/- 0.010 (in 3 folds),,,,,0.872,0.657,0.023,Unknown,168,4,172,0.023256,False
lasso_cv,0.919 +/- 0.021 (in 3 folds),0.919 +/- 0.021 (in 3 folds),0.825 +/- 0.047 (in 3 folds),0.825 +/- 0.047 (in 3 folds),0.840 +/- 0.061 (in 3 folds),0.507 +/- 0.220 (in 3 folds),0.84,0.531,0.825 +/- 0.048 (in 3 folds),0.474 +/- 0.170 (in 3 folds),0.026 +/- 0.012 (in 2 folds),0.908 +/- 0.000 (in 1 folds),0.908 +/- 0.000 (in 1 folds),0.803 +/- 0.000 (in 1 folds),0.803 +/- 0.000 (in 1 folds),0.826,0.482,0.017,Unknown,169,3,172,0.017442,False
xgboost,0.918 +/- 0.033 (in 3 folds),0.918 +/- 0.033 (in 3 folds),0.829 +/- 0.051 (in 3 folds),0.829 +/- 0.051 (in 3 folds),0.887 +/- 0.027 (in 3 folds),0.684 +/- 0.067 (in 3 folds),0.887,0.68,0.866 +/- 0.021 (in 3 folds),0.639 +/- 0.044 (in 3 folds),0.023 +/- 0.010 (in 3 folds),,,,,0.866,0.635,0.023,Unknown,168,4,172,0.023256,False
rf_multiclass,0.909 +/- 0.055 (in 3 folds),0.909 +/- 0.055 (in 3 folds),0.827 +/- 0.096 (in 3 folds),0.827 +/- 0.096 (in 3 folds),0.869 +/- 0.041 (in 3 folds),0.646 +/- 0.086 (in 3 folds),0.869,0.63,0.849 +/- 0.037 (in 3 folds),0.605 +/- 0.072 (in 3 folds),0.023 +/- 0.010 (in 3 folds),,,,,0.849,0.589,0.023,Unknown,168,4,172,0.023256,False
dummy_stratified,0.509 +/- 0.080 (in 3 folds),0.509 +/- 0.080 (in 3 folds),0.311 +/- 0.082 (in 3 folds),0.311 +/- 0.082 (in 3 folds),0.586 +/- 0.025 (in 3 folds),0.016 +/- 0.155 (in 3 folds),0.581,-0.001,0.418 +/- 0.121 (in 3 folds),-0.031 +/- 0.092 (in 3 folds),0.280 +/- 0.233 (in 3 folds),,,,,0.419,-0.028,0.279,Unknown,124,48,172,0.27907,False
dummy_most_frequent,0.500 +/- 0.000 (in 3 folds),0.500 +/- 0.000 (in 3 folds),0.241 +/- 0.008 (in 3 folds),0.241 +/- 0.008 (in 3 folds),0.759 +/- 0.008 (in 3 folds),0.000 +/- 0.000 (in 3 folds),0.759,0.0,0.750 +/- 0.008 (in 3 folds),0.027 +/- 0.081 (in 3 folds),0.017 +/- 0.000 (in 2 folds),0.500 +/- 0.000 (in 1 folds),0.500 +/- 0.000 (in 1 folds),0.246 +/- 0.000 (in 1 folds),0.246 +/- 0.000 (in 1 folds),0.75,0.032,0.012,Unknown,170,2,172,0.011628,True


elasticnet_cv,ridge_cv,linearsvm_ovr,lasso_multiclass
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.951 +/- 0.033 (in 3 folds) ROC-AUC (macro OvO): 0.951 +/- 0.033 (in 3 folds) au-PRC (weighted OvO): 0.892 +/- 0.058 (in 3 folds) au-PRC (macro OvO): 0.892 +/- 0.058 (in 3 folds) Accuracy: 0.788 +/- 0.020 (in 3 folds) MCC: 0.249 +/- 0.219 (in 3 folds) Global scores without abstention: Accuracy: 0.788 MCC: 0.309 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.779 +/- 0.021 (in 3 folds) MCC: 0.264 +/- 0.127 (in 3 folds) Unknown/abstention proportion: 0.017 +/- 0.000 (in 2 folds) ROC-AUC (weighted OvO): 0.913 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.913 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.825 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.825 +/- 0.000 (in 1 folds) Global scores with abstention: Accuracy: 0.779 MCC: 0.275 Unknown/abstention proportion: 0.012 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support Healthy/Background 0.78 0.99 0.87 130  Lupus 1.00 0.12 0.21 42  Unknown 0.00 0.00 0.00 0  accuracy 0.78 172  macro avg 0.59 0.37 0.36 172  weighted avg 0.84 0.78 0.71 172,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.945 +/- 0.029 (in 3 folds) ROC-AUC (macro OvO): 0.945 +/- 0.029 (in 3 folds) au-PRC (weighted OvO): 0.875 +/- 0.054 (in 3 folds) au-PRC (macro OvO): 0.875 +/- 0.054 (in 3 folds) Accuracy: 0.759 +/- 0.008 (in 3 folds) MCC: 0.000 +/- 0.000 (in 3 folds) Global scores without abstention: Accuracy: 0.759 MCC: 0.000 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.750 +/- 0.008 (in 3 folds) MCC: 0.027 +/- 0.081 (in 3 folds) Unknown/abstention proportion: 0.017 +/- 0.000 (in 2 folds) ROC-AUC (weighted OvO): 0.913 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.913 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.824 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.824 +/- 0.000 (in 1 folds) Global 
scores with abstention: Accuracy: 0.750 MCC: 0.032 Unknown/abstention proportion: 0.012 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support Healthy/Background 0.76 0.99 0.86 130  Lupus 0.00 0.00 0.00 42  Unknown 0.00 0.00 0.00 0  accuracy 0.75 172  macro avg 0.25 0.33 0.29 172  weighted avg 0.57 0.75 0.65 172,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.925 +/- 0.080 (in 3 folds) ROC-AUC (macro OvO): 0.925 +/- 0.080 (in 3 folds) au-PRC (weighted OvO): 0.862 +/- 0.117 (in 3 folds) au-PRC (macro OvO): 0.862 +/- 0.117 (in 3 folds) Accuracy: 0.898 +/- 0.047 (in 3 folds) MCC: 0.724 +/- 0.122 (in 3 folds) Global scores without abstention: Accuracy: 0.899 MCC: 0.720 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.878 +/- 0.053 (in 3 folds) MCC: 0.681 +/- 0.125 (in 3 folds) Unknown/abstention proportion: 0.023 +/- 0.010 (in 3 folds) Global scores with abstention: Accuracy: 0.878 MCC: 0.675 Unknown/abstention proportion: 0.023 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support Healthy/Background 0.92 0.92 0.92 130  Lupus 0.82 0.74 0.78 42  Unknown 0.00 0.00 0.00 0  accuracy 0.88 172  macro avg 0.58 0.55 0.57 172  weighted avg 0.90 0.88 0.89 172,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.925 +/- 0.080 (in 3 folds) ROC-AUC (macro OvO): 0.925 +/- 0.080 (in 3 folds) au-PRC (weighted OvO): 0.862 +/- 0.117 (in 3 folds) au-PRC (macro OvO): 0.862 +/- 0.117 (in 3 folds) Accuracy: 0.892 +/- 0.038 (in 3 folds) MCC: 0.708 +/- 0.096 (in 3 folds) Global scores without abstention: Accuracy: 0.893 MCC: 0.701 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.872 +/- 0.045 (in 3 folds) MCC: 0.665 +/- 0.100 (in 3 folds) Unknown/abstention proportion: 0.023 +/- 0.010 (in 3 folds) Global scores with abstention: Accuracy: 0.872 
MCC: 0.657 Unknown/abstention proportion: 0.023 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support Healthy/Background 0.92 0.92 0.92 130  Lupus 0.81 0.71 0.76 42  Unknown 0.00 0.00 0.00 0  accuracy 0.87 172  macro avg 0.58 0.55 0.56 172  weighted avg 0.89 0.87 0.88 172
,,,


lasso_cv,xgboost,rf_multiclass,dummy_stratified
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.919 +/- 0.021 (in 3 folds) ROC-AUC (macro OvO): 0.919 +/- 0.021 (in 3 folds) au-PRC (weighted OvO): 0.825 +/- 0.047 (in 3 folds) au-PRC (macro OvO): 0.825 +/- 0.047 (in 3 folds) Accuracy: 0.840 +/- 0.061 (in 3 folds) MCC: 0.507 +/- 0.220 (in 3 folds) Global scores without abstention: Accuracy: 0.840 MCC: 0.531 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.825 +/- 0.048 (in 3 folds) MCC: 0.474 +/- 0.170 (in 3 folds) Unknown/abstention proportion: 0.026 +/- 0.012 (in 2 folds) ROC-AUC (weighted OvO): 0.908 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.908 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.803 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.803 +/- 0.000 (in 1 folds) Global scores with abstention: Accuracy: 0.826 MCC: 0.482 Unknown/abstention proportion: 0.017 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support Healthy/Background 0.83 0.98 0.90 130  Lupus 1.00 0.33 0.50 42  Unknown 0.00 0.00 0.00 0  accuracy 0.83 172  macro avg 0.61 0.44 0.47 172  weighted avg 0.87 0.83 0.80 172,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.918 +/- 0.033 (in 3 folds) ROC-AUC (macro OvO): 0.918 +/- 0.033 (in 3 folds) au-PRC (weighted OvO): 0.829 +/- 0.051 (in 3 folds) au-PRC (macro OvO): 0.829 +/- 0.051 (in 3 folds) Accuracy: 0.887 +/- 0.027 (in 3 folds) MCC: 0.684 +/- 0.067 (in 3 folds) Global scores without abstention: Accuracy: 0.887 MCC: 0.680 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.866 +/- 0.021 (in 3 folds) MCC: 0.639 +/- 0.044 (in 3 folds) Unknown/abstention proportion: 0.023 +/- 0.010 (in 3 folds) Global scores with abstention: Accuracy: 0.866 MCC: 0.635 Unknown/abstention proportion: 0.023 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support 
Healthy/Background 0.90 0.93 0.92 130  Lupus 0.82 0.67 0.74 42  Unknown 0.00 0.00 0.00 0  accuracy 0.87 172  macro avg 0.58 0.53 0.55 172  weighted avg 0.88 0.87 0.87 172,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.909 +/- 0.055 (in 3 folds) ROC-AUC (macro OvO): 0.909 +/- 0.055 (in 3 folds) au-PRC (weighted OvO): 0.827 +/- 0.096 (in 3 folds) au-PRC (macro OvO): 0.827 +/- 0.096 (in 3 folds) Accuracy: 0.869 +/- 0.041 (in 3 folds) MCC: 0.646 +/- 0.086 (in 3 folds) Global scores without abstention: Accuracy: 0.869 MCC: 0.630 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.849 +/- 0.037 (in 3 folds) MCC: 0.605 +/- 0.072 (in 3 folds) Unknown/abstention proportion: 0.023 +/- 0.010 (in 3 folds) Global scores with abstention: Accuracy: 0.849 MCC: 0.589 Unknown/abstention proportion: 0.023 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support Healthy/Background 0.89 0.92 0.90 130  Lupus 0.77 0.64 0.70 42  Unknown 0.00 0.00 0.00 0  accuracy 0.85 172  macro avg 0.56 0.52 0.54 172  weighted avg 0.86 0.85 0.86 172,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.509 +/- 0.080 (in 3 folds) ROC-AUC (macro OvO): 0.509 +/- 0.080 (in 3 folds) au-PRC (weighted OvO): 0.311 +/- 0.082 (in 3 folds) au-PRC (macro OvO): 0.311 +/- 0.082 (in 3 folds) Accuracy: 0.586 +/- 0.025 (in 3 folds) MCC: 0.016 +/- 0.155 (in 3 folds) Global scores without abstention: Accuracy: 0.581 MCC: -0.001 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.418 +/- 0.121 (in 3 folds) MCC: -0.031 +/- 0.092 (in 3 folds) Unknown/abstention proportion: 0.280 +/- 0.233 (in 3 folds) Global scores with abstention: Accuracy: 0.419 MCC: -0.028 Unknown/abstention proportion: 0.279 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support Healthy/Background 0.71 0.47 0.56 130  
Lupus 0.29 0.26 0.28 42  Unknown 0.00 0.00 0.00 0  accuracy 0.42 172  macro avg 0.33 0.24 0.28 172  weighted avg 0.61 0.42 0.49 172
,,,


dummy_most_frequent
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.500 +/- 0.000 (in 3 folds) ROC-AUC (macro OvO): 0.500 +/- 0.000 (in 3 folds) au-PRC (weighted OvO): 0.241 +/- 0.008 (in 3 folds) au-PRC (macro OvO): 0.241 +/- 0.008 (in 3 folds) Accuracy: 0.759 +/- 0.008 (in 3 folds) MCC: 0.000 +/- 0.000 (in 3 folds) Global scores without abstention: Accuracy: 0.759 MCC: 0.000 Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.750 +/- 0.008 (in 3 folds) MCC: 0.027 +/- 0.081 (in 3 folds) Unknown/abstention proportion: 0.017 +/- 0.000 (in 2 folds) ROC-AUC (weighted OvO): 0.500 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.500 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.246 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.246 +/- 0.000 (in 1 folds) Global scores with abstention: Accuracy: 0.750 MCC: 0.032 Unknown/abstention proportion: 0.012 Abstention label: Unknown Global classification report with abstention:  precision recall f1-score support Healthy/Background 0.76 0.99 0.86 130  Lupus 0.00 0.00 0.00 42  Unknown 0.00 0.00 0.00 0  accuracy 0.75 172  macro avg 0.25 0.33 0.29 172  weighted avg 0.57 0.75 0.65 172


## Apply train-smaller model -- Test set performance - With and without tuning on validation set

Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,Global evaluation column name global,Accuracy per fold with abstention,MCC per fold with abstention,Unknown/abstention proportion per fold with abstention,Accuracy global with abstention,MCC global with abstention,Unknown/abstention proportion global with abstention,Abstention label global with abstention,Global evaluation column name global with abstention,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes,ROC-AUC (weighted OvO) per fold with abstention,ROC-AUC (macro OvO) per fold with abstention,au-PRC (weighted OvO) per fold with abstention,au-PRC (macro OvO) per fold with abstention
rf_multiclass,0.871 +/- 0.044 (in 3 folds),0.871 +/- 0.044 (in 3 folds),0.754 +/- 0.084 (in 3 folds),0.754 +/- 0.084 (in 3 folds),0.850 +/- 0.010 (in 3 folds),0.592 +/- 0.047 (in 3 folds),0.85,0.587,disease.separate_past_exposures,0.837 +/- 0.022 (in 3 folds),0.566 +/- 0.072 (in 3 folds),0.023 +/- 0.017 (in 2 folds),0.837,0.562,0.016,Unknown,disease.separate_past_exposures,254.0,4.0,258.0,0.015504,False,0.889 +/- 0.000 (in 1 folds),0.889 +/- 0.000 (in 1 folds),0.778 +/- 0.000 (in 1 folds),0.778 +/- 0.000 (in 1 folds)
rf_multiclass.decision_thresholds_tuned,0.871 +/- 0.044 (in 3 folds),0.871 +/- 0.044 (in 3 folds),0.754 +/- 0.084 (in 3 folds),0.754 +/- 0.084 (in 3 folds),0.838 +/- 0.029 (in 3 folds),0.550 +/- 0.135 (in 3 folds),0.839,0.548,disease.separate_past_exposures,0.825 +/- 0.042 (in 3 folds),0.526 +/- 0.157 (in 3 folds),0.023 +/- 0.017 (in 2 folds),0.826,0.524,0.016,Unknown,disease.separate_past_exposures,254.0,4.0,258.0,0.015504,False,0.889 +/- 0.000 (in 1 folds),0.889 +/- 0.000 (in 1 folds),0.778 +/- 0.000 (in 1 folds),0.778 +/- 0.000 (in 1 folds)
xgboost,0.868 +/- 0.039 (in 3 folds),0.868 +/- 0.039 (in 3 folds),0.746 +/- 0.070 (in 3 folds),0.746 +/- 0.070 (in 3 folds),0.824 +/- 0.019 (in 3 folds),0.501 +/- 0.031 (in 3 folds),0.824,0.492,disease.separate_past_exposures,0.814 +/- 0.022 (in 3 folds),0.485 +/- 0.045 (in 3 folds),0.035 +/- 0.000 (in 1 folds),0.814,0.475,0.012,Unknown,disease.separate_past_exposures,255.0,3.0,258.0,0.011628,False,0.889 +/- 0.023 (in 2 folds),0.889 +/- 0.023 (in 2 folds),0.786 +/- 0.013 (in 2 folds),0.786 +/- 0.013 (in 2 folds)
xgboost.decision_thresholds_tuned,0.868 +/- 0.039 (in 3 folds),0.868 +/- 0.039 (in 3 folds),0.746 +/- 0.070 (in 3 folds),0.746 +/- 0.070 (in 3 folds),0.842 +/- 0.035 (in 3 folds),0.539 +/- 0.121 (in 3 folds),0.843,0.546,disease.separate_past_exposures,0.833 +/- 0.050 (in 3 folds),0.524 +/- 0.146 (in 3 folds),0.035 +/- 0.000 (in 1 folds),0.833,0.526,0.012,Unknown,disease.separate_past_exposures,255.0,3.0,258.0,0.011628,False,0.889 +/- 0.023 (in 2 folds),0.889 +/- 0.023 (in 2 folds),0.786 +/- 0.013 (in 2 folds),0.786 +/- 0.013 (in 2 folds)
elasticnet_cv,0.838 +/- 0.023 (in 3 folds),0.838 +/- 0.023 (in 3 folds),0.726 +/- 0.079 (in 3 folds),0.726 +/- 0.079 (in 3 folds),0.766 +/- 0.019 (in 3 folds),0.181 +/- 0.156 (in 3 folds),0.766,0.218,disease.separate_past_exposures,0.760 +/- 0.022 (in 3 folds),0.148 +/- 0.159 (in 3 folds),0.012 +/- 0.000 (in 2 folds),0.76,0.164,0.008,Unknown,disease.separate_past_exposures,256.0,2.0,258.0,0.007752,False,0.827 +/- 0.000 (in 1 folds),0.827 +/- 0.000 (in 1 folds),0.652 +/- 0.000 (in 1 folds),0.652 +/- 0.000 (in 1 folds)
elasticnet_cv.decision_thresholds_tuned,0.838 +/- 0.023 (in 3 folds),0.838 +/- 0.023 (in 3 folds),0.726 +/- 0.079 (in 3 folds),0.726 +/- 0.079 (in 3 folds),0.805 +/- 0.070 (in 3 folds),0.497 +/- 0.144 (in 3 folds),0.805,0.479,disease.separate_past_exposures,0.798 +/- 0.065 (in 3 folds),0.482 +/- 0.130 (in 3 folds),0.012 +/- 0.000 (in 2 folds),0.798,0.468,0.008,Unknown,disease.separate_past_exposures,256.0,2.0,258.0,0.007752,False,0.827 +/- 0.000 (in 1 folds),0.827 +/- 0.000 (in 1 folds),0.652 +/- 0.000 (in 1 folds),0.652 +/- 0.000 (in 1 folds)
lasso_cv,0.837 +/- 0.032 (in 3 folds),0.837 +/- 0.032 (in 3 folds),0.736 +/- 0.078 (in 3 folds),0.736 +/- 0.078 (in 3 folds),0.820 +/- 0.042 (in 3 folds),0.457 +/- 0.143 (in 3 folds),0.82,0.461,disease.separate_past_exposures,0.810 +/- 0.027 (in 3 folds),0.433 +/- 0.106 (in 3 folds),0.035 +/- 0.000 (in 1 folds),0.81,0.429,0.012,Unknown,disease.separate_past_exposures,255.0,3.0,258.0,0.011628,False,0.848 +/- 0.038 (in 2 folds),0.848 +/- 0.038 (in 2 folds),0.733 +/- 0.111 (in 2 folds),0.733 +/- 0.111 (in 2 folds)
lasso_cv.decision_thresholds_tuned,0.837 +/- 0.032 (in 3 folds),0.837 +/- 0.032 (in 3 folds),0.736 +/- 0.078 (in 3 folds),0.736 +/- 0.078 (in 3 folds),0.824 +/- 0.079 (in 3 folds),0.538 +/- 0.158 (in 3 folds),0.824,0.509,disease.separate_past_exposures,0.814 +/- 0.073 (in 3 folds),0.513 +/- 0.147 (in 3 folds),0.035 +/- 0.000 (in 1 folds),0.814,0.493,0.012,Unknown,disease.separate_past_exposures,255.0,3.0,258.0,0.011628,False,0.848 +/- 0.038 (in 2 folds),0.848 +/- 0.038 (in 2 folds),0.733 +/- 0.111 (in 2 folds),0.733 +/- 0.111 (in 2 folds)
lasso_multiclass,0.835 +/- 0.027 (in 3 folds),0.835 +/- 0.027 (in 3 folds),0.709 +/- 0.105 (in 3 folds),0.709 +/- 0.105 (in 3 folds),0.830 +/- 0.041 (in 3 folds),0.552 +/- 0.085 (in 3 folds),0.83,0.548,disease.separate_past_exposures,0.814 +/- 0.051 (in 3 folds),0.525 +/- 0.095 (in 3 folds),0.019 +/- 0.013 (in 3 folds),0.814,0.518,0.019,Unknown,disease.separate_past_exposures,253.0,5.0,258.0,0.01938,False,,,,
lasso_multiclass.decision_thresholds_tuned,0.835 +/- 0.027 (in 3 folds),0.835 +/- 0.027 (in 3 folds),0.709 +/- 0.105 (in 3 folds),0.709 +/- 0.105 (in 3 folds),0.830 +/- 0.030 (in 3 folds),0.524 +/- 0.079 (in 3 folds),0.83,0.524,disease.separate_past_exposures,0.814 +/- 0.040 (in 3 folds),0.493 +/- 0.093 (in 3 folds),0.019 +/- 0.013 (in 3 folds),0.814,0.489,0.019,Unknown,disease.separate_past_exposures,253.0,5.0,258.0,0.01938,False,,,,

Unnamed: 0,ROC-AUC (weighted OvO) per fold,ROC-AUC (macro OvO) per fold,au-PRC (weighted OvO) per fold,au-PRC (macro OvO) per fold,Accuracy per fold,MCC per fold,Accuracy global,MCC global,Global evaluation column name global,Accuracy per fold with abstention,MCC per fold with abstention,Unknown/abstention proportion per fold with abstention,Accuracy global with abstention,MCC global with abstention,Unknown/abstention proportion global with abstention,Abstention label global with abstention,Global evaluation column name global with abstention,sample_size,n_abstentions,sample_size including abstentions,abstention_rate,missing_classes,ROC-AUC (weighted OvO) per fold with abstention,ROC-AUC (macro OvO) per fold with abstention,au-PRC (weighted OvO) per fold with abstention,au-PRC (macro OvO) per fold with abstention
rf_multiclass,0.871 +/- 0.044 (in 3 folds),0.871 +/- 0.044 (in 3 folds),0.754 +/- 0.084 (in 3 folds),0.754 +/- 0.084 (in 3 folds),0.850 +/- 0.010 (in 3 folds),0.592 +/- 0.047 (in 3 folds),0.85,0.587,disease.separate_past_exposures,0.837 +/- 0.022 (in 3 folds),0.566 +/- 0.072 (in 3 folds),0.023 +/- 0.017 (in 2 folds),0.837,0.562,0.016,Unknown,disease.separate_past_exposures,254,4,258,0.015504,False,0.889 +/- 0.000 (in 1 folds),0.889 +/- 0.000 (in 1 folds),0.778 +/- 0.000 (in 1 folds),0.778 +/- 0.000 (in 1 folds)
rf_multiclass.decision_thresholds_tuned,0.871 +/- 0.044 (in 3 folds),0.871 +/- 0.044 (in 3 folds),0.754 +/- 0.084 (in 3 folds),0.754 +/- 0.084 (in 3 folds),0.838 +/- 0.029 (in 3 folds),0.550 +/- 0.135 (in 3 folds),0.839,0.548,disease.separate_past_exposures,0.825 +/- 0.042 (in 3 folds),0.526 +/- 0.157 (in 3 folds),0.023 +/- 0.017 (in 2 folds),0.826,0.524,0.016,Unknown,disease.separate_past_exposures,254,4,258,0.015504,False,0.889 +/- 0.000 (in 1 folds),0.889 +/- 0.000 (in 1 folds),0.778 +/- 0.000 (in 1 folds),0.778 +/- 0.000 (in 1 folds)
xgboost,0.868 +/- 0.039 (in 3 folds),0.868 +/- 0.039 (in 3 folds),0.746 +/- 0.070 (in 3 folds),0.746 +/- 0.070 (in 3 folds),0.824 +/- 0.019 (in 3 folds),0.501 +/- 0.031 (in 3 folds),0.824,0.492,disease.separate_past_exposures,0.814 +/- 0.022 (in 3 folds),0.485 +/- 0.045 (in 3 folds),0.035 +/- 0.000 (in 1 folds),0.814,0.475,0.012,Unknown,disease.separate_past_exposures,255,3,258,0.011628,False,0.889 +/- 0.023 (in 2 folds),0.889 +/- 0.023 (in 2 folds),0.786 +/- 0.013 (in 2 folds),0.786 +/- 0.013 (in 2 folds)
xgboost.decision_thresholds_tuned,0.868 +/- 0.039 (in 3 folds),0.868 +/- 0.039 (in 3 folds),0.746 +/- 0.070 (in 3 folds),0.746 +/- 0.070 (in 3 folds),0.842 +/- 0.035 (in 3 folds),0.539 +/- 0.121 (in 3 folds),0.843,0.546,disease.separate_past_exposures,0.833 +/- 0.050 (in 3 folds),0.524 +/- 0.146 (in 3 folds),0.035 +/- 0.000 (in 1 folds),0.833,0.526,0.012,Unknown,disease.separate_past_exposures,255,3,258,0.011628,False,0.889 +/- 0.023 (in 2 folds),0.889 +/- 0.023 (in 2 folds),0.786 +/- 0.013 (in 2 folds),0.786 +/- 0.013 (in 2 folds)
elasticnet_cv,0.838 +/- 0.023 (in 3 folds),0.838 +/- 0.023 (in 3 folds),0.726 +/- 0.079 (in 3 folds),0.726 +/- 0.079 (in 3 folds),0.766 +/- 0.019 (in 3 folds),0.181 +/- 0.156 (in 3 folds),0.766,0.218,disease.separate_past_exposures,0.760 +/- 0.022 (in 3 folds),0.148 +/- 0.159 (in 3 folds),0.012 +/- 0.000 (in 2 folds),0.76,0.164,0.008,Unknown,disease.separate_past_exposures,256,2,258,0.007752,False,0.827 +/- 0.000 (in 1 folds),0.827 +/- 0.000 (in 1 folds),0.652 +/- 0.000 (in 1 folds),0.652 +/- 0.000 (in 1 folds)
elasticnet_cv.decision_thresholds_tuned,0.838 +/- 0.023 (in 3 folds),0.838 +/- 0.023 (in 3 folds),0.726 +/- 0.079 (in 3 folds),0.726 +/- 0.079 (in 3 folds),0.805 +/- 0.070 (in 3 folds),0.497 +/- 0.144 (in 3 folds),0.805,0.479,disease.separate_past_exposures,0.798 +/- 0.065 (in 3 folds),0.482 +/- 0.130 (in 3 folds),0.012 +/- 0.000 (in 2 folds),0.798,0.468,0.008,Unknown,disease.separate_past_exposures,256,2,258,0.007752,False,0.827 +/- 0.000 (in 1 folds),0.827 +/- 0.000 (in 1 folds),0.652 +/- 0.000 (in 1 folds),0.652 +/- 0.000 (in 1 folds)
lasso_cv,0.837 +/- 0.032 (in 3 folds),0.837 +/- 0.032 (in 3 folds),0.736 +/- 0.078 (in 3 folds),0.736 +/- 0.078 (in 3 folds),0.820 +/- 0.042 (in 3 folds),0.457 +/- 0.143 (in 3 folds),0.82,0.461,disease.separate_past_exposures,0.810 +/- 0.027 (in 3 folds),0.433 +/- 0.106 (in 3 folds),0.035 +/- 0.000 (in 1 folds),0.81,0.429,0.012,Unknown,disease.separate_past_exposures,255,3,258,0.011628,False,0.848 +/- 0.038 (in 2 folds),0.848 +/- 0.038 (in 2 folds),0.733 +/- 0.111 (in 2 folds),0.733 +/- 0.111 (in 2 folds)
lasso_cv.decision_thresholds_tuned,0.837 +/- 0.032 (in 3 folds),0.837 +/- 0.032 (in 3 folds),0.736 +/- 0.078 (in 3 folds),0.736 +/- 0.078 (in 3 folds),0.824 +/- 0.079 (in 3 folds),0.538 +/- 0.158 (in 3 folds),0.824,0.509,disease.separate_past_exposures,0.814 +/- 0.073 (in 3 folds),0.513 +/- 0.147 (in 3 folds),0.035 +/- 0.000 (in 1 folds),0.814,0.493,0.012,Unknown,disease.separate_past_exposures,255,3,258,0.011628,False,0.848 +/- 0.038 (in 2 folds),0.848 +/- 0.038 (in 2 folds),0.733 +/- 0.111 (in 2 folds),0.733 +/- 0.111 (in 2 folds)
lasso_multiclass,0.835 +/- 0.027 (in 3 folds),0.835 +/- 0.027 (in 3 folds),0.709 +/- 0.105 (in 3 folds),0.709 +/- 0.105 (in 3 folds),0.830 +/- 0.041 (in 3 folds),0.552 +/- 0.085 (in 3 folds),0.83,0.548,disease.separate_past_exposures,0.814 +/- 0.051 (in 3 folds),0.525 +/- 0.095 (in 3 folds),0.019 +/- 0.013 (in 3 folds),0.814,0.518,0.019,Unknown,disease.separate_past_exposures,253,5,258,0.01938,False,,,,
lasso_multiclass.decision_thresholds_tuned,0.835 +/- 0.027 (in 3 folds),0.835 +/- 0.027 (in 3 folds),0.709 +/- 0.105 (in 3 folds),0.709 +/- 0.105 (in 3 folds),0.830 +/- 0.030 (in 3 folds),0.524 +/- 0.079 (in 3 folds),0.83,0.524,disease.separate_past_exposures,0.814 +/- 0.040 (in 3 folds),0.493 +/- 0.093 (in 3 folds),0.019 +/- 0.013 (in 3 folds),0.814,0.489,0.019,Unknown,disease.separate_past_exposures,253,5,258,0.01938,False,,,,


rf_multiclass,rf_multiclass.decision_thresholds_tuned,xgboost,xgboost.decision_thresholds_tuned
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.871 +/- 0.044 (in 3 folds) ROC-AUC (macro OvO): 0.871 +/- 0.044 (in 3 folds) au-PRC (weighted OvO): 0.754 +/- 0.084 (in 3 folds) au-PRC (macro OvO): 0.754 +/- 0.084 (in 3 folds) Accuracy: 0.850 +/- 0.010 (in 3 folds) MCC: 0.592 +/- 0.047 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.850 MCC: 0.587 Global evaluation column name: disease.separate_past_exposures Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.837 +/- 0.022 (in 3 folds) MCC: 0.566 +/- 0.072 (in 3 folds) Unknown/abstention proportion: 0.023 +/- 0.017 (in 2 folds) ROC-AUC (weighted OvO): 0.889 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.889 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.778 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.778 +/- 0.000 (in 1 folds) Global scores with abstention using column name disease.separate_past_exposures: Accuracy: 0.837 MCC: 0.562 Unknown/abstention proportion: 0.016 Abstention label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support Healthy/Background 0.89 0.90 0.90 194  Lupus 0.72 0.64 0.68 64  Unknown 0.00 0.00 0.00 0  accuracy 0.84 258  macro avg 0.54 0.51 0.52 258  weighted avg 0.85 0.84 0.84 258,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.871 +/- 0.044 (in 3 folds) ROC-AUC (macro OvO): 0.871 +/- 0.044 (in 3 folds) au-PRC (weighted OvO): 0.754 +/- 0.084 (in 3 folds) au-PRC (macro OvO): 0.754 +/- 0.084 (in 3 folds) Accuracy: 0.838 +/- 0.029 (in 3 folds) MCC: 0.550 +/- 0.135 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.839 MCC: 0.548 Global evaluation column name: disease.separate_past_exposures Per-fold scores with abstention (note that abstentions 
not included in probability-based scores): Accuracy: 0.825 +/- 0.042 (in 3 folds) MCC: 0.526 +/- 0.157 (in 3 folds) Unknown/abstention proportion: 0.023 +/- 0.017 (in 2 folds) ROC-AUC (weighted OvO): 0.889 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.889 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.778 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.778 +/- 0.000 (in 1 folds) Global scores with abstention using column name disease.separate_past_exposures: Accuracy: 0.826 MCC: 0.524 Unknown/abstention proportion: 0.016 Abstention label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support Healthy/Background 0.88 0.90 0.89 194  Lupus 0.70 0.59 0.64 64  Unknown 0.00 0.00 0.00 0  accuracy 0.83 258  macro avg 0.53 0.50 0.51 258  weighted avg 0.83 0.83 0.83 258,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.868 +/- 0.039 (in 3 folds) ROC-AUC (macro OvO): 0.868 +/- 0.039 (in 3 folds) au-PRC (weighted OvO): 0.746 +/- 0.070 (in 3 folds) au-PRC (macro OvO): 0.746 +/- 0.070 (in 3 folds) Accuracy: 0.824 +/- 0.019 (in 3 folds) MCC: 0.501 +/- 0.031 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.824 MCC: 0.492 Global evaluation column name: disease.separate_past_exposures Per-fold scores with abstention (note that abstentions not included in probability-based scores): ROC-AUC (weighted OvO): 0.889 +/- 0.023 (in 2 folds) ROC-AUC (macro OvO): 0.889 +/- 0.023 (in 2 folds) au-PRC (weighted OvO): 0.786 +/- 0.013 (in 2 folds) au-PRC (macro OvO): 0.786 +/- 0.013 (in 2 folds) Accuracy: 0.814 +/- 0.022 (in 3 folds) MCC: 0.485 +/- 0.045 (in 3 folds) Unknown/abstention proportion: 0.035 +/- 0.000 (in 1 folds) Global scores with abstention using column name disease.separate_past_exposures: Accuracy: 0.814 MCC: 0.475 Unknown/abstention proportion: 0.012 Abstention 
label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support Healthy/Background 0.86 0.91 0.88 194  Lupus 0.69 0.52 0.59 64  Unknown 0.00 0.00 0.00 0  accuracy 0.81 258  macro avg 0.51 0.48 0.49 258  weighted avg 0.81 0.81 0.81 258,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.868 +/- 0.039 (in 3 folds) ROC-AUC (macro OvO): 0.868 +/- 0.039 (in 3 folds) au-PRC (weighted OvO): 0.746 +/- 0.070 (in 3 folds) au-PRC (macro OvO): 0.746 +/- 0.070 (in 3 folds) Accuracy: 0.842 +/- 0.035 (in 3 folds) MCC: 0.539 +/- 0.121 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.843 MCC: 0.546 Global evaluation column name: disease.separate_past_exposures Per-fold scores with abstention (note that abstentions not included in probability-based scores): ROC-AUC (weighted OvO): 0.889 +/- 0.023 (in 2 folds) ROC-AUC (macro OvO): 0.889 +/- 0.023 (in 2 folds) au-PRC (weighted OvO): 0.786 +/- 0.013 (in 2 folds) au-PRC (macro OvO): 0.786 +/- 0.013 (in 2 folds) Accuracy: 0.833 +/- 0.050 (in 3 folds) MCC: 0.524 +/- 0.146 (in 3 folds) Unknown/abstention proportion: 0.035 +/- 0.000 (in 1 folds) Global scores with abstention using column name disease.separate_past_exposures: Accuracy: 0.833 MCC: 0.526 Unknown/abstention proportion: 0.012 Abstention label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support Healthy/Background 0.86 0.93 0.90 194  Lupus 0.76 0.53 0.62 64  Unknown 0.00 0.00 0.00 0  accuracy 0.83 258  macro avg 0.54 0.49 0.51 258  weighted avg 0.84 0.83 0.83 258
,,,


elasticnet_cv,elasticnet_cv.decision_thresholds_tuned,lasso_cv,lasso_cv.decision_thresholds_tuned
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.838 +/- 0.023 (in 3 folds) ROC-AUC (macro OvO): 0.838 +/- 0.023 (in 3 folds) au-PRC (weighted OvO): 0.726 +/- 0.079 (in 3 folds) au-PRC (macro OvO): 0.726 +/- 0.079 (in 3 folds) Accuracy: 0.766 +/- 0.019 (in 3 folds) MCC: 0.181 +/- 0.156 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.766 MCC: 0.218 Global evaluation column name: disease.separate_past_exposures Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.760 +/- 0.022 (in 3 folds) MCC: 0.148 +/- 0.159 (in 3 folds) Unknown/abstention proportion: 0.012 +/- 0.000 (in 2 folds) ROC-AUC (weighted OvO): 0.827 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.827 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.652 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.652 +/- 0.000 (in 1 folds) Global scores with abstention using column name disease.separate_past_exposures: Accuracy: 0.760 MCC: 0.164 Unknown/abstention proportion: 0.008 Abstention label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support Healthy/Background 0.76 0.99 0.86 194  Lupus 1.00 0.06 0.12 64  Unknown 0.00 0.00 0.00 0  accuracy 0.76 258  macro avg 0.59 0.35 0.33 258  weighted avg 0.82 0.76 0.68 258,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.838 +/- 0.023 (in 3 folds) ROC-AUC (macro OvO): 0.838 +/- 0.023 (in 3 folds) au-PRC (weighted OvO): 0.726 +/- 0.079 (in 3 folds) au-PRC (macro OvO): 0.726 +/- 0.079 (in 3 folds) Accuracy: 0.805 +/- 0.070 (in 3 folds) MCC: 0.497 +/- 0.144 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.805 MCC: 0.479 Global evaluation column name: disease.separate_past_exposures Per-fold scores with abstention (note that abstentions 
not included in probability-based scores): Accuracy: 0.798 +/- 0.065 (in 3 folds) MCC: 0.482 +/- 0.130 (in 3 folds) Unknown/abstention proportion: 0.012 +/- 0.000 (in 2 folds) ROC-AUC (weighted OvO): 0.827 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.827 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.652 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.652 +/- 0.000 (in 1 folds) Global scores with abstention using column name disease.separate_past_exposures: Accuracy: 0.798 MCC: 0.468 Unknown/abstention proportion: 0.008 Abstention label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support Healthy/Background 0.87 0.86 0.87 194  Lupus 0.61 0.61 0.61 64  Unknown 0.00 0.00 0.00 0  accuracy 0.80 258  macro avg 0.49 0.49 0.49 258  weighted avg 0.81 0.80 0.80 258,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.837 +/- 0.032 (in 3 folds) ROC-AUC (macro OvO): 0.837 +/- 0.032 (in 3 folds) au-PRC (weighted OvO): 0.736 +/- 0.078 (in 3 folds) au-PRC (macro OvO): 0.736 +/- 0.078 (in 3 folds) Accuracy: 0.820 +/- 0.042 (in 3 folds) MCC: 0.457 +/- 0.143 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.820 MCC: 0.461 Global evaluation column name: disease.separate_past_exposures Per-fold scores with abstention (note that abstentions not included in probability-based scores): ROC-AUC (weighted OvO): 0.848 +/- 0.038 (in 2 folds) ROC-AUC (macro OvO): 0.848 +/- 0.038 (in 2 folds) au-PRC (weighted OvO): 0.733 +/- 0.111 (in 2 folds) au-PRC (macro OvO): 0.733 +/- 0.111 (in 2 folds) Accuracy: 0.810 +/- 0.027 (in 3 folds) MCC: 0.433 +/- 0.106 (in 3 folds) Unknown/abstention proportion: 0.035 +/- 0.000 (in 1 folds) Global scores with abstention using column name disease.separate_past_exposures: Accuracy: 0.810 MCC: 0.429 Unknown/abstention proportion: 0.012 Abstention 
label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support Healthy/Background 0.81 0.98 0.89 194  Lupus 0.95 0.28 0.43 64  Unknown 0.00 0.00 0.00 0  accuracy 0.81 258  macro avg 0.59 0.42 0.44 258  weighted avg 0.84 0.81 0.78 258,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.837 +/- 0.032 (in 3 folds) ROC-AUC (macro OvO): 0.837 +/- 0.032 (in 3 folds) au-PRC (weighted OvO): 0.736 +/- 0.078 (in 3 folds) au-PRC (macro OvO): 0.736 +/- 0.078 (in 3 folds) Accuracy: 0.824 +/- 0.079 (in 3 folds) MCC: 0.538 +/- 0.158 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.824 MCC: 0.509 Global evaluation column name: disease.separate_past_exposures Per-fold scores with abstention (note that abstentions not included in probability-based scores): ROC-AUC (weighted OvO): 0.848 +/- 0.038 (in 2 folds) ROC-AUC (macro OvO): 0.848 +/- 0.038 (in 2 folds) au-PRC (weighted OvO): 0.733 +/- 0.111 (in 2 folds) au-PRC (macro OvO): 0.733 +/- 0.111 (in 2 folds) Accuracy: 0.814 +/- 0.073 (in 3 folds) MCC: 0.513 +/- 0.147 (in 3 folds) Unknown/abstention proportion: 0.035 +/- 0.000 (in 1 folds) Global scores with abstention using column name disease.separate_past_exposures: Accuracy: 0.814 MCC: 0.493 Unknown/abstention proportion: 0.012 Abstention label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support Healthy/Background 0.87 0.89 0.88 194  Lupus 0.66 0.58 0.62 64  Unknown 0.00 0.00 0.00 0  accuracy 0.81 258  macro avg 0.51 0.49 0.50 258  weighted avg 0.82 0.81 0.81 258
,,,


lasso_multiclass,lasso_multiclass.decision_thresholds_tuned,linearsvm_ovr,linearsvm_ovr.decision_thresholds_tuned
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.835 +/- 0.027 (in 3 folds) ROC-AUC (macro OvO): 0.835 +/- 0.027 (in 3 folds) au-PRC (weighted OvO): 0.709 +/- 0.105 (in 3 folds) au-PRC (macro OvO): 0.709 +/- 0.105 (in 3 folds) Accuracy: 0.830 +/- 0.041 (in 3 folds) MCC: 0.552 +/- 0.085 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.830 MCC: 0.548 Global evaluation column name: disease.separate_past_exposures Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.814 +/- 0.051 (in 3 folds) MCC: 0.525 +/- 0.095 (in 3 folds) Unknown/abstention proportion: 0.019 +/- 0.013 (in 3 folds) Global scores with abstention using column name disease.separate_past_exposures: Accuracy: 0.814 MCC: 0.518 Unknown/abstention proportion: 0.019 Abstention label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support Healthy/Background 0.88 0.87 0.87 194  Lupus 0.67 0.66 0.66 64  Unknown 0.00 0.00 0.00 0  accuracy 0.81 258  macro avg 0.52 0.51 0.51 258  weighted avg 0.83 0.81 0.82 258,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.835 +/- 0.027 (in 3 folds) ROC-AUC (macro OvO): 0.835 +/- 0.027 (in 3 folds) au-PRC (weighted OvO): 0.709 +/- 0.105 (in 3 folds) au-PRC (macro OvO): 0.709 +/- 0.105 (in 3 folds) Accuracy: 0.830 +/- 0.030 (in 3 folds) MCC: 0.524 +/- 0.079 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.830 MCC: 0.524 Global evaluation column name: disease.separate_past_exposures Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.814 +/- 0.040 (in 3 folds) MCC: 0.493 +/- 0.093 (in 3 folds) Unknown/abstention proportion: 0.019 +/- 0.013 (in 3 folds) Global scores with 
abstention using column name disease.separate_past_exposures: Accuracy: 0.814 MCC: 0.489 Unknown/abstention proportion: 0.019 Abstention label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support Healthy/Background 0.86 0.90 0.88 194  Lupus 0.71 0.56 0.63 64  Unknown 0.00 0.00 0.00 0  accuracy 0.81 258  macro avg 0.52 0.49 0.50 258  weighted avg 0.82 0.81 0.82 258,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.835 +/- 0.027 (in 3 folds) ROC-AUC (macro OvO): 0.835 +/- 0.027 (in 3 folds) au-PRC (weighted OvO): 0.709 +/- 0.104 (in 3 folds) au-PRC (macro OvO): 0.709 +/- 0.104 (in 3 folds) Accuracy: 0.834 +/- 0.034 (in 3 folds) MCC: 0.559 +/- 0.074 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.834 MCC: 0.556 Global evaluation column name: disease.separate_past_exposures Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.818 +/- 0.044 (in 3 folds) MCC: 0.531 +/- 0.085 (in 3 folds) Unknown/abstention proportion: 0.019 +/- 0.013 (in 3 folds) Global scores with abstention using column name disease.separate_past_exposures: Accuracy: 0.818 MCC: 0.526 Unknown/abstention proportion: 0.019 Abstention label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support Healthy/Background 0.88 0.87 0.88 194  Lupus 0.68 0.66 0.67 64  Unknown 0.00 0.00 0.00 0  accuracy 0.82 258  macro avg 0.52 0.51 0.51 258  weighted avg 0.83 0.82 0.83 258,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.835 +/- 0.027 (in 3 folds) ROC-AUC (macro OvO): 0.835 +/- 0.027 (in 3 folds) au-PRC (weighted OvO): 0.709 +/- 0.104 (in 3 folds) au-PRC (macro OvO): 0.709 +/- 0.104 
(in 3 folds) Accuracy: 0.830 +/- 0.030 (in 3 folds) MCC: 0.524 +/- 0.079 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.830 MCC: 0.524 Global evaluation column name: disease.separate_past_exposures Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.814 +/- 0.040 (in 3 folds) MCC: 0.493 +/- 0.093 (in 3 folds) Unknown/abstention proportion: 0.019 +/- 0.013 (in 3 folds) Global scores with abstention using column name disease.separate_past_exposures: Accuracy: 0.814 MCC: 0.489 Unknown/abstention proportion: 0.019 Abstention label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support Healthy/Background 0.86 0.90 0.88 194  Lupus 0.71 0.56 0.63 64  Unknown 0.00 0.00 0.00 0  accuracy 0.81 258  macro avg 0.52 0.49 0.50 258  weighted avg 0.82 0.81 0.82 258
,,,


ridge_cv,ridge_cv.decision_thresholds_tuned
Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.835 +/- 0.018 (in 3 folds) ROC-AUC (macro OvO): 0.835 +/- 0.018 (in 3 folds) au-PRC (weighted OvO): 0.720 +/- 0.071 (in 3 folds) au-PRC (macro OvO): 0.720 +/- 0.071 (in 3 folds) Accuracy: 0.750 +/- 0.006 (in 3 folds) MCC: 0.000 +/- 0.000 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.750 MCC: 0.000 Global evaluation column name: disease.separate_past_exposures Per-fold scores with abstention (note that abstentions not included in probability-based scores): Accuracy: 0.744 +/- 0.010 (in 3 folds) MCC: -0.021 +/- 0.018 (in 3 folds) Unknown/abstention proportion: 0.012 +/- 0.000 (in 2 folds) ROC-AUC (weighted OvO): 0.827 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.827 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.650 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.650 +/- 0.000 (in 1 folds) Global scores with abstention using column name disease.separate_past_exposures: Accuracy: 0.744 MCC: -0.025 Unknown/abstention proportion: 0.008 Abstention label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support Healthy/Background 0.75 0.99 0.85 194  Lupus 0.00 0.00 0.00 64  Unknown 0.00 0.00 0.00 0  accuracy 0.74 258  macro avg 0.25 0.33 0.28 258  weighted avg 0.56 0.74 0.64 258,Per-fold scores without abstention: ROC-AUC (weighted OvO): 0.835 +/- 0.018 (in 3 folds) ROC-AUC (macro OvO): 0.835 +/- 0.018 (in 3 folds) au-PRC (weighted OvO): 0.720 +/- 0.071 (in 3 folds) au-PRC (macro OvO): 0.720 +/- 0.071 (in 3 folds) Accuracy: 0.750 +/- 0.006 (in 3 folds) MCC: 0.000 +/- 0.000 (in 3 folds) Global scores without abstention using column name disease.separate_past_exposures: Accuracy: 0.750 MCC: 0.000 Global evaluation column name: disease.separate_past_exposures Per-fold scores with abstention (note that 
abstentions not included in probability-based scores): Accuracy: 0.744 +/- 0.010 (in 3 folds) MCC: -0.021 +/- 0.018 (in 3 folds) Unknown/abstention proportion: 0.012 +/- 0.000 (in 2 folds) ROC-AUC (weighted OvO): 0.827 +/- 0.000 (in 1 folds) ROC-AUC (macro OvO): 0.827 +/- 0.000 (in 1 folds) au-PRC (weighted OvO): 0.650 +/- 0.000 (in 1 folds) au-PRC (macro OvO): 0.650 +/- 0.000 (in 1 folds) Global scores with abstention using column name disease.separate_past_exposures: Accuracy: 0.744 MCC: -0.025 Unknown/abstention proportion: 0.008 Abstention label: Unknown Global evaluation column name: disease.separate_past_exposures Global classification report with abstention using column name disease.separate_past_exposures:  precision recall f1-score support Healthy/Background 0.75 0.99 0.85 194  Lupus 0.00 0.00 0.00 64  Unknown 0.00 0.00 0.00 0  accuracy 0.74 258  macro avg 0.25 0.33 0.28 258  weighted avg 0.56 0.74 0.64 258
,


---