In [1]:
import sys

sys.path.insert(0, "../")

import pandas as pd
from mdu.eval.table_analysis_utils import (
    transform_by_tasks,
    select_composite_and_components,
    check_composite_dominance,
    compute_average_ranks,
    analyze_composite_pareto_performance,
)
from notebooks.table_utils import with_avg_row, mean_pm_std, fmt_valvar
from mdu.unc.constants import OTTarget, ScalingType

# Remove pandas' display limits (column count, total width, per-cell text
# width) so the wide benchmark tables below are rendered without truncation.
for option_name in (
    "display.max_columns",
    "display.width",
    "display.max_colwidth",
):
    pd.set_option(option_name, None)

# Load IPython's autoreload extension and switch it to mode 2, so edits to the
# imported project modules are picked up without restarting the kernel.
%load_ext autoreload
%autoreload 2

In [2]:
# Benchmark configuration: these four values are interpolated into the results
# file name and therefore select which benchmark run is loaded.
grid_size = 5
n_targets_multiplier = 1
scaling_type = ScalingType.FEATURE_WISE.value
target_distr = OTTarget.BETA.value

# The remaining fields of the file name (eps, iters, tol, rs) are fixed
# literals in the path below.
benchmark_csv_path = f"../resources/refactored/benchmark_entropic_target_{target_distr}_eps_0.5_scaling_type_{scaling_type}_iters_1000_tol_1e-06_rs_42_grid_size_{grid_size}_n_targets_multiplier_{n_targets_multiplier}.csv"
df = pd.read_csv(benchmark_csv_path)

In [3]:
# Preview the first 10 rows of the raw benchmark results to check the schema
# (one row per dataset pair / measure / ensemble group / problem type).
df.head(10)

Unnamed: 0,ind_dataset,ood_dataset,measure,uncertainty_type,gname,risk_type,gt_approximation,pred_approximation,ensemble_group,problem_type,roc_auc,average_precision,accuracy,aurc,acc_cov_auc,coverage_at_1pct_error,coverage_at_2pct_error,coverage_at_5pct_error,n_ind_samples,n_ood_samples,n_correct,n_incorrect,ensemble_accuracy
0,cifar10,cifar100,Risk_LogScore_TotalRisk_outer_outer,Risk,LogScore,TotalRisk,outer,outer,0,ood_detection,0.912015,,,,,,,,7200,10000.0,,,0.96375
1,cifar10,cifar10,Risk_LogScore_TotalRisk_outer_outer,Risk,LogScore,TotalRisk,outer,outer,0,misclassification_detection,0.944999,0.381728,0.96375,,,,,,7200,,6939.0,261.0,0.96375
2,cifar10,cifar10,Risk_LogScore_TotalRisk_outer_outer,Risk,LogScore,TotalRisk,outer,outer,0,selective_prediction,,,0.96375,0.002928,0.996933,0.000139,0.000139,0.000139,7200,,,,0.96375
3,cifar10,cifar100,Risk_LogScore_TotalRisk_outer_outer,Risk,LogScore,TotalRisk,outer,outer,1,ood_detection,0.91069,,,,,,,,7200,10000.0,,,0.964306
4,cifar10,cifar10,Risk_LogScore_TotalRisk_outer_outer,Risk,LogScore,TotalRisk,outer,outer,1,misclassification_detection,0.94461,0.374033,0.964306,,,,,,7200,,6943.0,257.0,0.964306
5,cifar10,cifar10,Risk_LogScore_TotalRisk_outer_outer,Risk,LogScore,TotalRisk,outer,outer,1,selective_prediction,,,0.964306,0.00293,0.996931,0.000139,0.000139,0.000139,7200,,,,0.964306
6,cifar10,cifar100,Risk_LogScore_TotalRisk_outer_outer,Risk,LogScore,TotalRisk,outer,outer,2,ood_detection,0.911888,,,,,,,,7200,10000.0,,,0.963333
7,cifar10,cifar10,Risk_LogScore_TotalRisk_outer_outer,Risk,LogScore,TotalRisk,outer,outer,2,misclassification_detection,0.943641,0.360288,0.963333,,,,,,7200,,6936.0,264.0,0.963333
8,cifar10,cifar10,Risk_LogScore_TotalRisk_outer_outer,Risk,LogScore,TotalRisk,outer,outer,2,selective_prediction,,,0.963333,0.003023,0.996838,0.000139,0.000139,0.000139,7200,,,,0.963333
9,cifar10,cifar100,Risk_LogScore_TotalRisk_outer_outer,Risk,LogScore,TotalRisk,outer,outer,3,ood_detection,0.911436,,,,,,,,7200,10000.0,,,0.964167


In [4]:
# List the distinct in-distribution datasets, then the distinct OOD datasets,
# that appear in the loaded benchmark results.
for dataset_column in ("ind_dataset", "ood_dataset"):
    print(df[dataset_column].unique())

['cifar10' 'cifar100' 'tiny_imagenet']
['cifar100' 'cifar10' 'tiny_imagenet' 'svhn' 'imagenet_a' 'imagenet_o'
 'imagenet_r']


In [5]:
# Toggle for the transform below: when True, the result of transform_by_tasks
# is unpacked as a pair (transformed_df, std_df); when False, the result is
# used as transformed_df alone.
include_std = True

task_tables = transform_by_tasks(df, include_std=include_std)
if include_std:
    transformed_df, std_df = task_tables
else:
    # Bind std_df explicitly: otherwise later cells that reference it raise
    # NameError on a fresh kernel, or silently show a stale table left over
    # from an earlier run with include_std=True.
    transformed_df, std_df = task_tables, None

In [6]:
# Display the per-task table produced by transform_by_tasks: rows are
# (ind_dataset, eval) pairs and there is one column per uncertainty measure.
transformed_df

Unnamed: 0_level_0,measure,R_b 1 (Brier),R_b 1 (Logscore),R_b 1 (Spherical),R_b 1 (Zero-one),R_b 2 (Brier),R_b 2 (Logscore),R_b 2 (Spherical),R_b 2 (Zero-one),R_b 3 (Brier),R_b 3 (Logscore),R_b 3 (Spherical),R_b 3 (Zero-one),R_e 1 1 (Brier),R_e 1 1 (Logscore),R_e 1 1 (Spherical),R_e 1 1 (Zero-one),R_e 1 2 (Brier),R_e 1 2 (Logscore),R_e 1 2 (Spherical),R_e 1 2 (Zero-one),R_e 1 3 (Brier),R_e 1 3 (Logscore),R_e 1 3 (Spherical),R_e 1 3 (Zero-one),R_e 2 1 (Brier),R_e 2 1 (Logscore),R_e 2 1 (Spherical),R_e 2 1 (Zero-one),R_e 2 2 (Brier),R_e 2 2 (Logscore),R_e 2 2 (Spherical),R_e 2 2 (Zero-one),R_e 2 3 (Brier),R_e 2 3 (Logscore),R_e 2 3 (Spherical),R_e 2 3 (Zero-one),R_e 3 1 (Brier),R_e 3 1 (Logscore),R_e 3 1 (Spherical),R_e 3 1 (Zero-one),R_e 3 2 (Brier),R_e 3 2 (Logscore),R_e 3 2 (Spherical),R_e 3 2 (Zero-one),R_e 3 3 (Brier),R_e 3 3 (Logscore),R_e 3 3 (Spherical),R_e 3 3 (Zero-one),R_t 1 1 (Brier),R_t 1 1 (Logscore),R_t 1 1 (Spherical),R_t 1 1 (Zero-one),R_t 1 2 (Brier),R_t 1 2 (Logscore),R_t 1 2 (Spherical),R_t 1 2 (Zero-one),R_t 1 3 (Brier),R_t 1 3 (Logscore),R_t 1 3 (Spherical),R_t 1 3 (Zero-one),R_t 2 1 (Brier),R_t 2 1 (Logscore),R_t 2 1 (Spherical),R_t 2 1 (Zero-one),R_t 2 2 (Brier),R_t 2 2 (Logscore),R_t 2 2 (Spherical),R_t 2 2 (Zero-one),R_t 2 3 (Brier),R_t 2 3 (Logscore),R_t 2 3 (Spherical),R_t 2 3 (Zero-one),R_t 3 1 (Brier),R_t 3 1 (Logscore),R_t 3 1 (Spherical),R_t 3 1 (Zero-one),R_t 3 2 (Brier),R_t 3 2 (Logscore),R_t 3 2 (Spherical),R_t 3 2 (Zero-one),R_t 3 3 (Brier),R_t 3 3 (Logscore),R_t 3 3 (Spherical),R_t 3 3 (Zero-one),composite bayes all central,composite bayes all central + m,composite bayes all inner,composite bayes all inner + m,composite bayes all outer,composite bayes all outer + m,composite eat logscore central inner,composite eat logscore central inner + m,composite eat logscore central outer,composite eat logscore central outer + m,composite eat logscore inner central,composite eat logscore inner central + m,composite eat logscore inner 
outer,composite eat logscore inner outer + m,composite eat logscore outer central,composite eat logscore outer central + m,composite eat logscore outer inner,composite eat logscore outer inner + m,composite eat logscore outer outer,composite eat logscore outer outer + m,composite eat spherical central inner,composite eat spherical central inner + m,composite eat spherical central outer,composite eat spherical central outer + m,composite eat spherical inner central,composite eat spherical inner central + m,composite eat spherical inner outer,composite eat spherical inner outer + m,composite eat spherical outer central,composite eat spherical outer central + m,composite eat spherical outer inner,composite eat spherical outer inner + m,composite eat spherical outer outer,composite eat spherical outer outer + m,composite excess all central inner,composite excess all central inner + m,composite excess all central outer,composite excess all central outer + m,composite excess all inner central,composite excess all inner central + m,composite excess all inner outer,composite excess all inner outer + m,composite excess all outer central,composite excess all outer central + m,composite excess all outer inner,composite excess all outer inner + m,composite excess all outer outer,composite excess all outer outer + m,composite total central inner,composite total central inner + m,composite total central outer,composite total central outer + m,composite total inner central,composite total inner central + m,composite total inner outer,composite total inner outer + m,composite total outer central,composite total outer central + m,composite total outer inner,composite total outer inner + m,composite total outer outer,composite total outer outer + m,gmm,mahalanobis
ind_dataset,eval,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1,Unnamed: 22_level_1,Unnamed: 23_level_1,Unnamed: 24_level_1,Unnamed: 25_level_1,Unnamed: 26_level_1,Unnamed: 27_level_1,Unnamed: 28_level_1,Unnamed: 29_level_1,Unnamed: 30_level_1,Unnamed: 31_level_1,Unnamed: 32_level_1,Unnamed: 33_level_1,Unnamed: 34_level_1,Unnamed: 35_level_1,Unnamed: 36_level_1,Unnamed: 37_level_1,Unnamed: 38_level_1,Unnamed: 39_level_1,Unnamed: 40_level_1,Unnamed: 41_level_1,Unnamed: 42_level_1,Unnamed: 43_level_1,Unnamed: 44_level_1,Unnamed: 45_level_1,Unnamed: 46_level_1,Unnamed: 47_level_1,Unnamed: 48_level_1,Unnamed: 49_level_1,Unnamed: 50_level_1,Unnamed: 51_level_1,Unnamed: 52_level_1,Unnamed: 53_level_1,Unnamed: 54_level_1,Unnamed: 55_level_1,Unnamed: 56_level_1,Unnamed: 57_level_1,Unnamed: 58_level_1,Unnamed: 59_level_1,Unnamed: 60_level_1,Unnamed: 61_level_1,Unnamed: 62_level_1,Unnamed: 63_level_1,Unnamed: 64_level_1,Unnamed: 65_level_1,Unnamed: 66_level_1,Unnamed: 67_level_1,Unnamed: 68_level_1,Unnamed: 69_level_1,Unnamed: 70_level_1,Unnamed: 71_level_1,Unnamed: 72_level_1,Unnamed: 73_level_1,Unnamed: 74_level_1,Unnamed: 75_level_1,Unnamed: 76_level_1,Unnamed: 77_level_1,Unnamed: 78_level_1,Unnamed: 79_level_1,Unnamed: 80_level_1,Unnamed: 81_level_1,Unnamed: 82_level_1,Unnamed: 83_level_1,Unnamed: 84_level_1,Unnamed: 85_level_1,Unnamed: 86_level_1,Unnamed: 87_level_1,Unnamed: 88_level_1,Unnamed: 89_level_1,Unnamed: 90_level_1,Unnamed: 91_level_1,Unnamed: 92_level_1,Unnamed: 93_level_1,Unnamed: 94_level_1,Unnamed: 95_level_1,Unnamed: 96_level_1,Unnamed: 97_level_1,Unnamed: 98_level_1,Unnamed: 99_level_1,Unnamed: 100_level_1,Unnamed: 
101_level_1,Unnamed: 102_level_1,Unnamed: 103_level_1,Unnamed: 104_level_1,Unnamed: 105_level_1,Unnamed: 106_level_1,Unnamed: 107_level_1,Unnamed: 108_level_1,Unnamed: 109_level_1,Unnamed: 110_level_1,Unnamed: 111_level_1,Unnamed: 112_level_1,Unnamed: 113_level_1,Unnamed: 114_level_1,Unnamed: 115_level_1,Unnamed: 116_level_1,Unnamed: 117_level_1,Unnamed: 118_level_1,Unnamed: 119_level_1,Unnamed: 120_level_1,Unnamed: 121_level_1,Unnamed: 122_level_1,Unnamed: 123_level_1,Unnamed: 124_level_1,Unnamed: 125_level_1,Unnamed: 126_level_1,Unnamed: 127_level_1,Unnamed: 128_level_1,Unnamed: 129_level_1,Unnamed: 130_level_1,Unnamed: 131_level_1,Unnamed: 132_level_1,Unnamed: 133_level_1,Unnamed: 134_level_1,Unnamed: 135_level_1,Unnamed: 136_level_1,Unnamed: 137_level_1,Unnamed: 138_level_1,Unnamed: 139_level_1,Unnamed: 140_level_1,Unnamed: 141_level_1,Unnamed: 142_level_1,Unnamed: 143_level_1,Unnamed: 144_level_1,Unnamed: 145_level_1,Unnamed: 146_level_1,Unnamed: 147_level_1,Unnamed: 148_level_1,Unnamed: 149_level_1
cifar10,cifar10 [miscls],0.942466,0.942267,0.942228,0.941776,0.945782,0.944886,0.945782,0.945872,0.945782,0.944413,0.943949,0.945872,0.942366,0.94043,0.943107,0.798849,0.942365,0.941645,0.941898,0.796675,0.942365,0.936452,0.942409,0.796675,0.942365,0.939707,0.941616,0.79584,0.5,0.5,0.5,0.5,0.5,0.915035,0.926371,0.5,0.942365,0.943296,0.942258,0.79584,0.5,0.921213,0.914136,0.5,0.5,0.5,0.5,0.5,0.945045,0.943244,0.945171,0.945431,0.945782,0.944886,0.945782,0.945871,0.945782,0.942223,0.94564,0.945871,0.945045,0.943245,0.945171,0.945432,0.945782,0.944886,0.945782,0.945872,0.945782,0.942223,0.94564,0.945872,0.945045,0.944547,0.943559,0.945432,0.945782,0.944624,0.943767,0.945872,0.945782,0.944413,0.943949,0.945872,0.94531,0.945707,0.94575,0.945697,0.942215,0.942168,0.942462,0.943096,0.944448,0.944807,0.939078,0.93977,0.943103,0.943618,0.941745,0.942006,0.944762,0.944299,0.943764,0.943972,0.942477,0.942925,0.943038,0.943216,0.944622,0.944132,0.944567,0.944118,0.945507,0.944649,0.945688,0.944717,0.945234,0.944483,0.935861,0.936884,0.941871,0.940037,0.934109,0.935814,0.940514,0.939308,0.941534,0.940975,0.942911,0.941753,0.942233,0.941031,0.945199,0.945598,0.944752,0.945196,0.945364,0.945428,0.944912,0.945123,0.945363,0.945428,0.94575,0.945697,0.944912,0.945123,0.908478,0.927621
cifar10,cifar10 [selective],0.996836,0.996818,0.996827,0.99681,0.996959,0.99692,0.996959,0.996962,0.996959,0.996793,0.996891,0.996962,0.996913,0.996843,0.996936,0.98468,0.996913,0.996886,0.996698,0.982762,0.996913,0.996693,0.996769,0.982762,0.996913,0.996818,0.996751,0.983991,0.963044,0.963044,0.963044,0.963044,0.963044,0.995857,0.995431,0.963044,0.996913,0.996954,0.996802,0.983991,0.963044,0.996096,0.993922,0.963044,0.963044,0.963044,0.963044,0.963044,0.996931,0.996864,0.996936,0.996946,0.996959,0.99692,0.996959,0.996962,0.996959,0.996823,0.996954,0.996962,0.996932,0.996864,0.996936,0.996946,0.996959,0.99692,0.996959,0.996962,0.996959,0.996823,0.996954,0.996962,0.996932,0.99683,0.996876,0.996946,0.996959,0.996818,0.996884,0.996962,0.996959,0.996793,0.996891,0.996962,0.996909,0.996986,0.996955,0.996989,0.996821,0.996862,0.996762,0.996886,0.996831,0.996945,0.996709,0.996768,0.99686,0.996908,0.996807,0.996853,0.996918,0.996938,0.996882,0.996923,0.996837,0.996871,0.996857,0.996881,0.996916,0.996916,0.996914,0.996915,0.996949,0.996937,0.996955,0.99694,0.996938,0.99693,0.996668,0.99664,0.996903,0.996753,0.996578,0.996598,0.996851,0.996728,0.996881,0.99679,0.996933,0.996819,0.996911,0.996791,0.996906,0.996982,0.996896,0.996964,0.996941,0.996979,0.996926,0.996964,0.996941,0.996979,0.996955,0.996989,0.996926,0.996964,0.995186,0.996266
cifar10,cifar100 [ood],0.914436,0.916906,0.914506,0.913191,0.913049,0.916237,0.913049,0.91123,0.913049,0.912008,0.909164,0.91123,0.902342,0.90473,0.904375,0.753831,0.902342,0.907203,0.902404,0.754648,0.902342,0.902604,0.903989,0.754648,0.902343,0.903442,0.901813,0.751104,0.5,0.5,0.5,0.5,0.5,0.886252,0.871818,0.5,0.902343,0.906725,0.902784,0.751104,0.5,0.891379,0.859924,0.5,0.5,0.5,0.5,0.5,0.910004,0.911507,0.911267,0.911053,0.913049,0.916237,0.913049,0.91123,0.913049,0.915012,0.91258,0.91123,0.910004,0.911507,0.911267,0.911053,0.913049,0.916237,0.913049,0.91123,0.913049,0.915012,0.91258,0.91123,0.910004,0.910125,0.907795,0.911053,0.913049,0.912355,0.908703,0.91123,0.913049,0.912008,0.909164,0.91123,0.911458,0.916188,0.913361,0.917286,0.914757,0.918552,0.911548,0.917616,0.909821,0.916069,0.912446,0.917708,0.911133,0.916611,0.91418,0.918787,0.915309,0.919366,0.912921,0.917981,0.905485,0.911915,0.906203,0.912027,0.910118,0.914651,0.909678,0.914102,0.91205,0.915964,0.912293,0.916103,0.911517,0.915542,0.899801,0.906773,0.904244,0.906634,0.897684,0.906262,0.903081,0.905827,0.903889,0.906506,0.905259,0.907384,0.904362,0.906492,0.9114,0.916118,0.909804,0.914654,0.91305,0.917036,0.911142,0.91537,0.91305,0.917036,0.913361,0.917286,0.911142,0.91537,0.899817,0.912238
cifar10,svhn [ood],0.958357,0.962992,0.95853,0.956294,0.957686,0.96315,0.957686,0.954723,0.957686,0.960044,0.951817,0.954723,0.940173,0.942616,0.941999,0.82336,0.940173,0.945786,0.942129,0.824603,0.940173,0.939684,0.941816,0.824603,0.940173,0.940879,0.94114,0.817941,0.5,0.5,0.5,0.5,0.5,0.916405,0.931379,0.5,0.940173,0.945094,0.942173,0.817941,0.5,0.923651,0.929676,0.5,0.5,0.5,0.5,0.5,0.953304,0.956506,0.955074,0.954225,0.957686,0.96315,0.957686,0.954722,0.957686,0.961888,0.957069,0.954722,0.953304,0.956506,0.955074,0.954225,0.957686,0.96315,0.957686,0.954723,0.957686,0.961888,0.957069,0.954723,0.953304,0.956816,0.949716,0.954225,0.957686,0.960396,0.951144,0.954723,0.957686,0.960044,0.951817,0.954723,0.956342,0.95546,0.958291,0.95708,0.959149,0.957428,0.95939,0.957043,0.956325,0.954897,0.958347,0.956338,0.955968,0.955474,0.960818,0.958548,0.961855,0.959268,0.958802,0.957479,0.946614,0.947329,0.947366,0.947741,0.953561,0.952546,0.952671,0.951884,0.95633,0.954567,0.956686,0.954795,0.955431,0.9539,0.935593,0.937999,0.94172,0.941481,0.932508,0.935641,0.940345,0.94045,0.941313,0.941868,0.943061,0.943094,0.94191,0.942005,0.956284,0.95542,0.953772,0.9534,0.95795,0.956827,0.955087,0.954516,0.95795,0.956827,0.958291,0.95708,0.955087,0.954516,0.945122,0.934311
cifar10,tiny_imagenet [ood],0.908611,0.911364,0.908679,0.90721,0.905817,0.909549,0.905817,0.903803,0.905817,0.905885,0.901146,0.903803,0.893229,0.895731,0.895592,0.751893,0.893229,0.898685,0.893123,0.752376,0.893229,0.893504,0.894407,0.752376,0.893229,0.894216,0.892264,0.750169,0.5,0.5,0.5,0.5,0.5,0.876192,0.863491,0.5,0.893229,0.89802,0.893819,0.750169,0.5,0.88156,0.854579,0.5,0.5,0.5,0.5,0.5,0.902105,0.903615,0.903609,0.903474,0.905817,0.909549,0.905816,0.903803,0.905817,0.907927,0.905196,0.903803,0.902105,0.903615,0.903609,0.903475,0.905817,0.909549,0.905817,0.903803,0.905817,0.907927,0.905195,0.903803,0.902105,0.90285,0.899536,0.903475,0.905817,0.905847,0.900596,0.903803,0.905817,0.905885,0.901146,0.903803,0.904165,0.9103,0.906199,0.911467,0.908978,0.914002,0.904297,0.91221,0.902436,0.910507,0.905055,0.912134,0.903171,0.910442,0.906896,0.913213,0.908262,0.913944,0.905279,0.912092,0.896792,0.905456,0.897663,0.905623,0.902194,0.908592,0.901726,0.907981,0.904546,0.91023,0.904868,0.910436,0.903902,0.909721,0.890309,0.899912,0.895224,0.899539,0.887902,0.899597,0.893932,0.898523,0.895018,0.899209,0.896608,0.900295,0.895476,0.899254,0.904041,0.91017,0.902015,0.908349,0.905751,0.911102,0.903385,0.909027,0.905751,0.911102,0.906199,0.911467,0.903385,0.909027,0.899828,0.910273
cifar100,cifar10 [ood],0.773,0.77327,0.773388,0.772177,0.774385,0.774538,0.774385,0.771173,0.774385,0.775281,0.762904,0.771173,0.681292,0.724548,0.717172,0.675933,0.681292,0.736746,0.72158,0.689059,0.681292,0.718033,0.714663,0.689059,0.681292,0.716302,0.711027,0.672513,0.5,0.5,0.5,0.5,0.5,0.616365,0.698336,0.5,0.681292,0.729777,0.731558,0.672513,0.5,0.642769,0.716916,0.5,0.5,0.5,0.5,0.5,0.769313,0.774023,0.773545,0.770729,0.774385,0.774538,0.774385,0.771173,0.774385,0.774192,0.773969,0.771173,0.769313,0.774023,0.773545,0.770729,0.774385,0.774538,0.774385,0.771173,0.774385,0.774192,0.773969,0.771173,0.769313,0.775125,0.7583,0.770729,0.774385,0.775507,0.759703,0.771173,0.774385,0.775281,0.762904,0.771173,0.773897,0.768981,0.774314,0.769471,0.77331,0.768658,0.772453,0.763502,0.77318,0.76296,0.76888,0.761143,0.771035,0.763377,0.772023,0.765058,0.773934,0.766795,0.772271,0.76479,0.73346,0.726607,0.742945,0.735063,0.767757,0.757583,0.768135,0.758395,0.770902,0.761256,0.771546,0.762149,0.770645,0.761095,0.69879,0.680565,0.7102,0.698633,0.67137,0.637771,0.70182,0.689606,0.710276,0.698776,0.717831,0.705528,0.709955,0.697744,0.773856,0.768918,0.772499,0.767078,0.774217,0.769363,0.773314,0.768061,0.774217,0.769363,0.774314,0.769471,0.773314,0.768061,0.62039,0.534822
cifar100,cifar100 [miscls],0.857773,0.845094,0.856181,0.858986,0.865555,0.850089,0.865555,0.870135,0.865555,0.858536,0.86465,0.870135,0.782572,0.818006,0.82975,0.785608,0.782572,0.831543,0.83724,0.806319,0.782572,0.8042,0.827383,0.806319,0.782572,0.808522,0.818866,0.758041,0.5,0.5,0.5,0.5,0.5,0.653943,0.803837,0.5,0.782572,0.828096,0.842536,0.758041,0.5,0.690839,0.821959,0.5,0.5,0.5,0.5,0.5,0.866375,0.853064,0.867947,0.86996,0.865555,0.850089,0.865555,0.870135,0.865555,0.84881,0.867136,0.870135,0.866375,0.853064,0.867948,0.86996,0.865555,0.850089,0.865555,0.870135,0.865555,0.84881,0.867136,0.870135,0.866375,0.861057,0.862191,0.86996,0.865555,0.858551,0.862191,0.870135,0.865555,0.858536,0.86465,0.870135,0.867556,0.865852,0.864266,0.862462,0.855261,0.853341,0.849985,0.843049,0.861422,0.853821,0.838427,0.833501,0.852731,0.848176,0.849641,0.845758,0.854882,0.850801,0.853508,0.849159,0.838265,0.834956,0.851391,0.846659,0.865506,0.85924,0.867017,0.86095,0.868471,0.8624,0.869254,0.863207,0.868659,0.862668,0.791191,0.775738,0.812647,0.803934,0.761491,0.728523,0.801925,0.79248,0.819044,0.810417,0.828895,0.819411,0.817947,0.808624,0.867564,0.865844,0.868187,0.866175,0.864622,0.862832,0.866182,0.864096,0.864622,0.862831,0.864266,0.862462,0.866182,0.864096,0.661662,0.573908
cifar100,cifar100 [selective],0.920203,0.915943,0.919719,0.920576,0.922462,0.917541,0.922462,0.92372,0.922462,0.920209,0.922336,0.92372,0.899957,0.909667,0.914149,0.880184,0.899957,0.913284,0.916155,0.878853,0.899957,0.90564,0.913539,0.878853,0.899956,0.907047,0.91114,0.862183,0.74984,0.74984,0.74984,0.74984,0.74984,0.856236,0.905865,0.74984,0.899956,0.912781,0.917248,0.862183,0.74984,0.869099,0.910593,0.74984,0.74984,0.74984,0.74984,0.74984,0.922771,0.918425,0.923118,0.923681,0.922462,0.917541,0.922462,0.923719,0.922462,0.917088,0.922896,0.923719,0.922771,0.918425,0.923118,0.923681,0.922462,0.917541,0.922462,0.92372,0.922462,0.917088,0.922896,0.92372,0.922771,0.921044,0.921776,0.923681,0.922462,0.920294,0.921776,0.92372,0.922462,0.920209,0.922336,0.92372,0.92308,0.921382,0.922002,0.920265,0.919374,0.917596,0.91748,0.913191,0.921188,0.916262,0.913828,0.910473,0.918398,0.915266,0.91732,0.914529,0.918973,0.916009,0.918591,0.915536,0.916049,0.913338,0.919254,0.916246,0.922557,0.91836,0.922939,0.918888,0.92327,0.919192,0.923478,0.919428,0.923327,0.919304,0.902139,0.89322,0.909242,0.9031,0.892972,0.876317,0.90619,0.89975,0.910219,0.904367,0.913108,0.906847,0.910254,0.9039,0.923071,0.921371,0.92323,0.921406,0.922083,0.920361,0.922518,0.920665,0.922083,0.920361,0.922002,0.920265,0.922518,0.920665,0.842324,0.81055
cifar100,svhn [ood],0.858293,0.87012,0.86097,0.855937,0.856738,0.870178,0.856738,0.846668,0.856738,0.867147,0.827973,0.846668,0.662081,0.755848,0.723351,0.679433,0.662081,0.77634,0.731242,0.705718,0.662081,0.749942,0.718591,0.705718,0.662081,0.742349,0.713226,0.683783,0.5,0.5,0.5,0.5,0.5,0.618154,0.692685,0.5,0.662081,0.761028,0.750824,0.683783,0.5,0.651612,0.728006,0.5,0.5,0.5,0.5,0.5,0.839867,0.867727,0.852639,0.844381,0.856738,0.870178,0.856738,0.846668,0.856738,0.870307,0.854648,0.846668,0.839867,0.867727,0.852639,0.844381,0.856738,0.870178,0.856738,0.846668,0.856738,0.870307,0.854648,0.846668,0.839867,0.864736,0.815066,0.844381,0.856738,0.867298,0.819928,0.846668,0.856738,0.867147,0.827973,0.846668,0.855796,0.862481,0.858672,0.864237,0.861924,0.867208,0.863742,0.870301,0.858499,0.864398,0.866185,0.874833,0.86012,0.867458,0.864849,0.872346,0.865641,0.873233,0.862869,0.870357,0.760593,0.777544,0.777238,0.79273,0.838154,0.846729,0.837161,0.844719,0.845427,0.853246,0.846624,0.853869,0.844065,0.851579,0.706587,0.716508,0.715936,0.72199,0.658771,0.665012,0.703075,0.708337,0.717968,0.723638,0.730109,0.734826,0.715296,0.720123,0.855702,0.862376,0.851355,0.85816,0.858228,0.863901,0.854767,0.860731,0.858228,0.863901,0.858672,0.864237,0.854767,0.860731,0.710019,0.678832
cifar100,tiny_imagenet [ood],0.789521,0.809888,0.806267,0.803022,0.937085,0.926019,0.937085,0.946611,0.937085,0.995658,0.999927,0.946611,0.953406,0.999852,0.991516,0.973368,0.953406,0.999942,0.994416,0.976322,0.953406,0.9999,0.989533,0.976322,0.953406,0.999722,0.979255,0.792076,0.5,0.5,0.5,0.5,0.5,0.997001,0.953196,0.5,0.953406,0.999561,0.998722,0.792076,0.5,0.999526,0.990813,0.5,0.5,0.5,0.5,0.5,0.99913,0.999997,0.992987,0.965251,0.937085,0.926019,0.937085,0.946611,0.937085,0.979732,0.979339,0.946611,0.99913,0.999997,0.992987,0.965251,0.937085,0.926019,0.937085,0.946611,0.937085,0.979732,0.979339,0.946611,0.99913,0.999972,0.999972,0.965251,0.937085,0.998817,0.999942,0.946611,0.937085,0.995658,0.999927,0.946611,0.981943,0.981906,0.937878,0.939526,0.80281,0.804428,0.999991,0.999986,0.999996,0.999991,0.999952,0.999934,0.999999,0.999997,0.999998,0.999993,0.99994,0.999887,1.0,0.999998,0.994982,0.993658,0.999404,0.997104,0.999574,0.998939,0.999937,0.99959,0.999908,0.99957,0.999292,0.998815,0.999919,0.999589,0.999105,0.998867,0.993652,0.992437,0.993809,0.992579,0.989008,0.987311,0.995487,0.994582,0.995336,0.994481,0.994084,0.993126,0.99504,0.994024,0.999957,0.999919,0.968206,0.969222,0.999916,0.999857,0.968206,0.969222,0.937878,0.939526,0.999916,0.999857,0.563975,0.622941


In [7]:
# Display the companion table unpacked alongside transformed_df; it is only
# meaningful when include_std is True.
# NOTE(review): presumably the standard deviation across ensemble groups for
# each entry of transformed_df; confirm against transform_by_tasks.
std_df

Unnamed: 0_level_0,Unnamed: 1_level_0,R_b 1 (Brier),R_b 1 (Logscore),R_b 1 (Spherical),R_b 1 (Zero-one),R_b 2 (Brier),R_b 2 (Logscore),R_b 2 (Spherical),R_b 2 (Zero-one),R_b 3 (Brier),R_b 3 (Logscore),R_b 3 (Spherical),R_b 3 (Zero-one),R_e 1 1 (Brier),R_e 1 1 (Logscore),R_e 1 1 (Spherical),R_e 1 1 (Zero-one),R_e 1 2 (Brier),R_e 1 2 (Logscore),R_e 1 2 (Spherical),R_e 1 2 (Zero-one),R_e 1 3 (Brier),R_e 1 3 (Logscore),R_e 1 3 (Spherical),R_e 1 3 (Zero-one),R_e 2 1 (Brier),R_e 2 1 (Logscore),R_e 2 1 (Spherical),R_e 2 1 (Zero-one),R_e 2 2 (Brier),R_e 2 2 (Logscore),R_e 2 2 (Spherical),R_e 2 2 (Zero-one),R_e 2 3 (Brier),R_e 2 3 (Logscore),R_e 2 3 (Spherical),R_e 2 3 (Zero-one),R_e 3 1 (Brier),R_e 3 1 (Logscore),R_e 3 1 (Spherical),R_e 3 1 (Zero-one),R_e 3 2 (Brier),R_e 3 2 (Logscore),R_e 3 2 (Spherical),R_e 3 2 (Zero-one),R_e 3 3 (Brier),R_e 3 3 (Logscore),R_e 3 3 (Spherical),R_e 3 3 (Zero-one),R_t 1 1 (Brier),R_t 1 1 (Logscore),R_t 1 1 (Spherical),R_t 1 1 (Zero-one),R_t 1 2 (Brier),R_t 1 2 (Logscore),R_t 1 2 (Spherical),R_t 1 2 (Zero-one),R_t 1 3 (Brier),R_t 1 3 (Logscore),R_t 1 3 (Spherical),R_t 1 3 (Zero-one),R_t 2 1 (Brier),R_t 2 1 (Logscore),R_t 2 1 (Spherical),R_t 2 1 (Zero-one),R_t 2 2 (Brier),R_t 2 2 (Logscore),R_t 2 2 (Spherical),R_t 2 2 (Zero-one),R_t 2 3 (Brier),R_t 2 3 (Logscore),R_t 2 3 (Spherical),R_t 2 3 (Zero-one),R_t 3 1 (Brier),R_t 3 1 (Logscore),R_t 3 1 (Spherical),R_t 3 1 (Zero-one),R_t 3 2 (Brier),R_t 3 2 (Logscore),R_t 3 2 (Spherical),R_t 3 2 (Zero-one),R_t 3 3 (Brier),R_t 3 3 (Logscore),R_t 3 3 (Spherical),R_t 3 3 (Zero-one),composite bayes all central,composite bayes all central + m,composite bayes all inner,composite bayes all inner + m,composite bayes all outer,composite bayes all outer + m,composite eat logscore central inner,composite eat logscore central inner + m,composite eat logscore central outer,composite eat logscore central outer + m,composite eat logscore inner central,composite eat logscore inner central + m,composite eat logscore 
inner outer,composite eat logscore inner outer + m,composite eat logscore outer central,composite eat logscore outer central + m,composite eat logscore outer inner,composite eat logscore outer inner + m,composite eat logscore outer outer,composite eat logscore outer outer + m,composite eat spherical central inner,composite eat spherical central inner + m,composite eat spherical central outer,composite eat spherical central outer + m,composite eat spherical inner central,composite eat spherical inner central + m,composite eat spherical inner outer,composite eat spherical inner outer + m,composite eat spherical outer central,composite eat spherical outer central + m,composite eat spherical outer inner,composite eat spherical outer inner + m,composite eat spherical outer outer,composite eat spherical outer outer + m,composite excess all central inner,composite excess all central inner + m,composite excess all central outer,composite excess all central outer + m,composite excess all inner central,composite excess all inner central + m,composite excess all inner outer,composite excess all inner outer + m,composite excess all outer central,composite excess all outer central + m,composite excess all outer inner,composite excess all outer inner + m,composite excess all outer outer,composite excess all outer outer + m,composite total central inner,composite total central inner + m,composite total central outer,composite total central outer + m,composite total inner central,composite total inner central + m,composite total inner outer,composite total inner outer + m,composite total outer central,composite total outer central + m,composite total outer inner,composite total outer inner + m,composite total outer outer,composite total outer outer + m,gmm,mahalanobis
ind_dataset,eval,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1,Unnamed: 22_level_1,Unnamed: 23_level_1,Unnamed: 24_level_1,Unnamed: 25_level_1,Unnamed: 26_level_1,Unnamed: 27_level_1,Unnamed: 28_level_1,Unnamed: 29_level_1,Unnamed: 30_level_1,Unnamed: 31_level_1,Unnamed: 32_level_1,Unnamed: 33_level_1,Unnamed: 34_level_1,Unnamed: 35_level_1,Unnamed: 36_level_1,Unnamed: 37_level_1,Unnamed: 38_level_1,Unnamed: 39_level_1,Unnamed: 40_level_1,Unnamed: 41_level_1,Unnamed: 42_level_1,Unnamed: 43_level_1,Unnamed: 44_level_1,Unnamed: 45_level_1,Unnamed: 46_level_1,Unnamed: 47_level_1,Unnamed: 48_level_1,Unnamed: 49_level_1,Unnamed: 50_level_1,Unnamed: 51_level_1,Unnamed: 52_level_1,Unnamed: 53_level_1,Unnamed: 54_level_1,Unnamed: 55_level_1,Unnamed: 56_level_1,Unnamed: 57_level_1,Unnamed: 58_level_1,Unnamed: 59_level_1,Unnamed: 60_level_1,Unnamed: 61_level_1,Unnamed: 62_level_1,Unnamed: 63_level_1,Unnamed: 64_level_1,Unnamed: 65_level_1,Unnamed: 66_level_1,Unnamed: 67_level_1,Unnamed: 68_level_1,Unnamed: 69_level_1,Unnamed: 70_level_1,Unnamed: 71_level_1,Unnamed: 72_level_1,Unnamed: 73_level_1,Unnamed: 74_level_1,Unnamed: 75_level_1,Unnamed: 76_level_1,Unnamed: 77_level_1,Unnamed: 78_level_1,Unnamed: 79_level_1,Unnamed: 80_level_1,Unnamed: 81_level_1,Unnamed: 82_level_1,Unnamed: 83_level_1,Unnamed: 84_level_1,Unnamed: 85_level_1,Unnamed: 86_level_1,Unnamed: 87_level_1,Unnamed: 88_level_1,Unnamed: 89_level_1,Unnamed: 90_level_1,Unnamed: 91_level_1,Unnamed: 92_level_1,Unnamed: 93_level_1,Unnamed: 94_level_1,Unnamed: 95_level_1,Unnamed: 96_level_1,Unnamed: 97_level_1,Unnamed: 98_level_1,Unnamed: 99_level_1,Unnamed: 100_level_1,Unnamed: 
101_level_1,Unnamed: 102_level_1,Unnamed: 103_level_1,Unnamed: 104_level_1,Unnamed: 105_level_1,Unnamed: 106_level_1,Unnamed: 107_level_1,Unnamed: 108_level_1,Unnamed: 109_level_1,Unnamed: 110_level_1,Unnamed: 111_level_1,Unnamed: 112_level_1,Unnamed: 113_level_1,Unnamed: 114_level_1,Unnamed: 115_level_1,Unnamed: 116_level_1,Unnamed: 117_level_1,Unnamed: 118_level_1,Unnamed: 119_level_1,Unnamed: 120_level_1,Unnamed: 121_level_1,Unnamed: 122_level_1,Unnamed: 123_level_1,Unnamed: 124_level_1,Unnamed: 125_level_1,Unnamed: 126_level_1,Unnamed: 127_level_1,Unnamed: 128_level_1,Unnamed: 129_level_1,Unnamed: 130_level_1,Unnamed: 131_level_1,Unnamed: 132_level_1,Unnamed: 133_level_1,Unnamed: 134_level_1,Unnamed: 135_level_1,Unnamed: 136_level_1,Unnamed: 137_level_1,Unnamed: 138_level_1,Unnamed: 139_level_1,Unnamed: 140_level_1,Unnamed: 141_level_1,Unnamed: 142_level_1,Unnamed: 143_level_1,Unnamed: 144_level_1,Unnamed: 145_level_1,Unnamed: 146_level_1,Unnamed: 147_level_1,Unnamed: 148_level_1,Unnamed: 149_level_1
cifar10,cifar10 [miscls],0.00156,0.001585,0.001625,0.001838,0.002001,0.001597,0.002001,0.002047,0.002001,0.002152,0.002248,0.002047,0.00319,0.003253,0.002757,0.009169,0.003191,0.003134,0.002478,0.007763,0.003191,0.002741,0.002774,0.007763,0.003189,0.00329,0.00337,0.010165,0.0,0.0,0.0,0.0,0.0,0.002458,0.005676,0.0,0.003189,0.003404,0.002794,0.010165,0.0,0.00257,0.004741,0.0,0.0,0.0,0.0,0.0,0.002336,0.002413,0.002195,0.00176,0.002001,0.001597,0.002001,0.002047,0.002001,0.001432,0.002068,0.002047,0.002336,0.002413,0.002195,0.00176,0.002001,0.001597,0.002001,0.002047,0.002001,0.001432,0.002068,0.002047,0.002336,0.002725,0.002298,0.00176,0.002001,0.002054,0.002244,0.002047,0.002001,0.002152,0.002248,0.002047,0.002108,0.001741,0.001987,0.001605,0.001612,0.001502,0.001342,0.001195,0.00274327,0.002153,0.001203,0.00096,0.002487834,0.002109,0.001478748,0.001218,0.001901,0.001473,0.002382536,0.001925,0.002359,0.002146,0.002357,0.002116,0.002316,0.002014,0.002304,0.001989,0.00217,0.001843,0.002133,0.001812,0.002183,0.001886,0.00266,0.001732,0.003021,0.002086,0.003089,0.002007,0.003013,0.002069,0.003113,0.002275,0.003174,0.002335,0.003163,0.002284,0.002105,0.001762,0.002302,0.002042,0.002034,0.001638,0.002243,0.001958,0.002034,0.001638,0.001987,0.001605,0.002243,0.001958,0.002864,0.002597
cifar10,cifar10 [selective],4.4e-05,4.9e-05,4.6e-05,5.2e-05,6.4e-05,5.4e-05,6.4e-05,6.7e-05,6.4e-05,0.000128,8.1e-05,6.7e-05,0.000131,0.000145,0.000108,0.000813,0.000131,0.000142,0.000146,0.001835,0.000131,0.000131,0.000201,0.001835,0.000131,0.000145,0.000158,0.001345,0.001269,0.001269,0.001269,0.001269,0.001269,0.000108,0.00045,0.001269,0.000131,0.000147,9.3e-05,0.001345,0.001269,0.000119,0.000906,0.001269,0.001269,0.001269,0.001269,0.001269,8.2e-05,8.6e-05,7.7e-05,6.3e-05,6.4e-05,5.4e-05,6.4e-05,6.7e-05,6.4e-05,4.8e-05,6.8e-05,6.7e-05,8.2e-05,8.6e-05,7.7e-05,6.3e-05,6.4e-05,5.4e-05,6.4e-05,6.7e-05,6.4e-05,4.8e-05,6.8e-05,6.7e-05,8.2e-05,0.000136,8.4e-05,6.3e-05,6.4e-05,0.000116,8.1e-05,6.7e-05,6.4e-05,0.000128,8.1e-05,6.7e-05,8.3e-05,9.6e-05,6.5e-05,9e-05,4.6e-05,7.2e-05,8.3e-05,7e-05,0.0001347722,0.000106,4.5e-05,7.6e-05,8.698968e-05,0.000107,4.947673e-05,7.7e-05,6.6e-05,8.6e-05,8.345294e-05,0.0001,8.7e-05,0.000121,8.7e-05,0.000121,8.2e-05,0.000108,8.2e-05,0.000109,7.3e-05,9.8e-05,7e-05,9.5e-05,7.5e-05,0.000101,0.000134,0.000116,0.000135,0.000126,0.000192,0.00013,0.000136,0.000127,0.000142,0.00013,0.000142,0.000129,0.000141,0.000131,8.2e-05,9.7e-05,9e-05,0.000114,6.7e-05,9.2e-05,8e-05,0.00011,6.7e-05,9.2e-05,6.5e-05,9e-05,8e-05,0.00011,0.000146,4.4e-05
cifar10,cifar100 [ood],0.001158,0.001002,0.001188,0.001341,0.00088,0.000814,0.00088,0.000902,0.00088,0.00086,0.000692,0.000902,0.000409,0.000337,0.000395,0.001375,0.000409,0.000477,0.000521,0.001148,0.000409,0.000577,0.000296,0.001148,0.000409,0.000273,0.000621,0.001886,0.0,0.0,0.0,0.0,0.0,0.001484,0.001271,0.0,0.000409,0.000378,0.000591,0.001886,0.0,0.001421,0.002037,0.0,0.0,0.0,0.0,0.0,0.000723,0.000599,0.000786,0.00098,0.00088,0.000814,0.00088,0.000902,0.00088,0.000866,0.000847,0.000902,0.000723,0.000599,0.000786,0.00098,0.00088,0.000814,0.00088,0.000902,0.00088,0.000866,0.000848,0.000902,0.000723,0.000686,0.000613,0.00098,0.00088,0.000859,0.000666,0.000902,0.00088,0.00086,0.000692,0.000902,0.000879,0.000753,0.00088,0.000841,0.001181,0.001,0.00104,0.000843,0.0006860007,0.000728,0.000391,0.00081,0.0006540548,0.000933,0.00079578,0.000914,0.000712,0.000851,0.0006703764,0.000899,0.000517,0.000915,0.000535,0.000819,0.000799,0.000984,0.000741,0.000898,0.000738,0.000868,0.000773,0.000843,0.000687,0.000849,0.000339,0.001014,0.000544,0.000846,0.000199,0.001188,0.000564,0.000863,0.000427,0.000799,0.000498,0.000831,0.000482,0.000778,0.000881,0.000775,0.000793,0.000728,0.000895,0.000864,0.000777,0.000776,0.000895,0.000864,0.00088,0.000841,0.000777,0.000777,0.001025,0.001507
cifar10,svhn [ood],0.002077,0.002252,0.001807,0.001607,0.003653,0.002954,0.003653,0.003592,0.003653,0.002197,0.00713,0.003592,0.010346,0.012131,0.010035,0.039171,0.010346,0.011168,0.009751,0.038295,0.010346,0.013197,0.009979,0.038295,0.010346,0.012631,0.010373,0.036733,0.0,0.0,0.0,0.0,0.0,0.014967,0.011891,0.0,0.010346,0.010352,0.010125,0.036733,0.0,0.014801,0.012439,0.0,0.0,0.0,0.0,0.0,0.005975,0.007015,0.005324,0.004545,0.003653,0.002954,0.003653,0.003592,0.003653,0.004611,0.004215,0.003592,0.005975,0.007015,0.005324,0.004545,0.003653,0.002954,0.003653,0.003592,0.003653,0.004611,0.004215,0.003592,0.005975,0.004311,0.007855,0.004545,0.003653,0.002444,0.007425,0.003592,0.003653,0.002197,0.00713,0.003592,0.003848,0.003398,0.00348,0.003078,0.002007,0.002571,0.004628,0.003762,0.004551587,0.004141,0.006073,0.004687,0.007121325,0.006087,0.005211242,0.004085,0.004132,0.003327,0.006025423,0.00498,0.008884,0.00751,0.008533,0.007191,0.006219,0.005221,0.006469,0.005476,0.004678,0.003826,0.004293,0.003571,0.005221,0.00423,0.013378,0.010772,0.010637,0.009714,0.014239,0.010762,0.011163,0.010169,0.010807,0.009673,0.009938,0.008956,0.010503,0.009535,0.004122,0.003615,0.005787,0.005208,0.004032,0.00351,0.005781,0.005174,0.004032,0.00351,0.00348,0.003078,0.005781,0.005174,0.0055,0.005441
cifar10,tiny_imagenet [ood],0.001202,0.001037,0.001218,0.001339,0.001008,0.000887,0.001008,0.001085,0.001008,0.000939,0.000688,0.001085,0.000264,0.000245,0.000304,0.002406,0.000264,0.000113,0.000563,0.002218,0.000264,0.000527,0.00051,0.002218,0.000265,0.000388,0.000569,0.002812,0.0,0.0,0.0,0.0,0.0,0.00158,0.000626,0.0,0.000265,0.000321,0.000451,0.002812,0.0,0.001478,0.001358,0.0,0.0,0.0,0.0,0.0,0.000781,0.000583,0.000857,0.001086,0.001008,0.000887,0.001008,0.001085,0.001008,0.000841,0.000954,0.001085,0.000781,0.000583,0.000857,0.001086,0.001008,0.000887,0.001008,0.001085,0.001008,0.000841,0.000954,0.001085,0.000781,0.000809,0.000597,0.001086,0.001008,0.000949,0.000651,0.001085,0.001008,0.000939,0.000688,0.001085,0.001022,0.000638,0.001024,0.000674,0.001225,0.00081,0.001149,0.000644,0.0008777427,0.000669,0.000431,0.000388,0.0006143688,0.000641,0.0008137545,0.000615,0.000782,0.000604,0.0006413942,0.00062,0.000464,0.000565,0.000522,0.000477,0.000784,0.000661,0.000747,0.000576,0.000826,0.000586,0.00091,0.000607,0.00075,0.000545,0.000338,0.000727,0.000231,0.000672,0.000635,0.001028,0.000232,0.000694,0.000273,0.000569,0.00027,0.000645,0.000269,0.000605,0.001016,0.00064,0.000862,0.000532,0.001005,0.000661,0.000848,0.000548,0.001005,0.000661,0.001025,0.000674,0.000848,0.000549,0.001501,0.001056
cifar100,cifar10 [ood],0.002073,0.002164,0.001835,0.001594,0.001566,0.001926,0.001566,0.001321,0.001566,0.001843,0.001232,0.001321,0.001959,0.001497,0.002057,0.002313,0.001959,0.001248,0.002236,0.001753,0.001959,0.001827,0.002041,0.001753,0.001959,0.001507,0.001932,0.002702,0.0,0.0,0.0,0.0,0.0,0.0051,0.001812,0.0,0.001959,0.001183,0.002035,0.002702,0.0,0.004693,0.001112,0.0,0.0,0.0,0.0,0.0,0.000933,0.001598,0.001444,0.001276,0.001566,0.001926,0.001566,0.001321,0.001566,0.00192,0.001444,0.001321,0.000933,0.001598,0.001444,0.001276,0.001566,0.001926,0.001566,0.001321,0.001566,0.00192,0.001444,0.001321,0.000933,0.001549,0.001331,0.001276,0.001566,0.00183,0.001125,0.001321,0.001566,0.001843,0.001232,0.001321,0.001554,0.001319,0.001577,0.001369,0.00189,0.001714,0.001487,0.001493,0.001464561,0.00112,0.00107,0.001378,0.001084814,0.000912,0.001393048,0.000826,0.00153,0.001048,0.001190779,0.000902,0.000966,0.001637,0.001557,0.00191,0.001014,0.00173,0.000823,0.001313,0.00082,0.001544,0.000959,0.001519,0.00085,0.001445,0.002152,0.00209,0.002299,0.0022,0.001377,0.002698,0.002211,0.00214,0.001984,0.001894,0.002122,0.002104,0.002176,0.002044,0.001538,0.001285,0.001256,0.00097,0.001538,0.001309,0.001308,0.001011,0.001538,0.001309,0.001577,0.001369,0.001308,0.001011,0.003064,0.004189
cifar100,cifar100 [miscls],0.002891,0.002761,0.002897,0.002921,0.002871,0.002655,0.002871,0.003251,0.002871,0.002267,0.001487,0.003251,0.004912,0.002878,0.00316,0.003847,0.004912,0.002173,0.002656,0.003371,0.004912,0.002725,0.003271,0.003371,0.004913,0.003234,0.003902,0.006039,0.0,0.0,0.0,0.0,0.0,0.005075,0.0051,0.0,0.004913,0.002852,0.002498,0.006039,0.0,0.004444,0.003812,0.0,0.0,0.0,0.0,0.0,0.002852,0.002791,0.002701,0.00263,0.002871,0.002655,0.002871,0.003251,0.002871,0.002832,0.002746,0.003251,0.002852,0.002791,0.002701,0.00263,0.002871,0.002655,0.002871,0.003251,0.002871,0.002832,0.002746,0.003251,0.002852,0.002288,0.001515,0.00263,0.002871,0.002302,0.001524,0.003251,0.002871,0.002267,0.001487,0.003251,0.002558,0.002803,0.002922,0.003172,0.002831,0.002932,0.001854,0.002499,0.002086905,0.002537,0.003013,0.003435,0.00270345,0.002785,0.002941403,0.003083,0.002617,0.002861,0.002785602,0.002915,0.002736,0.002411,0.001859,0.00192,0.001939,0.002597,0.002099,0.002639,0.002686,0.003154,0.002952,0.003353,0.002584,0.003041,0.005891,0.004825,0.004243,0.003993,0.004383,0.00408,0.004399,0.004264,0.003319,0.002863,0.003003,0.002701,0.003541,0.003325,0.002574,0.002814,0.002345,0.002751,0.002947,0.003175,0.002733,0.003054,0.002947,0.003175,0.002922,0.003172,0.002733,0.003054,0.00312,0.006341
cifar100,cifar100 [selective],0.00076,0.00089,0.000799,0.000806,0.000728,0.00087,0.000728,0.000647,0.000728,0.000898,0.000605,0.000647,0.002144,0.001027,0.001282,0.00328,0.002144,0.000896,0.001035,0.002569,0.002144,0.001139,0.001334,0.002569,0.002144,0.001146,0.001311,0.006193,0.000884,0.000884,0.000884,0.000884,0.000884,0.002695,0.002495,0.000884,0.002144,0.00103,0.001054,0.006193,0.000884,0.00245,0.001814,0.000884,0.000884,0.000884,0.000884,0.000884,0.00057,0.000848,0.000702,0.000654,0.000728,0.00087,0.000728,0.000646,0.000728,0.000869,0.000711,0.000646,0.000571,0.000848,0.000702,0.000654,0.000728,0.00087,0.000728,0.000647,0.000728,0.000869,0.000711,0.000647,0.000571,0.00081,0.000617,0.000654,0.000728,0.000833,0.000612,0.000647,0.000728,0.000898,0.000605,0.000647,0.00073,0.000726,0.000744,0.000781,0.00081,0.000813,0.000815,0.000976,0.0007646247,0.000528,0.000806,0.001089,0.0008153439,0.000745,0.000854814,0.000858,0.000824,0.000831,0.0008325231,0.000767,0.001196,0.000972,0.000841,0.000716,0.0005,0.000652,0.00053,0.00062,0.000635,0.000724,0.000689,0.000747,0.000627,0.000698,0.002285,0.002217,0.001658,0.001487,0.002299,0.002599,0.001809,0.001776,0.00119,0.001125,0.001096,0.000963,0.001441,0.001351,0.00073,0.000728,0.00069,0.00073,0.000746,0.000777,0.000723,0.000777,0.000746,0.000777,0.000744,0.000781,0.000723,0.000777,0.001494,0.001328
cifar100,svhn [ood],0.005678,0.006667,0.006101,0.00591,0.005974,0.006407,0.005974,0.00594,0.005974,0.00574,0.005786,0.00594,0.007283,0.013424,0.010449,0.010311,0.007283,0.012359,0.011076,0.010597,0.007283,0.015692,0.010267,0.010597,0.007283,0.014047,0.009214,0.006846,0.0,0.0,0.0,0.0,0.0,0.025653,0.007831,0.0,0.007283,0.011389,0.011355,0.006846,0.0,0.025129,0.007801,0.0,0.0,0.0,0.0,0.0,0.005105,0.005873,0.005756,0.005935,0.005974,0.006407,0.005974,0.00594,0.005974,0.006308,0.005898,0.00594,0.005105,0.005873,0.005756,0.005935,0.005974,0.006407,0.005974,0.00594,0.005974,0.006308,0.005898,0.00594,0.005105,0.005266,0.006252,0.005935,0.005974,0.005665,0.005712,0.00594,0.005974,0.00574,0.005786,0.00594,0.006032,0.004973,0.006055,0.005037,0.006061,0.004761,0.006801,0.006275,0.006349699,0.005977,0.007014,0.005599,0.007095612,0.006383,0.006474975,0.005723,0.006162,0.005316,0.006906452,0.006133,0.007238,0.010379,0.009144,0.012426,0.007802,0.007641,0.006803,0.007156,0.007749,0.00722,0.0077,0.007204,0.007354,0.007073,0.01376,0.01842,0.009045,0.011661,0.013972,0.021797,0.009033,0.011767,0.011361,0.013652,0.010836,0.012914,0.010348,0.012592,0.006009,0.005013,0.005682,0.005161,0.006037,0.005079,0.005888,0.005208,0.006037,0.005079,0.006055,0.005037,0.005888,0.005208,0.032894,0.033548
cifar100,tiny_imagenet [ood],0.000841,0.000847,0.000601,0.00048,0.001409,0.000946,0.001409,0.002107,0.001409,0.000167,1.6e-05,0.002107,0.00278,3.8e-05,0.001059,0.002002,0.00278,9e-06,0.000746,0.001644,0.00278,4e-05,0.001207,0.001644,0.00278,7.7e-05,0.001896,0.003374,0.0,0.0,0.0,0.0,0.0,0.000511,0.002741,0.0,0.00278,9.9e-05,0.000216,0.003374,0.0,6.9e-05,0.000803,0.0,0.0,0.0,0.0,0.0,5.3e-05,4e-06,0.000764,0.001243,0.001409,0.000946,0.001409,0.002107,0.001409,0.000964,0.001161,0.002107,5.3e-05,4e-06,0.000764,0.001243,0.001409,0.000946,0.001409,0.002107,0.001409,0.000964,0.001161,0.002107,5.3e-05,9e-06,7e-06,0.001243,0.001409,8.3e-05,3e-05,0.002107,0.001409,0.000167,1.6e-05,0.002107,0.001174,0.001171,0.001429,0.001467,0.000652,0.000515,4e-06,4e-06,8.99424e-07,7e-06,2.5e-05,2.3e-05,5.486844e-07,4e-06,4.594368e-07,2e-06,1.7e-05,3.4e-05,1.702924e-07,2e-06,0.000531,0.000562,9.5e-05,0.000302,0.000126,0.000224,8e-06,2.8e-05,2.4e-05,0.000114,0.000228,0.000364,1.8e-05,0.000117,0.000191,0.000209,0.00171,0.001856,0.001402,0.001485,0.002542,0.002601,0.000706,0.00082,0.00074,0.000834,0.001206,0.001292,0.000497,0.000885,1.7e-05,2.6e-05,0.00151,0.001393,1.9e-05,4.2e-05,0.00151,0.001393,0.001429,0.001467,1.9e-05,4.2e-05,0.003721,0.005384


In [8]:
from configs.interesting_compositions import INTERESTING_COMPOSITIONS

# Print the name of every registered composition, one per line.
for composition_name in INTERESTING_COMPOSITIONS:
    print(composition_name)

COMPOSITE BAYES ALL OUTER
COMPOSITE BAYES ALL INNER
COMPOSITE BAYES ALL CENTRAL
COMPOSITE BAYES ALL OUTER + M
COMPOSITE BAYES ALL INNER + M
COMPOSITE BAYES ALL CENTRAL + M
COMPOSITE EXCESS ALL OUTER OUTER
COMPOSITE EXCESS ALL OUTER INNER
COMPOSITE EXCESS ALL OUTER CENTRAL
COMPOSITE EXCESS ALL INNER OUTER
COMPOSITE EXCESS ALL INNER CENTRAL
COMPOSITE EXCESS ALL CENTRAL OUTER
COMPOSITE EXCESS ALL CENTRAL INNER
COMPOSITE EXCESS ALL OUTER OUTER + M
COMPOSITE EXCESS ALL OUTER INNER + M
COMPOSITE EXCESS ALL OUTER CENTRAL + M
COMPOSITE EXCESS ALL INNER OUTER + M
COMPOSITE EXCESS ALL INNER CENTRAL + M
COMPOSITE EXCESS ALL CENTRAL OUTER + M
COMPOSITE EXCESS ALL CENTRAL INNER + M
COMPOSITE EAT LOGSCORE OUTER OUTER
COMPOSITE EAT LOGSCORE OUTER INNER
COMPOSITE EAT LOGSCORE OUTER CENTRAL
COMPOSITE EAT LOGSCORE INNER OUTER
COMPOSITE EAT LOGSCORE INNER CENTRAL
COMPOSITE EAT LOGSCORE CENTRAL OUTER
COMPOSITE EAT LOGSCORE CENTRAL INNER
COMPOSITE EAT LOGSCORE OUTER OUTER + M
COMPOSITE EAT LOGSCORE OUTER I

In [9]:
# Composite measure inspected in the cells below.
measure_name = "COMPOSITE EAT LOGSCORE OUTER OUTER + M"

# The same composite/component selection applied to the main table and to the
# std table (presumably the per-task standard deviations — confirm upstream).
res_df = select_composite_and_components(transformed_df, measure_name)
res_df_std = select_composite_and_components(std_df, measure_name)

# Adds the if_dominates_* and beats_worst_component flag columns.
res_df_with_dominance = check_composite_dominance(res_df)

# Pareto statistics for every composition, including its individual measures.
composite_pareto_results = analyze_composite_pareto_performance(
    transformed_df,
    INTERESTING_COMPOSITIONS,
    do_for_each_measure=True,
    different_only=False,
)

In [10]:
# Show the nested dict returned by analyze_composite_pareto_performance:
# one entry per composition, each carrying an 'individual_measures' sub-dict.
composite_pareto_results

{'COMPOSITE BAYES ALL OUTER': {'pareto_count': 36,
  'total_problems': 105,
  'pareto_percentage': 34.285714285714285,
  'average_pareto_depth': np.float64(0.8476190476190476),
  'median_pareto_depth': np.float64(1.0),
  'individual_measures': {'R_b 1 (Logscore)': {'pareto_count': 85,
    'total_problems': 105,
    'pareto_percentage': 80.95238095238095,
    'average_pareto_depth': np.float64(0.44761904761904764),
    'median_pareto_depth': np.float64(0.0)},
   'R_b 1 (Brier)': {'pareto_count': 64,
    'total_problems': 105,
    'pareto_percentage': 60.952380952380956,
    'average_pareto_depth': np.float64(0.8285714285714286),
    'median_pareto_depth': np.float64(0.0)},
   'R_b 1 (Spherical)': {'pareto_count': 54,
    'total_problems': 105,
    'pareto_percentage': 51.42857142857142,
    'average_pareto_depth': np.float64(0.6476190476190476),
    'median_pareto_depth': np.float64(0.0)},
   'R_b 1 (Zero-one)': {'pareto_count': 31,
    'total_problems': 105,
    'pareto_percentage': 29

In [11]:
# Tables for the selected composite: values with dominance flags, then the std table.
display(res_df_with_dominance)
display(res_df_std)

print("==" * 100)
print("Pareto Percentages:")

# composite_pareto_results is keyed by composition name, so look the selected
# measure up directly instead of scanning every entry. As before, nothing is
# printed when the measure is not present.
if measure_name in composite_pareto_results:
    result = composite_pareto_results[measure_name]
    indv_ = result["individual_measures"]
    print(measure_name, result["pareto_percentage"])
    for name, el in indv_.items():
        print(name, el["pareto_percentage"])

Unnamed: 0_level_0,measure,R_e 1 1 (Logscore),R_t 1 1 (Logscore),R_b 1 (Logscore),mahalanobis,composite eat logscore outer outer + m,if_dominates_100%,if_dominates_75%,if_dominates_50%,beats_worst_component
ind_dataset,eval,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1
cifar10,cifar10 [miscls],0.94043,0.943244,0.942267,0.927621,0.943972,True,True,True,True
cifar10,cifar10 [selective],0.996843,0.996864,0.996818,0.996266,0.996923,True,True,True,True
cifar10,cifar100 [ood],0.90473,0.911507,0.916906,0.912238,0.917981,True,True,True,True
cifar10,svhn [ood],0.942616,0.956506,0.962992,0.934311,0.957479,False,True,True,True
cifar10,tiny_imagenet [ood],0.895731,0.903615,0.911364,0.910273,0.912092,True,True,True,True
cifar100,cifar10 [ood],0.724548,0.774023,0.77327,0.534822,0.76479,False,False,True,True
cifar100,cifar100 [miscls],0.818006,0.853064,0.845094,0.573908,0.849159,False,True,True,True
cifar100,cifar100 [selective],0.909667,0.918425,0.915943,0.81055,0.915536,False,False,True,True
cifar100,svhn [ood],0.755848,0.867727,0.87012,0.678832,0.870357,True,True,True,True
cifar100,tiny_imagenet [ood],0.999852,0.999997,0.809888,0.622941,0.999998,True,True,True,True


Unnamed: 0_level_0,Unnamed: 1_level_0,R_e 1 1 (Logscore),R_t 1 1 (Logscore),R_b 1 (Logscore),mahalanobis,composite eat logscore outer outer + m
ind_dataset,eval,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1
cifar10,cifar10 [miscls],0.003253,0.002413,0.001585,0.002597,0.001925
cifar10,cifar10 [selective],0.000145,8.6e-05,4.9e-05,4.4e-05,0.0001
cifar10,cifar100 [ood],0.000337,0.000599,0.001002,0.001507,0.000899
cifar10,svhn [ood],0.012131,0.007015,0.002252,0.005441,0.00498
cifar10,tiny_imagenet [ood],0.000245,0.000583,0.001037,0.001056,0.00062
cifar100,cifar10 [ood],0.001497,0.001598,0.002164,0.004189,0.000902
cifar100,cifar100 [miscls],0.002878,0.002791,0.002761,0.006341,0.002915
cifar100,cifar100 [selective],0.001027,0.000848,0.00089,0.001328,0.000767
cifar100,svhn [ood],0.013424,0.005873,0.006667,0.033548,0.006133
cifar100,tiny_imagenet [ood],3.8e-05,4e-06,0.000847,0.005384,2e-06


Pareto Percentages:
COMPOSITE EAT LOGSCORE OUTER OUTER + M 82.85714285714286
R_e 1 1 (Logscore) 0.0
R_t 1 1 (Logscore) 65.71428571428571
R_b 1 (Logscore) 21.904761904761905
mahalanobis 0.0


In [12]:
# Flag columns present in res_df_with_dominance; they are not metric values and
# are removed before the per-task tables are built.
DOMINANCE_COLUMNS = [
    "if_dominates_100%",
    "if_dominates_75%",
    "if_dominates_50%",
    "beats_worst_component",
]


def split_by_task(df):
    """Split a results table into its OOD / misclassification / selective rows.

    Rows are selected by the bracketed task tag found in the ``eval`` index
    level (``[ood]``, ``[miscls]``, ``[selective]``).

    Args:
        df: DataFrame whose index has a level named ``eval``.

    Returns:
        Tuple ``(ood, miscls, selective)`` of row subsets of ``df``.
    """
    eval_labels = df.index.get_level_values("eval")
    return tuple(
        df[eval_labels.str.contains(rf"\[{tag}\]")]
        for tag in ("ood", "miscls", "selective")
    )


# Kept so that any other cell still referencing these index views keeps working.
lvl = res_df_with_dominance.index.get_level_values("eval")
lvl_std = res_df_std.index.get_level_values("eval")

# Value tables (dominance flags removed) and the matching std tables, per task.
df_ood, df_miscls, df_selective = split_by_task(
    res_df_with_dominance.drop(columns=DOMINANCE_COLUMNS)
)
df_ood_std, df_miscls_std, df_selective_std = split_by_task(res_df_std)

In [13]:
# Column order for the per-task tables: the composite first, then the other measures.
col_order = [
    "composite eat logscore outer outer + m",
    "R_e 1 1 (Logscore)",
    "R_t 1 1 (Logscore)",
    "R_b 1 (Logscore)",
    "mahalanobis",
]

In [14]:
# OOD-detection table: add the "AVG" row, reorder the columns, and render each
# cell via mean_pm_std before exporting to LaTeX.
# NOTE(review): df_ood / df_ood_std are overwritten here, so re-running this
# cell presumably stacks another AVG row on top of the previous one — confirm.
avg_label = ("AVG", "[all rows]")
df_ood = with_avg_row(df_ood, label=avg_label)[col_order]
df_ood_std = with_avg_row(df_ood_std, label=avg_label)[col_order]

latex_df = mean_pm_std(df_mean=df_ood, df_std=df_ood_std)
latex_table = latex_df.to_latex(escape=False)
print(latex_table)

\begin{tabular}{lllllll}
\toprule
 &  & composite eat logscore outer outer + m & R_e 1 1 (Logscore) & R_t 1 1 (Logscore) & R_b 1 (Logscore) & mahalanobis \\
ind_dataset & eval &  &  &  &  &  \\
\midrule
\multirow[t]{3}{*}{cifar10} & cifar100 [ood] & $0.918 \pm 0.001$ & $0.905 \pm 0.000$ & $0.912 \pm 0.001$ & $0.917 \pm 0.001$ & $0.912 \pm 0.002$ \\
 & svhn [ood] & $0.957 \pm 0.005$ & $0.943 \pm 0.012$ & $0.957 \pm 0.007$ & $0.963 \pm 0.002$ & $0.934 \pm 0.005$ \\
 & tiny_imagenet [ood] & $0.912 \pm 0.001$ & $0.896 \pm 0.000$ & $0.904 \pm 0.001$ & $0.911 \pm 0.001$ & $0.910 \pm 0.001$ \\
\cline{1-7}
\multirow[t]{3}{*}{cifar100} & cifar10 [ood] & $0.765 \pm 0.001$ & $0.725 \pm 0.001$ & $0.774 \pm 0.002$ & $0.773 \pm 0.002$ & $0.535 \pm 0.004$ \\
 & svhn [ood] & $0.870 \pm 0.006$ & $0.756 \pm 0.013$ & $0.868 \pm 0.006$ & $0.870 \pm 0.007$ & $0.679 \pm 0.034$ \\
 & tiny_imagenet [ood] & $1.000 \pm 0.000$ & $1.000 \pm 0.000$ & $1.000 \pm 0.000$ & $0.810 \pm 0.001$ & $0.623 \pm 0.005$ \\
\cl

In [15]:
# Misclassification-detection table: add the "AVG" row, reorder the columns,
# and format each cell with fmt_valvar before exporting to LaTeX.
# NOTE(review): df_miscls / df_miscls_std are overwritten here, so re-running
# this cell presumably stacks another AVG row — confirm.
avg_label = ("AVG", "[all rows]")
df_miscls = with_avg_row(df_miscls, label=avg_label)[col_order]
df_miscls_std = with_avg_row(df_miscls_std, label=avg_label)[col_order]

latex_df = fmt_valvar(
    df_miscls,
    df_miscls_std,
    mean_decimals=3,
    std_decimals=3,
    bold=False,
    underline=False,
)
latex_table = latex_df.to_latex(escape=False)
print(latex_table)

\begin{tabular}{lllllll}
\toprule
 & measure & composite eat logscore outer outer + m & R_e 1 1 (Logscore) & R_t 1 1 (Logscore) & R_b 1 (Logscore) & mahalanobis \\
ind_dataset & eval &  &  &  &  &  \\
\midrule
cifar10 & cifar10 [miscls] & \valvar{0.944}{.002} & \valvar{0.940}{.003} & \valvar{0.943}{.002} & \valvar{0.942}{.002} & \valvar{0.928}{.003} \\
\cline{1-7}
cifar100 & cifar100 [miscls] & \valvar{0.849}{.003} & \valvar{0.818}{.003} & \valvar{0.853}{.003} & \valvar{0.845}{.003} & \valvar{0.574}{.006} \\
\cline{1-7}
tiny_imagenet & tiny_imagenet [miscls] & \valvar{0.847}{.002} & \valvar{0.813}{.001} & \valvar{0.851}{.002} & \valvar{0.845}{.003} & \valvar{0.417}{.004} \\
\cline{1-7}
AVG & [all rows] & \valvar{0.880}{.002} & \valvar{0.857}{.002} & \valvar{0.882}{.002} & \valvar{0.877}{.002} & \valvar{0.639}{.004} \\
\cline{1-7}
\bottomrule
\end{tabular}



In [16]:
# Selective-prediction table: add the "AVG" row, reorder the columns, and
# format each cell with fmt_valvar before exporting to LaTeX.
# NOTE(review): df_selective / df_selective_std are overwritten here, so
# re-running this cell presumably stacks another AVG row — confirm.
avg_label = ("AVG", "[all rows]")
df_selective = with_avg_row(df_selective, label=avg_label)[col_order]
df_selective_std = with_avg_row(df_selective_std, label=avg_label)[col_order]

latex_df = fmt_valvar(
    df_selective,
    df_selective_std,
    mean_decimals=3,
    std_decimals=3,
    bold=False,
    underline=False,
)
latex_table = latex_df.to_latex(escape=False)
print(latex_table)

\begin{tabular}{lllllll}
\toprule
 & measure & composite eat logscore outer outer + m & R_e 1 1 (Logscore) & R_t 1 1 (Logscore) & R_b 1 (Logscore) & mahalanobis \\
ind_dataset & eval &  &  &  &  &  \\
\midrule
cifar10 & cifar10 [selective] & \valvar{0.997}{.000} & \valvar{0.997}{.000} & \valvar{0.997}{.000} & \valvar{0.997}{.000} & \valvar{0.996}{.000} \\
\cline{1-7}
cifar100 & cifar100 [selective] & \valvar{0.916}{.001} & \valvar{0.910}{.001} & \valvar{0.918}{.001} & \valvar{0.916}{.001} & \valvar{0.811}{.001} \\
\cline{1-7}
tiny_imagenet & tiny_imagenet [selective] & \valvar{0.886}{.001} & \valvar{0.879}{.001} & \valvar{0.891}{.000} & \valvar{0.889}{.001} & \valvar{0.660}{.005} \\
\cline{1-7}
AVG & [all rows] & \valvar{0.933}{.001} & \valvar{0.929}{.001} & \valvar{0.935}{.000} & \valvar{0.934}{.001} & \valvar{0.822}{.002} \\
\cline{1-7}
\bottomrule
\end{tabular}



In [17]:
import pandas as pd
import numpy as np

def highlight_best_and_second(s, best="#27ef56", second="#3908ed"):
    """Build per-cell CSS that marks the largest and second-largest values of ``s``.

    Intended for ``Styler.apply``: the result has one CSS string per element.

    Args:
        s: Series of comparable values (one row or column of the styled frame).
        best: Background colour for the largest value(s); also rendered bold.
        second: Background colour for the value(s) ranked second.

    Returns:
        List of CSS strings aligned with ``s``; ``""`` for missing values and
        for everything ranked third or lower.
    """
    # Competition ranking, largest first: tied values share a rank and the
    # following rank is skipped, so a tie for first leaves no "second".
    ranks = s.rank(method="min", ascending=False)
    css_by_rank = {
        1: f"background-color: {best}; font-weight: bold",
        2: f"background-color: {second}",
    }
    return [
        "" if pd.isna(value) else css_by_rank.get(rank, "")
        for value, rank in zip(s, ranks)
    ]


In [18]:
# Show every column label of transformed_df as a plain Python list.
list(transformed_df.columns)

['R_b 1 (Brier)',
 'R_b 1 (Logscore)',
 'R_b 1 (Spherical)',
 'R_b 1 (Zero-one)',
 'R_b 2 (Brier)',
 'R_b 2 (Logscore)',
 'R_b 2 (Spherical)',
 'R_b 2 (Zero-one)',
 'R_b 3 (Brier)',
 'R_b 3 (Logscore)',
 'R_b 3 (Spherical)',
 'R_b 3 (Zero-one)',
 'R_e 1 1 (Brier)',
 'R_e 1 1 (Logscore)',
 'R_e 1 1 (Spherical)',
 'R_e 1 1 (Zero-one)',
 'R_e 1 2 (Brier)',
 'R_e 1 2 (Logscore)',
 'R_e 1 2 (Spherical)',
 'R_e 1 2 (Zero-one)',
 'R_e 1 3 (Brier)',
 'R_e 1 3 (Logscore)',
 'R_e 1 3 (Spherical)',
 'R_e 1 3 (Zero-one)',
 'R_e 2 1 (Brier)',
 'R_e 2 1 (Logscore)',
 'R_e 2 1 (Spherical)',
 'R_e 2 1 (Zero-one)',
 'R_e 2 2 (Brier)',
 'R_e 2 2 (Logscore)',
 'R_e 2 2 (Spherical)',
 'R_e 2 2 (Zero-one)',
 'R_e 2 3 (Brier)',
 'R_e 2 3 (Logscore)',
 'R_e 2 3 (Spherical)',
 'R_e 2 3 (Zero-one)',
 'R_e 3 1 (Brier)',
 'R_e 3 1 (Logscore)',
 'R_e 3 1 (Spherical)',
 'R_e 3 1 (Zero-one)',
 'R_e 3 2 (Brier)',
 'R_e 3 2 (Logscore)',
 'R_e 3 2 (Spherical)',
 'R_e 3 2 (Zero-one)',
 'R_e 3 3 (Brier)',
 'R_e 3 3 (Log

In [30]:
# 'composite excess all outer outer' next to its four 'R_e 1 1' columns; per row,
# the largest value is highlighted in bold and the second largest in another colour.
# Bayes counterpart of this view: 'composite bayes all outer' with the
# 'R_b 1 (Logscore|Brier|Spherical|Zero-one)' columns.
col_order = [
    "composite excess all outer outer",
    "R_e 1 1 (Logscore)",
    "R_e 1 1 (Brier)",
    "R_e 1 1 (Spherical)",
    "R_e 1 1 (Zero-one)",
]
transformed_df[col_order].style.apply(highlight_best_and_second, axis=1)

Unnamed: 0_level_0,measure,composite excess all outer outer,R_e 1 1 (Logscore),R_e 1 1 (Brier),R_e 1 1 (Spherical),R_e 1 1 (Zero-one)
ind_dataset,eval,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1
cifar10,cifar10 [miscls],0.942233,0.94043,0.942366,0.943107,0.798849
cifar10,cifar10 [selective],0.996911,0.996843,0.996913,0.996936,0.98468
cifar10,cifar100 [ood],0.904362,0.90473,0.902342,0.904375,0.753831
cifar10,svhn [ood],0.94191,0.942616,0.940173,0.941999,0.82336
cifar10,tiny_imagenet [ood],0.895476,0.895731,0.893229,0.895592,0.751893
cifar100,cifar10 [ood],0.709955,0.724548,0.681292,0.717172,0.675933
cifar100,cifar100 [miscls],0.817947,0.818006,0.782572,0.82975,0.785608
cifar100,cifar100 [selective],0.910254,0.909667,0.899957,0.914149,0.880184
cifar100,svhn [ood],0.715296,0.755848,0.662081,0.723351,0.679433
cifar100,tiny_imagenet [ood],0.994084,0.999852,0.953406,0.991516,0.973368


In [31]:
# 'composite excess all outer inner' next to its four 'R_e 1 2' columns; per row,
# the largest value is highlighted in bold and the second largest in another colour.
# Bayes counterpart of this view: 'composite bayes all inner' with the
# 'R_b 2 (Logscore|Brier|Spherical|Zero-one)' columns.
col_order = [
    "composite excess all outer inner",
    "R_e 1 2 (Logscore)",
    "R_e 1 2 (Brier)",
    "R_e 1 2 (Spherical)",
    "R_e 1 2 (Zero-one)",
]
transformed_df[col_order].style.apply(highlight_best_and_second, axis=1)

Unnamed: 0_level_0,measure,composite excess all outer inner,R_e 1 2 (Logscore),R_e 1 2 (Brier),R_e 1 2 (Spherical),R_e 1 2 (Zero-one)
ind_dataset,eval,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1
cifar10,cifar10 [miscls],0.942911,0.941645,0.942365,0.941898,0.796675
cifar10,cifar10 [selective],0.996933,0.996886,0.996913,0.996698,0.982762
cifar10,cifar100 [ood],0.905259,0.907203,0.902342,0.902404,0.754648
cifar10,svhn [ood],0.943061,0.945786,0.940173,0.942129,0.824603
cifar10,tiny_imagenet [ood],0.896608,0.898685,0.893229,0.893123,0.752376
cifar100,cifar10 [ood],0.717831,0.736746,0.681292,0.72158,0.689059
cifar100,cifar100 [miscls],0.828895,0.831543,0.782572,0.83724,0.806319
cifar100,cifar100 [selective],0.913108,0.913284,0.899957,0.916155,0.878853
cifar100,svhn [ood],0.730109,0.77634,0.662081,0.731242,0.705718
cifar100,tiny_imagenet [ood],0.995336,0.999942,0.953406,0.994416,0.976322


In [32]:
# 'composite excess all outer central' next to its four 'R_e 1 3' columns; per row,
# the largest value is highlighted in bold and the second largest in another colour.
# Bayes counterpart of this view: 'composite bayes all central' with the
# 'R_b 3 (Logscore|Brier|Spherical|Zero-one)' columns.
col_order = [
    "composite excess all outer central",
    "R_e 1 3 (Logscore)",
    "R_e 1 3 (Brier)",
    "R_e 1 3 (Spherical)",
    "R_e 1 3 (Zero-one)",
]
transformed_df[col_order].style.apply(highlight_best_and_second, axis=1)

Unnamed: 0_level_0,measure,composite excess all outer central,R_e 1 3 (Logscore),R_e 1 3 (Brier),R_e 1 3 (Spherical),R_e 1 3 (Zero-one)
ind_dataset,eval,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1
cifar10,cifar10 [miscls],0.941534,0.936452,0.942365,0.942409,0.796675
cifar10,cifar10 [selective],0.996881,0.996693,0.996913,0.996769,0.982762
cifar10,cifar100 [ood],0.903889,0.902604,0.902342,0.903989,0.754648
cifar10,svhn [ood],0.941313,0.939684,0.940173,0.941816,0.824603
cifar10,tiny_imagenet [ood],0.895018,0.893504,0.893229,0.894407,0.752376
cifar100,cifar10 [ood],0.710276,0.718033,0.681292,0.714663,0.689059
cifar100,cifar100 [miscls],0.819044,0.8042,0.782572,0.827383,0.806319
cifar100,cifar100 [selective],0.910219,0.90564,0.899957,0.913539,0.878853
cifar100,svhn [ood],0.717968,0.749942,0.662081,0.718591,0.705718
cifar100,tiny_imagenet [ood],0.995487,0.9999,0.953406,0.989533,0.976322


In [36]:
# LaTeX export of the 'composite excess all outer central' comparison, with an
# "AVG" row appended to both the value table and the std table.
# Bayes counterpart of this view: 'composite bayes all outer' with the
# 'R_b 1 (Logscore|Brier|Spherical|Zero-one)' columns.
col_order = [
    "composite excess all outer central",
    "R_e 1 3 (Logscore)",
    "R_e 1 3 (Brier)",
    "R_e 1 3 (Spherical)",
    "R_e 1 3 (Zero-one)",
]
avg_label = ("AVG", "[all rows]")
mean_table = with_avg_row(transformed_df[col_order], label=avg_label)[col_order]
std_table = with_avg_row(std_df[col_order], label=avg_label)[col_order]

latex_df = mean_pm_std(df_mean=mean_table, df_std=std_table)
latex_table = latex_df.to_latex(escape=False)
print(latex_table)

\begin{tabular}{lllllll}
\toprule
 &  & composite excess all outer central & R_e 1 3 (Logscore) & R_e 1 3 (Brier) & R_e 1 3 (Spherical) & R_e 1 3 (Zero-one) \\
ind_dataset & eval &  &  &  &  &  \\
\midrule
\multirow[t]{5}{*}{cifar10} & cifar10 [miscls] & $0.942 \pm 0.003$ & $0.936 \pm 0.003$ & $0.942 \pm 0.003$ & $0.942 \pm 0.003$ & $0.797 \pm 0.008$ \\
 & cifar10 [selective] & $0.997 \pm 0.000$ & $0.997 \pm 0.000$ & $0.997 \pm 0.000$ & $0.997 \pm 0.000$ & $0.983 \pm 0.002$ \\
 & cifar100 [ood] & $0.904 \pm 0.000$ & $0.903 \pm 0.001$ & $0.902 \pm 0.000$ & $0.904 \pm 0.000$ & $0.755 \pm 0.001$ \\
 & svhn [ood] & $0.941 \pm 0.011$ & $0.940 \pm 0.013$ & $0.940 \pm 0.010$ & $0.942 \pm 0.010$ & $0.825 \pm 0.038$ \\
 & tiny_imagenet [ood] & $0.895 \pm 0.000$ & $0.894 \pm 0.001$ & $0.893 \pm 0.000$ & $0.894 \pm 0.001$ & $0.752 \pm 0.002$ \\
\cline{1-7}
\multirow[t]{5}{*}{cifar100} & cifar10 [ood] & $0.710 \pm 0.002$ & $0.718 \pm 0.002$ & $0.681 \pm 0.002$ & $0.715 \pm 0.002$ & $0.689 \pm 0.00

In [24]:
# The columns are spelled out here instead of read from `col_order`, so this cell
# no longer depends on which cell last assigned that variable. The list matches
# the columns shown in this cell's saved output.
bayes_outer_cols = [
    "composite bayes all outer",
    "R_b 1 (Logscore)",
    "R_b 1 (Brier)",
    "R_b 1 (Spherical)",
    "R_b 1 (Zero-one)",
]
# Per row: largest value highlighted in bold, second largest in another colour.
transformed_df[bayes_outer_cols].style.apply(highlight_best_and_second, axis=1)

Unnamed: 0_level_0,measure,composite bayes all outer,R_b 1 (Logscore),R_b 1 (Brier),R_b 1 (Spherical),R_b 1 (Zero-one)
ind_dataset,eval,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1
cifar10,cifar10 [miscls],0.942215,0.942267,0.942466,0.942228,0.941776
cifar10,cifar10 [selective],0.996821,0.996818,0.996836,0.996827,0.99681
cifar10,cifar100 [ood],0.914757,0.916906,0.914436,0.914506,0.913191
cifar10,svhn [ood],0.959149,0.962992,0.958357,0.95853,0.956294
cifar10,tiny_imagenet [ood],0.908978,0.911364,0.908611,0.908679,0.90721
cifar100,cifar10 [ood],0.77331,0.77327,0.773,0.773388,0.772177
cifar100,cifar100 [miscls],0.855261,0.845094,0.857773,0.856181,0.858986
cifar100,cifar100 [selective],0.919374,0.915943,0.920203,0.919719,0.920576
cifar100,svhn [ood],0.861924,0.87012,0.858293,0.86097,0.855937
cifar100,tiny_imagenet [ood],0.80281,0.809888,0.789521,0.806267,0.803022


In [25]:
# NOTE(review): this cell repeats the display of the preceding cell — consider
# deleting one of the two.
# The columns are spelled out here instead of read from `col_order`, so this cell
# no longer depends on which cell last assigned that variable. The list matches
# the columns shown in this cell's saved output.
bayes_outer_cols = [
    "composite bayes all outer",
    "R_b 1 (Logscore)",
    "R_b 1 (Brier)",
    "R_b 1 (Spherical)",
    "R_b 1 (Zero-one)",
]
# Per row: largest value highlighted in bold, second largest in another colour.
transformed_df[bayes_outer_cols].style.apply(highlight_best_and_second, axis=1)

Unnamed: 0_level_0,measure,composite bayes all outer,R_b 1 (Logscore),R_b 1 (Brier),R_b 1 (Spherical),R_b 1 (Zero-one)
ind_dataset,eval,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1
cifar10,cifar10 [miscls],0.942215,0.942267,0.942466,0.942228,0.941776
cifar10,cifar10 [selective],0.996821,0.996818,0.996836,0.996827,0.99681
cifar10,cifar100 [ood],0.914757,0.916906,0.914436,0.914506,0.913191
cifar10,svhn [ood],0.959149,0.962992,0.958357,0.95853,0.956294
cifar10,tiny_imagenet [ood],0.908978,0.911364,0.908611,0.908679,0.90721
cifar100,cifar10 [ood],0.77331,0.77327,0.773,0.773388,0.772177
cifar100,cifar100 [miscls],0.855261,0.845094,0.857773,0.856181,0.858986
cifar100,cifar100 [selective],0.919374,0.915943,0.920203,0.919719,0.920576
cifar100,svhn [ood],0.861924,0.87012,0.858293,0.86097,0.855937
cifar100,tiny_imagenet [ood],0.80281,0.809888,0.789521,0.806267,0.803022
