In [1]:
import pandas as pd
import itertools
import os

In [2]:
# Render floats in displayed DataFrames with a thousands separator and three decimals.
pd.options.display.float_format = "{:,.3f}".format

### Globals, Helper Functions, etc

In [3]:
# Maps the similarity-measure identifiers found in the result CSVs to the short
# labels used as row names in the displayed/exported tables.
MEASURE_NAME_DICT = {
    "AlignedCosineSimilarity": "AlignCos",
    "CKA": "CKA",
    "ConcentricityDifference": "ConcDiff",
    "DistanceCorrelation": "DistCorr",
    "EigenspaceOverlapScore": "EOS",
    "GeometryScore": "GS",
    "Gulp": "GULP",
    "HardCorrelationMatch": "HardCorr",
    "IMDScore": "IMD",
    "JaccardSimilarity": "Jaccard",
    "LinearRegression": "LinReg",
    "MagnitudeDifference": "MagDiff",
    "OrthogonalAngularShapeMetricCentered": "ShapeMet",
    "OrthogonalProcrustesCenteredAndNormalized": "OrthProc",
    "PWCCA": "PWCCA",
    "PermutationProcrustes": "PermProc",
    "ProcrustesSizeAndShapeDistance": "ProcDist",
    "RSA": "RSA",
    "RSMNormDifference": "RSMDiff",
    "RankSimilarity": "RankSim",
    "SVCCA": "SVCCA",
    "SecondOrderCosineSimilarity": "2nd-Cos",
    "SoftCorrelationMatch": "SoftCorr",
    "UniformityDifference": "UnifDiff",
}

# Display labels applied to the column labels of the pivoted tables
# (dataset names, architecture names and quality-measure names share one mapping).
PIVOT_COL_DICT = {
    "cora": "Cora",
    "flickr": "Flickr",
    "ogbn-arxiv": "OGBN-Arxiv",
    "GraphSAGE": "SAGE",
    "violation_rate": "Violation Rate",
    "correlation": "Spearman Correlation"
}

# Renames raw CSV column names to the header names used in the pivot tables.
# Both "quality_measure" and "functional_similarity_measure" become "Measure",
# so the two kinds of result files can share the same pivot code.
COLUMN_NAME_DICT = {
    "similarity_measure": "Similarity Measure", 
    "quality_measure": "Measure",
    "functional_similarity_measure": "Measure",
    "architecture": "Model",
    "representation_dataset": "Dataset"
}

# Keyword arguments forwarded to DataFrame.to_latex for every exported table.
# The column spec describes one index column followed by 18 right-aligned value
# columns in groups of three.
LATEX_FORMAT_DICT = {
    "float_format": "%.2f", 
    "column_format": "l||rrr|rrr|rrr||rrr|rrr|rrr",
    "multicolumn_format": "c",
    "index_names": False,
}

In [4]:
# Directory containing the per-experiment "*_full.csv" result files.
# The location can be overridden with the SIMILARITYBENCH_RESULTS_PATH environment
# variable so the notebook also runs on machines other than the original author's;
# when the variable is unset, the original hard-coded path is used.
EXPERIMENT_RESULTS_PATH = os.environ.get(
    "SIMILARITYBENCH_RESULTS_PATH",
    'C:/Users/Tobias/Eigene Dokumente/Research/similaritybench/experiments/results/full_csvs',
)

# Experiment name -> comparison type; the comparison type is part of the CSV file name.
COMPARISON_TYPE_DICT = {
    "label_test": "group_separation",
    "layer_test": "monotonicity",
    "augmentation_test": "group_separation",
    "shortcut_test": "group_separation"
}

# Experiment names in the insertion order of COMPARISON_TYPE_DICT.
EXPERIMENTS = list(COMPARISON_TYPE_DICT.keys())
DATASETS = ["cora", "flickr", "ogbn-arxiv"]
ARCHITECTURES = ["GCN", "GraphSAGE", "GAT"]

def FULL_DF_FILE_NAME(experiment, comparison_type, dataset, groups=5):
    """Build the file name of a full-results CSV.

    Parameters:
      - experiment: experiment name, first component of the file name.
      - comparison_type: comparison type, second component of the file name.
      - dataset: dataset name, third component of the file name.
      - groups: number of groups; values below 5 add a "_<groups>groups"
                marker before the "_full.csv" suffix, any other value adds nothing.
    Returns: the file name (no directory part).
    """
    groups_marker = f"_{groups}groups" if groups < 5 else ""
    return f"{experiment}_{comparison_type}_{dataset}{groups_marker}_full.csv"

In [5]:
def get_pivot_table(experiment, dataset):
    """Load one experiment/dataset result CSV and pivot it without aggregation.

    Parameters:
      - experiment: key of COMPARISON_TYPE_DICT; selects the comparison type
                    used in the file name.
      - dataset: dataset name used in the file name.
    Returns: DataFrame indexed by "similarity_measure" whose columns are the
             (representation_dataset, architecture, quality_measure) combinations
             and whose cells hold the "value" column.
    """
    file_name = FULL_DF_FILE_NAME(experiment, COMPARISON_TYPE_DICT[experiment], dataset)
    results = pd.read_csv(os.path.join(EXPERIMENT_RESULTS_PATH, file_name))

    needed_columns = ["similarity_measure", "quality_measure", "value", "architecture", "representation_dataset"]
    subset = results.loc[:, needed_columns]
    # DataFrame.pivot does not aggregate: duplicate index/column combinations raise.
    return subset.pivot(
        index="similarity_measure",
        columns=["representation_dataset", "architecture", "quality_measure"],
        values="value",
    )

In [6]:
def get_agg_pivot_table(experiment, datasets, groups=5):
    """Combine the result CSVs of several datasets into one labelled pivot table.

    Parameters:
      - experiment: key of COMPARISON_TYPE_DICT; selects the comparison type
                    used in the file names.
      - datasets: iterable of dataset names; one CSV is read per dataset.
      - groups: forwarded to FULL_DF_FILE_NAME to select the file variant.
    Returns: DataFrame indexed by (shortened) similarity-measure name, with
             column levels Measure / Dataset / Model; cells are the mean of
             "value" over all rows sharing the same index/column combination.
    """
    needed_columns = ["similarity_measure", "quality_measure", "value", "architecture", "representation_dataset"]
    frames = []
    for dataset in datasets:
        file_name = FULL_DF_FILE_NAME(experiment, COMPARISON_TYPE_DICT[experiment], dataset, groups)
        raw = pd.read_csv(os.path.join(EXPERIMENT_RESULTS_PATH, file_name))
        # Rows with a missing entry in any of the needed columns are discarded.
        cleaned = raw.loc[:, needed_columns].dropna()
        frames.append(cleaned.rename(columns=COLUMN_NAME_DICT))

    stacked = pd.concat(frames, axis=0)
    pivoted = stacked.pivot_table(
        index="Similarity Measure",
        columns=["Measure", "Dataset", "Model"],
        values="value",
        aggfunc="mean",
    )
    # Replace raw identifiers with display labels on both axes.
    pivoted = pivoted.rename(index=MEASURE_NAME_DICT)
    return pivoted.rename(columns=PIVOT_COL_DICT)

### Results for Group Separation Experiments

#### Random Label Test Results

In [7]:
# Random-label test with the default groups=5, for which FULL_DF_FILE_NAME selects
# the un-suffixed "*_full.csv" files; displayed only, not exported.
get_agg_pivot_table("label_test", ["cora", "flickr", "ogbn-arxiv"])

Measure,AUPRC,AUPRC,AUPRC,AUPRC,AUPRC,AUPRC,AUPRC,AUPRC,AUPRC,Violation Rate,Violation Rate,Violation Rate,Violation Rate,Violation Rate,Violation Rate,Violation Rate,Violation Rate,Violation Rate
Dataset,Cora,Cora,Cora,Flickr,Flickr,Flickr,OGBN-Arxiv,OGBN-Arxiv,OGBN-Arxiv,Cora,Cora,Cora,Flickr,Flickr,Flickr,OGBN-Arxiv,OGBN-Arxiv,OGBN-Arxiv
Model,GAT,GCN,SAGE,GAT,GCN,SAGE,GAT,GCN,SAGE,GAT,GCN,SAGE,GAT,GCN,SAGE,GAT,GCN,SAGE
Similarity Measure,Unnamed: 1_level_3,Unnamed: 2_level_3,Unnamed: 3_level_3,Unnamed: 4_level_3,Unnamed: 5_level_3,Unnamed: 6_level_3,Unnamed: 7_level_3,Unnamed: 8_level_3,Unnamed: 9_level_3,Unnamed: 10_level_3,Unnamed: 11_level_3,Unnamed: 12_level_3,Unnamed: 13_level_3,Unnamed: 14_level_3,Unnamed: 15_level_3,Unnamed: 16_level_3,Unnamed: 17_level_3,Unnamed: 18_level_3
AlignCos,0.278,0.289,0.287,0.183,0.513,0.275,0.459,0.467,0.464,0.427,0.414,0.389,0.399,0.145,0.492,0.196,0.198,0.348
CKA,0.274,0.273,0.274,0.141,0.445,0.415,0.728,0.846,0.8,0.489,0.477,0.473,0.43,0.142,0.222,0.053,0.021,0.026
ConcDiff,0.212,0.131,0.198,0.156,0.218,0.235,0.505,0.518,0.543,0.36,0.495,0.328,0.43,0.347,0.245,0.124,0.144,0.119
DistCorr,0.274,0.28,0.287,0.116,0.491,0.308,0.722,0.804,0.822,0.479,0.427,0.397,0.454,0.123,0.354,0.061,0.031,0.03
EOS,0.132,0.16,0.168,0.123,0.268,0.284,0.222,0.17,0.276,0.456,0.457,0.48,0.471,0.487,0.426,0.505,0.486,0.474
GULP,0.133,0.16,0.168,0.118,0.106,0.285,0.197,0.194,0.277,0.45,0.448,0.478,0.445,0.494,0.428,0.476,0.503,0.468
HardCorr,0.27,0.272,0.273,0.191,0.389,0.332,0.334,0.52,0.515,0.5,0.483,0.474,0.374,0.148,0.288,0.324,0.163,0.152
Jaccard,0.274,0.273,0.273,0.131,0.326,0.296,0.385,0.565,0.283,0.462,0.475,0.49,0.439,0.25,0.371,0.203,0.11,0.486
LinReg,0.286,0.282,0.284,0.125,0.13,0.326,0.297,0.279,0.367,0.399,0.411,0.429,0.482,0.53,0.3,0.437,0.431,0.33
MagDiff,0.185,0.119,0.134,0.11,0.41,0.273,0.172,0.27,0.199,0.359,0.502,0.4,0.509,0.193,0.214,0.355,0.299,0.332


In [8]:
# Random-label test, groups=3 variant (FULL_DF_FILE_NAME selects the
# "*_3groups_full.csv" files): write it to a LaTeX table and display it.
label_test_df = get_agg_pivot_table("label_test", ["cora", "flickr", "ogbn-arxiv"], groups=3)
label_test_df.to_latex("graphs_results_label_test.tex", 
                       **LATEX_FORMAT_DICT
                      )
label_test_df

Measure,AUPRC,AUPRC,AUPRC,AUPRC,AUPRC,AUPRC,AUPRC,AUPRC,AUPRC,Violation Rate,Violation Rate,Violation Rate,Violation Rate,Violation Rate,Violation Rate,Violation Rate,Violation Rate,Violation Rate
Dataset,Cora,Cora,Cora,Flickr,Flickr,Flickr,OGBN-Arxiv,OGBN-Arxiv,OGBN-Arxiv,Cora,Cora,Cora,Flickr,Flickr,Flickr,OGBN-Arxiv,OGBN-Arxiv,OGBN-Arxiv
Model,GAT,GCN,SAGE,GAT,GCN,SAGE,GAT,GCN,SAGE,GAT,GCN,SAGE,GAT,GCN,SAGE,GAT,GCN,SAGE
Similarity Measure,Unnamed: 1_level_3,Unnamed: 2_level_3,Unnamed: 3_level_3,Unnamed: 4_level_3,Unnamed: 5_level_3,Unnamed: 6_level_3,Unnamed: 7_level_3,Unnamed: 8_level_3,Unnamed: 9_level_3,Unnamed: 10_level_3,Unnamed: 11_level_3,Unnamed: 12_level_3,Unnamed: 13_level_3,Unnamed: 14_level_3,Unnamed: 15_level_3,Unnamed: 16_level_3,Unnamed: 17_level_3,Unnamed: 18_level_3
AlignCos,0.433,0.457,0.479,0.286,0.839,0.423,0.931,0.981,0.699,0.399,0.341,0.336,0.421,0.064,0.5,0.027,0.004,0.332
CKA,0.424,0.427,0.424,0.27,0.733,0.657,1.0,1.0,1.0,0.493,0.451,0.488,0.458,0.093,0.139,0.0,0.0,0.0
ConcDiff,0.394,0.203,0.391,0.208,0.366,0.57,0.997,0.964,1.0,0.261,0.455,0.219,0.519,0.277,0.152,0.001,0.008,0.0
DistCorr,0.424,0.431,0.444,0.217,0.86,0.427,1.0,1.0,1.0,0.479,0.41,0.369,0.482,0.052,0.442,0.0,0.0,0.0
EOS,0.284,0.295,0.259,0.219,0.413,0.424,0.34,0.253,0.426,0.342,0.351,0.449,0.419,0.5,0.484,0.494,0.502,0.458
GULP,0.285,0.276,0.26,0.227,0.192,0.424,0.303,0.302,0.426,0.341,0.369,0.444,0.429,0.497,0.488,0.435,0.509,0.449
HardCorr,0.424,0.425,0.424,0.332,0.771,0.457,0.544,0.828,0.828,0.492,0.473,0.489,0.333,0.059,0.321,0.234,0.033,0.033
Jaccard,0.427,0.425,0.424,0.292,0.564,0.43,0.778,0.827,0.432,0.447,0.473,0.492,0.432,0.229,0.421,0.071,0.033,0.467
LinReg,0.456,0.492,0.431,0.23,0.223,0.449,0.467,0.444,0.677,0.312,0.287,0.421,0.484,0.511,0.337,0.374,0.373,0.191
MagDiff,0.37,0.199,0.243,0.185,0.661,0.718,0.343,0.551,0.49,0.263,0.488,0.396,0.528,0.108,0.066,0.251,0.173,0.139


In [9]:
# Random-label test, groups=2 variant ("*_2groups_full.csv" files); displayed only.
get_agg_pivot_table("label_test", ["cora", "flickr", "ogbn-arxiv"], groups=2)

Measure,AUPRC,AUPRC,AUPRC,AUPRC,AUPRC,AUPRC,AUPRC,AUPRC,AUPRC,Violation Rate,Violation Rate,Violation Rate,Violation Rate,Violation Rate,Violation Rate,Violation Rate,Violation Rate,Violation Rate
Dataset,Cora,Cora,Cora,Flickr,Flickr,Flickr,OGBN-Arxiv,OGBN-Arxiv,OGBN-Arxiv,Cora,Cora,Cora,Flickr,Flickr,Flickr,OGBN-Arxiv,OGBN-Arxiv,OGBN-Arxiv
Model,GAT,GCN,SAGE,GAT,GCN,SAGE,GAT,GCN,SAGE,GAT,GCN,SAGE,GAT,GCN,SAGE,GAT,GCN,SAGE
Similarity Measure,Unnamed: 1_level_3,Unnamed: 2_level_3,Unnamed: 3_level_3,Unnamed: 4_level_3,Unnamed: 5_level_3,Unnamed: 6_level_3,Unnamed: 7_level_3,Unnamed: 8_level_3,Unnamed: 9_level_3,Unnamed: 10_level_3,Unnamed: 11_level_3,Unnamed: 12_level_3,Unnamed: 13_level_3,Unnamed: 14_level_3,Unnamed: 15_level_3,Unnamed: 16_level_3,Unnamed: 17_level_3,Unnamed: 18_level_3
AlignCos,0.636,0.726,0.696,0.518,1.0,0.586,1.0,1.0,0.587,0.282,0.208,0.252,0.406,0.0,0.5,0.0,0.0,0.496
CKA,0.586,0.595,0.586,0.393,1.0,0.969,1.0,1.0,1.0,0.5,0.432,0.5,0.478,0.0,0.014,0.0,0.0,0.0
ConcDiff,0.928,0.34,0.979,0.348,0.708,1.0,1.0,0.946,1.0,0.034,0.418,0.01,0.51,0.14,0.0,0.0,0.024,0.0
DistCorr,0.588,0.605,0.67,0.36,1.0,0.61,1.0,1.0,1.0,0.482,0.38,0.298,0.49,0.0,0.352,0.0,0.0,0.0
EOS,0.741,0.757,0.6,0.333,0.586,0.588,0.586,0.586,0.589,0.1,0.138,0.402,0.448,0.5,0.482,0.5,0.5,0.464
GULP,0.741,0.676,0.603,0.36,0.319,0.587,0.594,0.587,0.591,0.1,0.192,0.388,0.42,0.496,0.49,0.432,0.488,0.454
HardCorr,0.586,0.589,0.586,0.591,1.0,0.83,0.71,1.0,1.0,0.5,0.47,0.5,0.31,0.0,0.142,0.202,0.0,0.0
Jaccard,0.597,0.589,0.586,0.442,0.941,0.6,1.0,1.0,0.586,0.416,0.472,0.5,0.408,0.036,0.4,0.0,0.0,0.5
LinReg,0.752,0.804,0.603,0.364,0.445,0.755,0.594,0.633,0.939,0.142,0.1,0.396,0.472,0.51,0.228,0.432,0.332,0.06
MagDiff,0.861,0.353,0.464,0.296,1.0,1.0,0.555,0.328,0.761,0.056,0.46,0.256,0.526,0.0,0.0,0.198,0.512,0.098


#### Shortcut Test Results

In [10]:
# Shortcut test with the default groups=5 (un-suffixed "*_full.csv" files); displayed only.
get_agg_pivot_table("shortcut_test", ["cora", "flickr", "ogbn-arxiv"])

Measure,AUPRC,AUPRC,AUPRC,AUPRC,AUPRC,AUPRC,AUPRC,AUPRC,AUPRC,Violation Rate,Violation Rate,Violation Rate,Violation Rate,Violation Rate,Violation Rate,Violation Rate,Violation Rate,Violation Rate
Dataset,Cora,Cora,Cora,Flickr,Flickr,Flickr,OGBN-Arxiv,OGBN-Arxiv,OGBN-Arxiv,Cora,Cora,Cora,Flickr,Flickr,Flickr,OGBN-Arxiv,OGBN-Arxiv,OGBN-Arxiv
Model,GAT,GCN,SAGE,GAT,GCN,SAGE,GAT,GCN,SAGE,GAT,GCN,SAGE,GAT,GCN,SAGE,GAT,GCN,SAGE
Similarity Measure,Unnamed: 1_level_3,Unnamed: 2_level_3,Unnamed: 3_level_3,Unnamed: 4_level_3,Unnamed: 5_level_3,Unnamed: 6_level_3,Unnamed: 7_level_3,Unnamed: 8_level_3,Unnamed: 9_level_3,Unnamed: 10_level_3,Unnamed: 11_level_3,Unnamed: 12_level_3,Unnamed: 13_level_3,Unnamed: 14_level_3,Unnamed: 15_level_3,Unnamed: 16_level_3,Unnamed: 17_level_3,Unnamed: 18_level_3
AlignCos,0.117,0.145,0.211,0.251,0.372,0.467,0.895,0.855,0.635,0.495,0.402,0.249,0.339,0.124,0.11,0.009,0.022,0.119
CKA,0.226,0.134,0.303,0.166,0.146,0.659,0.83,0.732,0.525,0.403,0.402,0.198,0.434,0.45,0.04,0.02,0.028,0.118
ConcDiff,0.095,0.151,0.094,0.178,0.135,0.144,0.709,0.61,0.727,0.547,0.535,0.573,0.406,0.482,0.385,0.051,0.068,0.054
DistCorr,0.222,0.142,0.37,0.145,0.16,0.749,0.849,0.897,0.538,0.41,0.386,0.177,0.382,0.356,0.032,0.019,0.012,0.112
EOS,0.085,0.107,0.188,0.317,0.206,0.286,0.602,0.458,0.507,0.593,0.466,0.381,0.304,0.232,0.36,0.076,0.096,0.193
GULP,0.088,0.103,0.188,0.24,0.09,0.286,0.602,0.425,0.507,0.585,0.483,0.377,0.291,0.521,0.361,0.077,0.124,0.193
HardCorr,0.107,0.096,0.18,0.3,0.204,0.435,0.356,0.3,0.361,0.465,0.507,0.285,0.302,0.252,0.117,0.12,0.153,0.298
Jaccard,0.172,0.145,0.347,0.319,0.616,0.504,0.622,0.762,0.599,0.346,0.399,0.217,0.274,0.066,0.126,0.057,0.029,0.096
LinReg,0.157,0.139,0.364,0.191,0.211,0.424,0.8,0.556,0.562,0.418,0.438,0.175,0.33,0.34,0.204,0.028,0.077,0.115
MagDiff,0.091,0.137,0.091,0.113,0.177,0.606,0.704,0.356,0.525,0.543,0.533,0.572,0.509,0.357,0.139,0.051,0.245,0.154


In [11]:
# Shortcut test, groups=3 variant ("*_3groups_full.csv" files): write it to a
# LaTeX table and display it.
shortcut_test_df = get_agg_pivot_table("shortcut_test", ["cora", "flickr", "ogbn-arxiv"], groups=3)
shortcut_test_df.to_latex("graphs_results_shortcut_test.tex", 
                       **LATEX_FORMAT_DICT
                      )
shortcut_test_df

Measure,AUPRC,AUPRC,AUPRC,AUPRC,AUPRC,AUPRC,AUPRC,AUPRC,AUPRC,Violation Rate,Violation Rate,Violation Rate,Violation Rate,Violation Rate,Violation Rate,Violation Rate,Violation Rate,Violation Rate
Dataset,Cora,Cora,Cora,Flickr,Flickr,Flickr,OGBN-Arxiv,OGBN-Arxiv,OGBN-Arxiv,Cora,Cora,Cora,Flickr,Flickr,Flickr,OGBN-Arxiv,OGBN-Arxiv,OGBN-Arxiv
Model,GAT,GCN,SAGE,GAT,GCN,SAGE,GAT,GCN,SAGE,GAT,GCN,SAGE,GAT,GCN,SAGE,GAT,GCN,SAGE
Similarity Measure,Unnamed: 1_level_3,Unnamed: 2_level_3,Unnamed: 3_level_3,Unnamed: 4_level_3,Unnamed: 5_level_3,Unnamed: 6_level_3,Unnamed: 7_level_3,Unnamed: 8_level_3,Unnamed: 9_level_3,Unnamed: 10_level_3,Unnamed: 11_level_3,Unnamed: 12_level_3,Unnamed: 13_level_3,Unnamed: 14_level_3,Unnamed: 15_level_3,Unnamed: 16_level_3,Unnamed: 17_level_3,Unnamed: 18_level_3
AlignCos,0.303,0.319,0.599,0.48,0.895,1.0,1.0,1.0,1.0,0.411,0.305,0.119,0.231,0.019,0.0,0.0,0.0,0.0
CKA,0.463,0.273,0.777,0.33,0.282,1.0,1.0,1.0,0.981,0.364,0.339,0.097,0.348,0.428,0.0,0.0,0.0,0.004
ConcDiff,0.204,0.182,0.169,0.324,0.182,0.176,1.0,0.815,0.962,0.502,0.532,0.573,0.393,0.503,0.537,0.0,0.037,0.009
DistCorr,0.459,0.284,0.82,0.317,0.333,1.0,1.0,1.0,0.994,0.378,0.312,0.084,0.282,0.313,0.0,0.0,0.0,0.001
EOS,0.163,0.217,0.495,0.544,0.461,0.433,0.968,1.0,0.724,0.575,0.426,0.26,0.191,0.128,0.4,0.007,0.0,0.167
GULP,0.172,0.197,0.496,0.451,0.196,0.433,0.965,0.986,0.724,0.561,0.475,0.261,0.189,0.508,0.4,0.009,0.003,0.167
HardCorr,0.219,0.2,0.347,0.519,0.549,1.0,0.835,0.798,0.724,0.419,0.441,0.232,0.192,0.171,0.0,0.031,0.039,0.167
Jaccard,0.38,0.305,0.782,0.545,1.0,0.828,1.0,1.0,1.0,0.286,0.303,0.071,0.16,0.0,0.037,0.0,0.0,0.0
LinReg,0.334,0.299,0.742,0.357,0.365,0.609,1.0,1.0,1.0,0.376,0.383,0.053,0.277,0.297,0.189,0.0,0.0,0.0
MagDiff,0.187,0.267,0.151,0.198,0.266,0.783,1.0,0.55,0.535,0.511,0.519,0.585,0.523,0.331,0.114,0.0,0.18,0.176


In [12]:
# Shortcut test, groups=2 variant ("*_2groups_full.csv" files); displayed only.
get_agg_pivot_table("shortcut_test", ["cora", "flickr", "ogbn-arxiv"], groups=2)

Measure,AUPRC,AUPRC,AUPRC,AUPRC,AUPRC,AUPRC,AUPRC,AUPRC,AUPRC,Violation Rate,Violation Rate,Violation Rate,Violation Rate,Violation Rate,Violation Rate,Violation Rate,Violation Rate,Violation Rate
Dataset,Cora,Cora,Cora,Flickr,Flickr,Flickr,OGBN-Arxiv,OGBN-Arxiv,OGBN-Arxiv,Cora,Cora,Cora,Flickr,Flickr,Flickr,OGBN-Arxiv,OGBN-Arxiv,OGBN-Arxiv
Model,GAT,GCN,SAGE,GAT,GCN,SAGE,GAT,GCN,SAGE,GAT,GCN,SAGE,GAT,GCN,SAGE,GAT,GCN,SAGE
Similarity Measure,Unnamed: 1_level_3,Unnamed: 2_level_3,Unnamed: 3_level_3,Unnamed: 4_level_3,Unnamed: 5_level_3,Unnamed: 6_level_3,Unnamed: 7_level_3,Unnamed: 8_level_3,Unnamed: 9_level_3,Unnamed: 10_level_3,Unnamed: 11_level_3,Unnamed: 12_level_3,Unnamed: 13_level_3,Unnamed: 14_level_3,Unnamed: 15_level_3,Unnamed: 16_level_3,Unnamed: 17_level_3,Unnamed: 18_level_3
AlignCos,0.665,0.875,0.99,0.743,1.0,1.0,1.0,1.0,1.0,0.222,0.06,0.004,0.144,0.0,0.0,0.0,0.0,0.0
CKA,0.705,0.723,1.0,0.658,0.509,1.0,1.0,1.0,1.0,0.248,0.164,0.0,0.268,0.366,0.0,0.0,0.0,0.0
ConcDiff,0.314,0.281,0.312,0.49,0.35,0.359,1.0,1.0,1.0,0.488,0.572,0.56,0.424,0.47,0.522,0.0,0.0,0.0
DistCorr,0.698,0.809,1.0,0.599,0.684,1.0,1.0,1.0,1.0,0.258,0.13,0.0,0.184,0.214,0.0,0.0,0.0,0.0
EOS,0.312,0.425,0.946,0.918,1.0,0.586,1.0,1.0,1.0,0.534,0.298,0.02,0.03,0.0,0.5,0.0,0.0,0.0
GULP,0.324,0.351,0.937,0.965,0.351,0.586,1.0,1.0,1.0,0.522,0.384,0.024,0.014,0.472,0.5,0.0,0.0,0.0
HardCorr,0.435,0.424,1.0,0.992,1.0,1.0,1.0,1.0,1.0,0.262,0.306,0.0,0.004,0.0,0.0,0.0,0.0,0.0
Jaccard,0.814,0.834,1.0,1.0,1.0,1.0,1.0,1.0,1.0,0.056,0.076,0.0,0.0,0.0,0.0,0.0,0.0,0.0
LinReg,0.663,0.663,1.0,0.569,0.53,0.827,1.0,1.0,1.0,0.226,0.2,0.0,0.176,0.298,0.066,0.0,0.0,0.0
MagDiff,0.298,0.484,0.264,0.326,0.655,1.0,1.0,1.0,1.0,0.51,0.53,0.58,0.538,0.132,0.0,0.0,0.0,0.0


#### Augmentation Test Results

In [13]:
# Augmentation test with the default groups=5 (un-suffixed "*_full.csv" files); displayed only.
get_agg_pivot_table("augmentation_test", ["cora", "flickr", "ogbn-arxiv"])

Measure,AUPRC,AUPRC,AUPRC,AUPRC,AUPRC,AUPRC,AUPRC,AUPRC,AUPRC,Violation Rate,Violation Rate,Violation Rate,Violation Rate,Violation Rate,Violation Rate,Violation Rate,Violation Rate,Violation Rate
Dataset,Cora,Cora,Cora,Flickr,Flickr,Flickr,OGBN-Arxiv,OGBN-Arxiv,OGBN-Arxiv,Cora,Cora,Cora,Flickr,Flickr,Flickr,OGBN-Arxiv,OGBN-Arxiv,OGBN-Arxiv
Model,GAT,GCN,SAGE,GAT,GCN,SAGE,GAT,GCN,SAGE,GAT,GCN,SAGE,GAT,GCN,SAGE,GAT,GCN,SAGE
Similarity Measure,Unnamed: 1_level_3,Unnamed: 2_level_3,Unnamed: 3_level_3,Unnamed: 4_level_3,Unnamed: 5_level_3,Unnamed: 6_level_3,Unnamed: 7_level_3,Unnamed: 8_level_3,Unnamed: 9_level_3,Unnamed: 10_level_3,Unnamed: 11_level_3,Unnamed: 12_level_3,Unnamed: 13_level_3,Unnamed: 14_level_3,Unnamed: 15_level_3,Unnamed: 16_level_3,Unnamed: 17_level_3,Unnamed: 18_level_3
AlignCos,0.319,0.207,0.313,0.446,0.778,0.268,0.667,0.314,0.171,0.163,0.335,0.276,0.193,0.049,0.187,0.069,0.152,0.511
CKA,0.461,0.317,0.334,0.265,0.71,0.345,0.624,0.602,0.642,0.104,0.234,0.214,0.237,0.072,0.149,0.08,0.074,0.049
ConcDiff,0.296,0.105,0.302,0.256,0.208,0.178,0.287,0.177,0.248,0.272,0.493,0.356,0.269,0.342,0.387,0.251,0.299,0.24
DistCorr,0.46,0.38,0.336,0.336,0.712,0.371,0.643,0.591,0.631,0.096,0.203,0.214,0.193,0.064,0.169,0.074,0.079,0.058
EOS,0.136,0.282,0.324,0.302,0.397,0.231,0.465,0.37,0.175,0.341,0.276,0.233,0.302,0.165,0.341,0.093,0.165,0.419
GULP,0.138,0.208,0.326,0.462,0.12,0.238,0.502,0.148,0.176,0.336,0.332,0.225,0.161,0.486,0.336,0.102,0.357,0.415
HardCorr,0.277,0.243,0.322,0.444,0.69,0.305,0.184,0.139,0.148,0.32,0.279,0.24,0.168,0.072,0.222,0.389,0.502,0.424
Jaccard,0.473,0.377,0.354,0.539,0.846,0.459,0.758,0.566,0.439,0.081,0.183,0.182,0.134,0.035,0.153,0.031,0.053,0.114
LinReg,0.407,0.457,0.379,0.284,0.186,0.345,0.495,0.229,0.205,0.103,0.096,0.149,0.261,0.466,0.22,0.098,0.265,0.278
MagDiff,0.347,0.128,0.173,0.27,0.46,0.094,0.393,0.404,0.995,0.262,0.451,0.391,0.342,0.165,0.54,0.164,0.192,0.001


In [14]:
# Augmentation test, groups=3 variant ("*_3groups_full.csv" files): write it to a
# LaTeX table and display it.
aug_test_df = get_agg_pivot_table("augmentation_test", ["cora", "flickr", "ogbn-arxiv"], groups=3)
aug_test_df.to_latex("graphs_results_augmentation_test.tex", 
                       **LATEX_FORMAT_DICT
                      )
aug_test_df

Measure,AUPRC,AUPRC,AUPRC,AUPRC,AUPRC,AUPRC,AUPRC,AUPRC,AUPRC,Violation Rate,Violation Rate,Violation Rate,Violation Rate,Violation Rate,Violation Rate,Violation Rate,Violation Rate,Violation Rate
Dataset,Cora,Cora,Cora,Flickr,Flickr,Flickr,OGBN-Arxiv,OGBN-Arxiv,OGBN-Arxiv,Cora,Cora,Cora,Flickr,Flickr,Flickr,OGBN-Arxiv,OGBN-Arxiv,OGBN-Arxiv
Model,GAT,GCN,SAGE,GAT,GCN,SAGE,GAT,GCN,SAGE,GAT,GCN,SAGE,GAT,GCN,SAGE,GAT,GCN,SAGE
Similarity Measure,Unnamed: 1_level_3,Unnamed: 2_level_3,Unnamed: 3_level_3,Unnamed: 4_level_3,Unnamed: 5_level_3,Unnamed: 6_level_3,Unnamed: 7_level_3,Unnamed: 8_level_3,Unnamed: 9_level_3,Unnamed: 10_level_3,Unnamed: 11_level_3,Unnamed: 12_level_3,Unnamed: 13_level_3,Unnamed: 14_level_3,Unnamed: 15_level_3,Unnamed: 16_level_3,Unnamed: 17_level_3,Unnamed: 18_level_3
AlignCos,0.908,0.51,0.635,0.544,0.686,0.698,1.0,0.736,0.427,0.022,0.217,0.119,0.192,0.13,0.099,0.0,0.129,0.464
CKA,0.906,0.697,0.731,0.508,0.572,0.747,0.987,0.997,1.0,0.035,0.103,0.081,0.264,0.173,0.088,0.003,0.001,0.0
ConcDiff,0.623,0.174,0.504,0.534,0.412,0.348,0.508,0.426,0.533,0.133,0.508,0.219,0.258,0.221,0.319,0.16,0.24,0.196
DistCorr,0.891,0.785,0.732,0.609,0.602,0.794,0.989,1.0,1.0,0.035,0.071,0.088,0.188,0.162,0.059,0.003,0.0,0.0
EOS,0.342,0.535,0.618,0.459,0.679,0.529,1.0,0.819,0.488,0.248,0.143,0.104,0.297,0.125,0.203,0.0,0.035,0.25
GULP,0.349,0.448,0.612,0.555,0.223,0.542,1.0,0.557,0.484,0.237,0.21,0.109,0.161,0.477,0.191,0.0,0.195,0.255
HardCorr,0.513,0.512,0.633,0.571,0.712,0.716,0.536,0.466,0.506,0.195,0.151,0.105,0.149,0.106,0.084,0.208,0.413,0.232
Jaccard,0.953,0.781,0.807,0.58,0.743,0.88,1.0,1.0,0.991,0.016,0.096,0.054,0.159,0.115,0.027,0.0,0.0,0.002
LinReg,0.872,0.943,0.85,0.338,0.302,0.805,0.809,0.724,0.724,0.048,0.017,0.037,0.309,0.473,0.067,0.07,0.165,0.166
MagDiff,0.535,0.204,0.39,0.43,0.588,0.174,0.693,0.771,1.0,0.173,0.485,0.258,0.341,0.132,0.551,0.094,0.067,0.0


In [15]:
# Augmentation test, groups=2 variant ("*_2groups_full.csv" files); displayed only.
get_agg_pivot_table("augmentation_test", ["cora", "flickr", "ogbn-arxiv"], groups=2)

Measure,AUPRC,AUPRC,AUPRC,AUPRC,AUPRC,AUPRC,AUPRC,AUPRC,AUPRC,Violation Rate,Violation Rate,Violation Rate,Violation Rate,Violation Rate,Violation Rate,Violation Rate,Violation Rate,Violation Rate
Dataset,Cora,Cora,Cora,Flickr,Flickr,Flickr,OGBN-Arxiv,OGBN-Arxiv,OGBN-Arxiv,Cora,Cora,Cora,Flickr,Flickr,Flickr,OGBN-Arxiv,OGBN-Arxiv,OGBN-Arxiv
Model,GAT,GCN,SAGE,GAT,GCN,SAGE,GAT,GCN,SAGE,GAT,GCN,SAGE,GAT,GCN,SAGE,GAT,GCN,SAGE
Similarity Measure,Unnamed: 1_level_3,Unnamed: 2_level_3,Unnamed: 3_level_3,Unnamed: 4_level_3,Unnamed: 5_level_3,Unnamed: 6_level_3,Unnamed: 7_level_3,Unnamed: 8_level_3,Unnamed: 9_level_3,Unnamed: 10_level_3,Unnamed: 11_level_3,Unnamed: 12_level_3,Unnamed: 13_level_3,Unnamed: 14_level_3,Unnamed: 15_level_3,Unnamed: 16_level_3,Unnamed: 17_level_3,Unnamed: 18_level_3
AlignCos,1.0,0.979,0.99,0.899,1.0,1.0,1.0,1.0,0.593,0.0,0.01,0.004,0.048,0.0,0.0,0.0,0.0,0.438
CKA,1.0,1.0,1.0,0.827,0.995,1.0,1.0,1.0,1.0,0.0,0.0,0.0,0.108,0.002,0.0,0.0,0.0,0.0
ConcDiff,0.906,0.306,0.88,0.808,0.882,0.517,0.784,0.899,0.988,0.05,0.474,0.088,0.208,0.066,0.248,0.108,0.05,0.006
DistCorr,1.0,1.0,1.0,0.924,1.0,1.0,1.0,1.0,1.0,0.0,0.0,0.0,0.042,0.0,0.0,0.0,0.0,0.0
EOS,0.995,0.995,1.0,0.671,0.946,1.0,1.0,1.0,1.0,0.002,0.002,0.0,0.186,0.03,0.0,0.0,0.0,0.0
GULP,0.995,0.808,1.0,1.0,0.36,1.0,1.0,0.797,1.0,0.002,0.08,0.0,0.0,0.44,0.0,0.0,0.074,0.0
HardCorr,0.986,1.0,1.0,0.99,1.0,1.0,0.995,0.586,1.0,0.008,0.0,0.0,0.004,0.0,0.0,0.002,0.5,0.0
Jaccard,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
LinReg,1.0,1.0,1.0,0.754,0.347,1.0,1.0,1.0,1.0,0.0,0.0,0.0,0.132,0.476,0.0,0.0,0.0,0.0
MagDiff,1.0,0.36,0.447,0.627,1.0,0.32,1.0,1.0,1.0,0.0,0.516,0.298,0.308,0.0,0.546,0.0,0.0,0.0


#### Layer Monotonicity Test Results

In [16]:
# Layer monotonicity test with the default groups=5 (un-suffixed "*_full.csv"
# files): write it to a LaTeX table and display it.
layer_test_df = get_agg_pivot_table("layer_test", ["cora", "flickr", "ogbn-arxiv"])
layer_test_df.to_latex("graphs_results_layer_test.tex", 
                       **LATEX_FORMAT_DICT
                      )
layer_test_df

Measure,Spearman Correlation,Spearman Correlation,Spearman Correlation,Spearman Correlation,Spearman Correlation,Spearman Correlation,Spearman Correlation,Spearman Correlation,Spearman Correlation,Violation Rate,Violation Rate,Violation Rate,Violation Rate,Violation Rate,Violation Rate,Violation Rate,Violation Rate,Violation Rate
Dataset,Cora,Cora,Cora,Flickr,Flickr,Flickr,OGBN-Arxiv,OGBN-Arxiv,OGBN-Arxiv,Cora,Cora,Cora,Flickr,Flickr,Flickr,OGBN-Arxiv,OGBN-Arxiv,OGBN-Arxiv
Model,GAT,GCN,SAGE,GAT,GCN,SAGE,GAT,GCN,SAGE,GAT,GCN,SAGE,GAT,GCN,SAGE,GAT,GCN,SAGE
Similarity Measure,Unnamed: 1_level_3,Unnamed: 2_level_3,Unnamed: 3_level_3,Unnamed: 4_level_3,Unnamed: 5_level_3,Unnamed: 6_level_3,Unnamed: 7_level_3,Unnamed: 8_level_3,Unnamed: 9_level_3,Unnamed: 10_level_3,Unnamed: 11_level_3,Unnamed: 12_level_3,Unnamed: 13_level_3,Unnamed: 14_level_3,Unnamed: 15_level_3,Unnamed: 16_level_3,Unnamed: 17_level_3,Unnamed: 18_level_3
AlignCos,1.0,0.98,1.0,0.04,0.327,0.68,0.837,0.843,0.933,0.0,0.03,0.0,0.54,0.41,0.23,0.11,0.17,0.07
CKA,1.0,0.98,1.0,0.387,0.603,0.89,0.96,0.85,0.457,0.0,0.02,0.0,0.41,0.21,0.08,0.05,0.13,0.36
ConcDiff,0.403,0.85,0.25,0.243,0.383,-0.273,0.397,0.733,0.39,0.38,0.15,0.48,0.42,0.43,0.64,0.33,0.3,0.26
DistCorr,1.0,1.0,1.0,0.467,0.63,0.993,0.933,0.807,0.523,0.0,0.0,0.0,0.37,0.19,0.01,0.08,0.12,0.35
EOS,1.0,1.0,1.0,0.917,1.0,1.0,1.0,1.0,1.0,0.0,0.0,0.0,0.08,0.0,0.0,0.0,0.0,0.0
GULP,1.0,1.0,1.0,0.33,0.54,1.0,1.0,0.733,1.0,0.0,0.0,0.0,0.28,0.17,0.0,0.0,0.18,0.0
HardCorr,0.54,0.833,0.983,0.213,0.627,0.803,1.0,0.833,0.62,0.24,0.09,0.01,0.32,0.19,0.16,0.0,0.14,0.28
Jaccard,1.0,1.0,1.0,0.953,0.95,0.973,1.0,0.973,0.987,0.0,0.0,0.0,0.04,0.06,0.04,0.0,0.04,0.02
LinReg,1.0,1.0,1.0,0.03,0.45,1.0,1.0,0.993,1.0,0.0,0.0,0.0,0.41,0.33,0.0,0.0,0.01,0.0
MagDiff,0.893,0.55,0.49,0.383,0.583,0.5,0.633,0.06,0.29,0.08,0.37,0.28,0.42,0.35,0.37,0.13,0.48,0.29


### Results of Output Correlations

In [17]:
def OUTPUT_DF_FILE_NAME(dataset):
    """Return the file name of the output-correlation results CSV for `dataset`."""
    file_name = f"output_correlation_test_{dataset}_full.csv"
    return file_name

In [18]:
def get_output_correlation_table(datasets, corr_func="spearmanr", acc_test = False):
    """Build the pivot table of output-correlation results for several datasets.

    Parameters:
      - datasets: iterable of dataset names; one CSV is read per dataset and the
                  dataset name is attached to its rows as the "Dataset" column.
      - corr_func: only rows whose "quality_measure" equals this value are kept.
      - acc_test: if True return only the "AbsoluteAccDiff" measure, otherwise
                  return the "Disagreement" and "JSD" measures.
    Returns: DataFrame indexed by (shortened) similarity-measure name; cells are
             the mean of "corr" per Measure / Dataset / Model combination.
    """
    needed_columns = ["similarity_measure", "functional_similarity_measure", "corr", "architecture"]
    frames = []
    for dataset in datasets:
        raw = pd.read_csv(os.path.join(EXPERIMENT_RESULTS_PATH, OUTPUT_DF_FILE_NAME(dataset)))
        matching = raw.loc[raw["quality_measure"] == corr_func, needed_columns]
        labelled = matching.rename(columns=COLUMN_NAME_DICT)
        labelled["Dataset"] = dataset
        frames.append(labelled)

    stacked = pd.concat(frames, axis=0)
    pivoted = stacked.pivot_table(
        index="Similarity Measure",
        columns=["Measure", "Dataset", "Model"],
        values="corr",
        aggfunc="mean",
    )
    # Replace raw identifiers with display labels on both axes.
    pivoted = pivoted.rename(index=MEASURE_NAME_DICT).rename(columns=PIVOT_COL_DICT)

    # A scalar key drops the top "Measure" level, a list key keeps it.
    measure_key = "AbsoluteAccDiff" if acc_test else ["Disagreement", "JSD"]
    return pivoted.loc[:, measure_key]

In [19]:
# Correlations with the "Disagreement" and "JSD" measures (default corr_func="spearmanr"):
# write them to a LaTeX table and display them.
output_corr_df = get_output_correlation_table(["cora", "flickr", "ogbn-arxiv"])
output_corr_df.to_latex("graphs_results_output_correlation_test.tex", 
                       **LATEX_FORMAT_DICT
                      )
output_corr_df

Measure,Disagreement,Disagreement,Disagreement,Disagreement,Disagreement,Disagreement,Disagreement,Disagreement,Disagreement,JSD,JSD,JSD,JSD,JSD,JSD,JSD,JSD,JSD
Dataset,Cora,Cora,Cora,Flickr,Flickr,Flickr,OGBN-Arxiv,OGBN-Arxiv,OGBN-Arxiv,Cora,Cora,Cora,Flickr,Flickr,Flickr,OGBN-Arxiv,OGBN-Arxiv,OGBN-Arxiv
Model,GAT,GCN,SAGE,GAT,GCN,SAGE,GAT,GCN,SAGE,GAT,GCN,SAGE,GAT,GCN,SAGE,GAT,GCN,SAGE
Similarity Measure,Unnamed: 1_level_3,Unnamed: 2_level_3,Unnamed: 3_level_3,Unnamed: 4_level_3,Unnamed: 5_level_3,Unnamed: 6_level_3,Unnamed: 7_level_3,Unnamed: 8_level_3,Unnamed: 9_level_3,Unnamed: 10_level_3,Unnamed: 11_level_3,Unnamed: 12_level_3,Unnamed: 13_level_3,Unnamed: 14_level_3,Unnamed: 15_level_3,Unnamed: 16_level_3,Unnamed: 17_level_3,Unnamed: 18_level_3
AlignCos,-0.051,-0.084,0.271,-0.083,0.147,0.374,0.166,-0.098,0.001,0.174,0.017,0.384,-0.013,0.306,0.443,0.275,-0.026,0.05
CKA,0.445,0.363,0.001,0.061,-0.211,0.534,0.227,0.029,-0.041,0.535,0.435,-0.031,0.166,0.029,0.576,0.381,0.119,-0.021
ConcDiff,0.03,-0.038,-0.097,0.029,-0.214,-0.043,-0.16,-0.254,0.072,0.014,0.032,0.041,0.028,-0.172,-0.034,-0.215,-0.13,0.024
DistCorr,0.456,0.529,-0.078,-0.031,0.172,0.395,0.204,0.11,0.081,0.601,0.597,0.053,0.031,0.456,0.431,0.361,0.163,0.122
EOS,-0.088,0.127,0.023,0.231,0.025,0.334,0.119,-0.255,-0.023,-0.036,0.168,0.224,0.114,-0.027,0.385,0.369,-0.166,0.115
GULP,-0.129,-0.165,-0.09,-0.006,0.029,0.334,0.099,0.154,-0.037,-0.042,-0.096,0.182,0.128,0.149,0.383,0.353,0.098,0.106
HardCorr,0.261,0.454,0.104,-0.093,0.395,0.458,0.239,0.02,-0.241,0.516,0.479,0.162,0.095,0.534,0.505,0.46,-0.046,-0.276
Jaccard,0.12,0.436,0.333,-0.004,0.037,0.419,0.219,0.142,0.012,0.379,0.441,0.453,0.107,0.331,0.421,0.367,0.2,0.09
LinReg,-0.062,0.574,0.09,0.063,0.119,0.457,0.221,-0.099,-0.188,0.19,0.58,0.331,0.176,0.152,0.477,0.465,-0.089,-0.166
MagDiff,-0.069,-0.073,-0.253,-0.198,0.056,0.065,0.216,-0.252,-0.195,-0.145,0.004,0.063,-0.262,0.032,0.056,0.079,-0.126,-0.127


In [20]:
# Correlations with the "AbsoluteAccDiff" measure only.
acc_corr_df = get_output_correlation_table(["cora", "flickr", "ogbn-arxiv"], acc_test=True)
# This table holds a single measure, i.e. 9 value columns instead of the 18 that
# LATEX_FORMAT_DICT["column_format"] describes, so the column spec is overridden
# here to match the actual table width.
acc_corr_df.to_latex("graphs_results_accuracy_correlation_test.tex",
                     **{**LATEX_FORMAT_DICT, "column_format": "l||rrr|rrr|rrr"}
                    )
acc_corr_df

Dataset,Cora,Cora,Cora,Flickr,Flickr,Flickr,OGBN-Arxiv,OGBN-Arxiv,OGBN-Arxiv
Model,GAT,GCN,SAGE,GAT,GCN,SAGE,GAT,GCN,SAGE
Similarity Measure,Unnamed: 1_level_2,Unnamed: 2_level_2,Unnamed: 3_level_2,Unnamed: 4_level_2,Unnamed: 5_level_2,Unnamed: 6_level_2,Unnamed: 7_level_2,Unnamed: 8_level_2,Unnamed: 9_level_2
AlignCos,-0.369,-0.188,0.154,0.088,0.173,0.388,-0.185,-0.069,0.201
CKA,-0.08,-0.31,-0.134,-0.095,-0.15,0.372,-0.129,0.04,0.056
ConcDiff,-0.098,-0.021,-0.213,0.078,-0.11,-0.06,-0.191,-0.247,-0.004
DistCorr,-0.112,-0.299,-0.126,-0.041,0.2,0.36,-0.127,0.138,0.01
EOS,-0.002,0.29,0.085,0.399,0.227,0.224,0.048,-0.05,0.01
GULP,-0.037,0.245,0.085,-0.087,0.041,0.215,0.052,-0.185,-0.013
HardCorr,-0.261,0.03,-0.116,-0.145,0.177,0.323,0.064,0.132,-0.04
Jaccard,-0.226,-0.042,-0.1,-0.057,0.079,0.074,-0.145,-0.275,-0.132
LinReg,-0.205,0.009,-0.206,-0.115,-0.228,0.277,0.049,-0.229,-0.021
MagDiff,-0.073,0.051,-0.106,0.101,0.178,-0.006,-0.101,-0.214,0.033


### CD Plots

In [21]:
# autorank package needed for creation of CD plots 
from autorank import autorank, plot_stats, create_report, latex_table
from autorank._util import *
from matplotlib import pyplot as plt

In [22]:
def get_figsize(columnwidth, wf=0.5, hf=(5. ** 0.5 - 1.0) / 2.0):
    r"""Convert a LaTeX width in points into a matplotlib figure size in inches.

    Credit: https://stackoverflow.com/a/31527287

    Parameters:
      - columnwidth [float]: width of the column in latex. Get this from LaTeX
                             using \showthe\columnwidth
      - wf [float]:  width fraction in columnwidth units
      - hf [float]:  height as a fraction of the resulting figure width.
                     Set by default to golden ratio.
    Returns:  (fig_width, fig_height) in inches, to be given to matplotlib
    """
    # NOTE: the docstring is a raw string because "\s" and "\c" are not valid
    # escape sequences in a regular string literal.
    fig_width_pt = columnwidth * wf
    inches_per_pt = 1.0 / 72.27  # Convert pt to inch (72.27 pt per inch)
    fig_width = fig_width_pt * inches_per_pt  # width in inches
    fig_height = fig_width * hf  # height in inches
    return fig_width, fig_height

# Base width in LaTeX points that is passed to get_figsize as `columnwidth`
# (presumably the text/column width of the target document — TODO confirm).
PLOTS_BASE_WIDTH = 433.62  # pt
# CD plot size in inches: 1.5x the base width, height from the default golden-ratio factor.
PLOTS_CD_WIDTH, PLOTS_CD_HEIGHT = get_figsize(PLOTS_BASE_WIDTH, wf=1.5)

In [23]:
def get_autorank_df(experiments=EXPERIMENTS, datasets=DATASETS, quality_measure = "violation_rate"):
    """Collect one score block per test into a single wide table.

    For every experiment the block is the "Spearman Correlation" sub-table for
    "layer_test" and the "AUPRC" sub-table otherwise. The "JSD" output-correlation
    block and the accuracy-correlation block are appended last. Rows containing
    missing values are dropped from each block before the blocks are joined
    side by side.

    Parameters:
      - experiments: experiment names passed to get_agg_pivot_table.
      - datasets: dataset names passed to the table builders.
      - quality_measure: accepted for interface compatibility; it is not used
                         by this function.
    Returns: DataFrame indexed by similarity measure with all blocks as columns.
    """
    blocks = []
    for experiment in experiments:
        pivot = get_agg_pivot_table(experiment, datasets)
        score_name = "Spearman Correlation" if experiment == "layer_test" else "AUPRC"
        blocks.append(pivot.loc[:, score_name].dropna())

    # dropna is applied to the full Disagreement+JSD table before JSD is selected.
    output_corr = get_output_correlation_table(datasets).dropna()
    blocks.append(output_corr.loc[:, "JSD"])

    accuracy_corr = get_output_correlation_table(datasets, acc_test=True).dropna()
    blocks.append(accuracy_corr)

    return pd.concat(blocks, axis=1)


In [24]:
# Preview of the combined score table (similarity measures as rows, one column per
# test/dataset/model combination).
get_autorank_df(datasets=["cora", "flickr", "ogbn-arxiv"])

Dataset,Cora,Cora,Cora,Flickr,Flickr,Flickr,OGBN-Arxiv,OGBN-Arxiv,OGBN-Arxiv,Cora,...,OGBN-Arxiv,Cora,Cora,Cora,Flickr,Flickr,Flickr,OGBN-Arxiv,OGBN-Arxiv,OGBN-Arxiv
Model,GAT,GCN,SAGE,GAT,GCN,SAGE,GAT,GCN,SAGE,GAT,...,SAGE,GAT,GCN,SAGE,GAT,GCN,SAGE,GAT,GCN,SAGE
Similarity Measure,Unnamed: 1_level_2,Unnamed: 2_level_2,Unnamed: 3_level_2,Unnamed: 4_level_2,Unnamed: 5_level_2,Unnamed: 6_level_2,Unnamed: 7_level_2,Unnamed: 8_level_2,Unnamed: 9_level_2,Unnamed: 10_level_2,Unnamed: 11_level_2,Unnamed: 12_level_2,Unnamed: 13_level_2,Unnamed: 14_level_2,Unnamed: 15_level_2,Unnamed: 16_level_2,Unnamed: 17_level_2,Unnamed: 18_level_2,Unnamed: 19_level_2,Unnamed: 20_level_2,Unnamed: 21_level_2
AlignCos,0.278,0.289,0.287,0.183,0.513,0.275,0.459,0.467,0.464,1.0,...,0.05,-0.369,-0.188,0.154,0.088,0.173,0.388,-0.185,-0.069,0.201
CKA,0.274,0.273,0.274,0.141,0.445,0.415,0.728,0.846,0.8,1.0,...,-0.021,-0.08,-0.31,-0.134,-0.095,-0.15,0.372,-0.129,0.04,0.056
ConcDiff,0.212,0.131,0.198,0.156,0.218,0.235,0.505,0.518,0.543,0.403,...,0.024,-0.098,-0.021,-0.213,0.078,-0.11,-0.06,-0.191,-0.247,-0.004
DistCorr,0.274,0.28,0.287,0.116,0.491,0.308,0.722,0.804,0.822,1.0,...,0.122,-0.112,-0.299,-0.126,-0.041,0.2,0.36,-0.127,0.138,0.01
EOS,0.132,0.16,0.168,0.123,0.268,0.284,0.222,0.17,0.276,1.0,...,0.115,-0.002,0.29,0.085,0.399,0.227,0.224,0.048,-0.05,0.01
GULP,0.133,0.16,0.168,0.118,0.106,0.285,0.197,0.194,0.277,1.0,...,0.106,-0.037,0.245,0.085,-0.087,0.041,0.215,0.052,-0.185,-0.013
HardCorr,0.27,0.272,0.273,0.191,0.389,0.332,0.334,0.52,0.515,0.54,...,-0.276,-0.261,0.03,-0.116,-0.145,0.177,0.323,0.064,0.132,-0.04
Jaccard,0.274,0.273,0.273,0.131,0.326,0.296,0.385,0.565,0.283,1.0,...,0.09,-0.226,-0.042,-0.1,-0.057,0.079,0.074,-0.145,-0.275,-0.132
LinReg,0.286,0.282,0.284,0.125,0.13,0.326,0.297,0.279,0.367,1.0,...,-0.166,-0.205,0.009,-0.206,-0.115,-0.228,0.277,0.049,-0.229,-0.021
MagDiff,0.185,0.119,0.134,0.11,0.41,0.273,0.172,0.27,0.199,0.893,...,-0.127,-0.073,0.051,-0.106,0.101,0.178,-0.006,-0.101,-0.214,0.033


In [32]:
# autorank expects one column per compared method, so the table is transposed:
# similarity measures become the columns and each row is one score column of
# the combined table.
res_df = get_autorank_df().T.reset_index(drop=True)
result = autorank(res_df, alpha=0.05, verbose=False)
# cd_diagram is provided by the wildcard import from autorank._util.
cd_diagram(result, False, None, PLOTS_CD_WIDTH)
fig = plt.gcf()
fig.set_size_inches(PLOTS_CD_WIDTH, PLOTS_CD_HEIGHT)
plt.savefig("cd_plot_graphs.png", bbox_inches="tight")
# Close exactly the figure that was sized and saved above.
plt.close(fig)

  if abs(sorted_ranks[i] - sorted_ranks[j]) <= critical_difference:
  plot_line([(rankpos(sorted_ranks[i]), cline),
  (rankpos(sorted_ranks[i]), chei),
  plot_line([(rankpos(sorted_ranks[i]), cline),
  (rankpos(sorted_ranks[i]), chei),
  plot_line([(rankpos(sorted_ranks[l]) - side, start),
  (rankpos(sorted_ranks[r]) + side, start)],


In [29]:
# Sanity check of the matrix handed to autorank: (number of score columns, number of similarity measures).
get_autorank_df().T.reset_index(drop=True).shape

(54, 20)