In [1]:
import pandas as pd
import itertools
import os

### Results for Group Separation and Monotonicity Experiments

In [2]:
# Directory that holds the per-experiment result CSVs. Set the
# SIMILARITYBENCH_RESULTS_PATH environment variable to point the notebook at a
# different location without editing this cell; the original machine-specific
# path is kept as the fallback so existing setups keep working.
EXPERIMENT_RESULTS_PATH = os.environ.get(
    "SIMILARITYBENCH_RESULTS_PATH",
    'C:/Users/Tobias/Eigene Dokumente/Research/similaritybench/experiments/results',
)

# Experiment name -> comparison type; the comparison type is part of the name
# of each experiment's result file.
COMPARISON_TYPE_DICT = {
    "label_test": "group_separation",
    "layer_test": "monotonicity",
    "augmentation_test": "group_separation",
    "shortcut_test": "group_separation",
}

EXPERIMENTS = list(COMPARISON_TYPE_DICT.keys())
DATASETS = ["cora", "flickr", "ogbn-arxiv"]
ARCHITECTURES = ["GCN", "GraphSAGE", "GAT"]

def FULL_DF_FILE_NAME(experiment, comparison_type, dataset, groups=5, reduced=False):
    """Build the file name of the full-results CSV for one experiment and dataset.

    Args:
        experiment: Experiment name, e.g. "label_test".
        comparison_type: Comparison type, e.g. "group_separation".
        dataset: Dataset name, e.g. "cora".
        groups: Group count embedded in the name of a reduced-results file.
            Only used when `reduced` is true.
        reduced: When true, return the name that carries the
            `{groups}groups` suffix; otherwise return the plain name.

    Returns:
        The bare file name (no directory component).
    """
    # `reduced` used to be read as a free variable, which raised NameError on a
    # fresh kernel; it is now an explicit keyword defaulting to the plain name.
    stem = f"{experiment}_{comparison_type}_{dataset}"
    if reduced:
        return f"{stem}_{groups}groups_full.csv"
    return f"{stem}_full.csv"

In [3]:
def get_pivot_table(experiment, dataset):
    """Load one experiment's result CSV for a single dataset and pivot it.

    The file is located under EXPERIMENT_RESULTS_PATH using FULL_DF_FILE_NAME
    and the comparison type registered for `experiment` in
    COMPARISON_TYPE_DICT.

    Returns:
        A DataFrame indexed by "similarity_measure" whose columns are the
        (representation_dataset, architecture, quality_measure) combinations
        and whose cells are taken from the "value" column. `DataFrame.pivot`
        is used here, so no aggregation function is applied.
    """
    file_name = FULL_DF_FILE_NAME(experiment, COMPARISON_TYPE_DICT[experiment], dataset)
    results = pd.read_csv(os.path.join(EXPERIMENT_RESULTS_PATH, file_name))

    kept_columns = ["similarity_measure", "quality_measure", "value", "architecture", "representation_dataset"]
    column_levels = ["representation_dataset", "architecture", "quality_measure"]

    selected = results.loc[:, kept_columns]
    return selected.pivot(index="similarity_measure", columns=column_levels, values="value")

In [4]:
def get_agg_pivot_table(experiment, datasets, groups=5, reduced=False):
    """Load an experiment's result CSVs for several datasets and pivot their mean.

    Args:
        experiment: Experiment name; must be a key of COMPARISON_TYPE_DICT.
        datasets: Iterable of dataset names; one result file is read per entry.
        groups: Group count passed through to FULL_DF_FILE_NAME.
        reduced: When true, ask FULL_DF_FILE_NAME for the reduced-results file
            name instead of the plain one.

    Returns:
        A DataFrame indexed by "similarity_measure" whose columns are the
        (representation_dataset, architecture, quality_measure) combinations
        and whose cells are the mean of "value" over all matching rows.
    """
    # Forward `reduced` only when it was requested, so the default call stays
    # the same four-argument call to FULL_DF_FILE_NAME as before.
    name_options = {"reduced": True} if reduced else {}
    comparison_type = COMPARISON_TYPE_DICT[experiment]
    kept_columns = ["similarity_measure", "quality_measure", "value", "architecture", "representation_dataset"]

    frames = []
    for dataset in datasets:
        file_name = FULL_DF_FILE_NAME(experiment, comparison_type, dataset, groups, **name_options)
        results = pd.read_csv(os.path.join(EXPERIMENT_RESULTS_PATH, file_name))
        frames.append(results.loc[:, kept_columns])

    combined = pd.concat(frames, axis=0)
    return combined.pivot_table(
        index="similarity_measure",
        columns=["representation_dataset", "architecture", "quality_measure"],
        values="value",
        aggfunc="mean",
    )

In [5]:
# Label test: mean "value" per similarity measure over every dataset in DATASETS.
get_agg_pivot_table("label_test", DATASETS)

representation_dataset,cora,cora,cora,cora,cora,cora,flickr,flickr,flickr,flickr,flickr,flickr,ogbn-arxiv,ogbn-arxiv,ogbn-arxiv,ogbn-arxiv,ogbn-arxiv,ogbn-arxiv
architecture,GAT,GAT,GCN,GCN,GraphSAGE,GraphSAGE,GAT,GAT,GCN,GCN,GraphSAGE,GraphSAGE,GAT,GAT,GCN,GCN,GraphSAGE,GraphSAGE
quality_measure,AUPRC,violation_rate,AUPRC,violation_rate,AUPRC,violation_rate,AUPRC,violation_rate,AUPRC,violation_rate,AUPRC,violation_rate,AUPRC,violation_rate,AUPRC,violation_rate,AUPRC,violation_rate
similarity_measure,Unnamed: 1_level_3,Unnamed: 2_level_3,Unnamed: 3_level_3,Unnamed: 4_level_3,Unnamed: 5_level_3,Unnamed: 6_level_3,Unnamed: 7_level_3,Unnamed: 8_level_3,Unnamed: 9_level_3,Unnamed: 10_level_3,Unnamed: 11_level_3,Unnamed: 12_level_3,Unnamed: 13_level_3,Unnamed: 14_level_3,Unnamed: 15_level_3,Unnamed: 16_level_3,Unnamed: 17_level_3,Unnamed: 18_level_3
AlignedCosineSimilarity,0.277452,0.447,0.296727,0.3768,0.281042,0.4118,0.141449,0.4726,0.461096,0.1504,0.277374,0.489,0.462207,0.198,0.471147,0.2198,0.436345,0.3446
CKA,0.274583,0.4866,0.273912,0.4736,0.274771,0.4686,0.129954,0.4808,0.342134,0.1608,0.43229,0.2202,0.726076,0.054,0.865779,0.0166,0.831647,0.0266
ConcentricityDifference,0.183074,0.3736,0.136865,0.4066,0.162598,0.3874,0.115978,0.4802,0.125012,0.4692,0.291945,0.2494,0.41341,0.167,0.327325,0.1946,0.569148,0.1006
DistanceCorrelation,0.274829,0.4788,0.281172,0.427,0.289221,0.3882,0.121305,0.474,0.421418,0.131,0.312483,0.3532,0.659332,0.0702,0.848036,0.021,0.803045,0.0352
EigenspaceOverlapScore,0.281568,0.382,0.272522,0.4294,0.273769,0.4544,0.128491,0.4742,0.275875,0.4822,0.284937,0.4234,0.275617,0.4944,0.272975,0.4874,0.276387,0.4606
Gulp,0.28136,0.3846,0.27677,0.4158,0.274428,0.4518,0.111432,0.4738,0.103242,0.5408,0.285205,0.4222,0.282807,0.4716,0.138971,0.4734,0.277413,0.4472
HardCorrelationMatch,0.2707,0.4956,0.271883,0.479,0.27331,0.4734,0.167077,0.3592,0.383127,0.1364,0.339107,0.2926,0.361708,0.3126,0.539895,0.1426,0.548372,0.1502
JaccardSimilarity,0.277164,0.4368,0.271703,0.4868,0.273186,0.4854,0.124418,0.4094,0.326535,0.2468,0.313439,0.316,0.351645,0.2138,0.683794,0.0728,0.288993,0.4846
LinearRegression,0.277083,0.4362,0.28261,0.4044,0.287879,0.4182,0.138999,0.464,0.157891,0.5308,0.340979,0.3042,0.302403,0.4556,0.283791,0.4028,0.369216,0.3278
MagnitudeDifference,0.165867,0.3734,0.11468,0.4668,0.176162,0.4248,0.104497,0.5308,0.455037,0.1564,0.3125,0.2016,0.176992,0.385,0.160646,0.3824,0.190985,0.388


In [6]:
# Label test again, this time requesting the reduced result files (reduced=True).
get_agg_pivot_table("label_test", DATASETS, reduced=True)

representation_dataset,cora,cora,cora,cora,cora,cora,flickr,flickr,flickr,flickr,flickr,flickr,ogbn-arxiv,ogbn-arxiv,ogbn-arxiv,ogbn-arxiv,ogbn-arxiv,ogbn-arxiv
architecture,GAT,GAT,GCN,GCN,GraphSAGE,GraphSAGE,GAT,GAT,GCN,GCN,GraphSAGE,GraphSAGE,GAT,GAT,GCN,GCN,GraphSAGE,GraphSAGE
quality_measure,AUPRC,violation_rate,AUPRC,violation_rate,AUPRC,violation_rate,AUPRC,violation_rate,AUPRC,violation_rate,AUPRC,violation_rate,AUPRC,violation_rate,AUPRC,violation_rate,AUPRC,violation_rate
similarity_measure,Unnamed: 1_level_3,Unnamed: 2_level_3,Unnamed: 3_level_3,Unnamed: 4_level_3,Unnamed: 5_level_3,Unnamed: 6_level_3,Unnamed: 7_level_3,Unnamed: 8_level_3,Unnamed: 9_level_3,Unnamed: 10_level_3,Unnamed: 11_level_3,Unnamed: 12_level_3,Unnamed: 13_level_3,Unnamed: 14_level_3,Unnamed: 15_level_3,Unnamed: 16_level_3,Unnamed: 17_level_3,Unnamed: 18_level_3
AlignedCosineSimilarity,0.419821,0.456667,0.494788,0.355333,0.427998,0.413333,0.285138,0.414667,0.666078,0.124,0.42497,0.49,0.736343,0.127333,0.782962,0.079333,0.691321,0.313333
CKA,0.419536,0.47,0.416974,0.468,0.421428,0.454667,0.299507,0.435333,0.68768,0.102667,0.663444,0.166,1.0,0.0,1.0,0.0,1.0,0.0
ConcentricityDifference,0.395347,0.266,0.244622,0.366667,0.365555,0.278,0.204123,0.473333,0.284699,0.422667,0.494268,0.204667,0.631512,0.092,0.649944,0.108667,0.99697,0.000667
DistanceCorrelation,0.418925,0.468667,0.426573,0.434667,0.48302,0.377333,0.260617,0.423333,0.744248,0.070667,0.514263,0.386,1.0,0.0,1.0,0.0,1.0,0.0
EigenspaceOverlapScore,0.476001,0.256,0.456515,0.313333,0.42564,0.44,0.273183,0.412,0.419621,0.488,0.45934,0.412,0.423206,0.5,0.424556,0.476667,0.426132,0.452
Gulp,0.475085,0.255333,0.476787,0.281333,0.426779,0.436667,0.234366,0.436,0.20499,0.530667,0.459449,0.411333,0.426772,0.474667,0.270213,0.484667,0.428979,0.426667
HardCorrelationMatch,0.419056,0.468,0.415229,0.478,0.422712,0.452,0.326965,0.278667,0.64508,0.104,0.575902,0.265333,0.715813,0.196,1.0,0.0,1.0,0.0
JaccardSimilarity,0.428521,0.422667,0.418521,0.472,0.417107,0.486,0.26308,0.341333,0.495149,0.233333,0.493502,0.315333,0.741675,0.111333,0.986247,0.003333,0.424167,0.492667
LinearRegression,0.446764,0.390667,0.483585,0.304667,0.44409,0.42,0.219352,0.421333,0.232107,0.516667,0.541855,0.291333,0.438774,0.448,0.448461,0.343333,0.654398,0.194667
MagnitudeDifference,0.356165,0.279333,0.19909,0.485333,0.269929,0.402,0.20158,0.500667,0.756744,0.133333,0.585883,0.138,0.290573,0.386667,0.193346,0.504667,0.345856,0.303333


In [7]:
# Layer test (comparison type "monotonicity"), aggregated over every dataset in DATASETS.
get_agg_pivot_table("layer_test", DATASETS)

representation_dataset,cora,cora,cora,cora,cora,cora,flickr,flickr,flickr,flickr,flickr,flickr,ogbn-arxiv,ogbn-arxiv,ogbn-arxiv,ogbn-arxiv,ogbn-arxiv,ogbn-arxiv
architecture,GAT,GAT,GCN,GCN,GraphSAGE,GraphSAGE,GAT,GAT,GCN,GCN,GraphSAGE,GraphSAGE,GAT,GAT,GCN,GCN,GraphSAGE,GraphSAGE
quality_measure,correlation,violation_rate,correlation,violation_rate,correlation,violation_rate,correlation,violation_rate,correlation,violation_rate,correlation,violation_rate,correlation,violation_rate,correlation,violation_rate,correlation,violation_rate
similarity_measure,Unnamed: 1_level_3,Unnamed: 2_level_3,Unnamed: 3_level_3,Unnamed: 4_level_3,Unnamed: 5_level_3,Unnamed: 6_level_3,Unnamed: 7_level_3,Unnamed: 8_level_3,Unnamed: 9_level_3,Unnamed: 10_level_3,Unnamed: 11_level_3,Unnamed: 12_level_3,Unnamed: 13_level_3,Unnamed: 14_level_3,Unnamed: 15_level_3,Unnamed: 16_level_3,Unnamed: 17_level_3,Unnamed: 18_level_3
AlignedCosineSimilarity,0.810646,0.1,0.947177,0.054762,0.888639,0.090476,0.48585,0.246429,0.522619,0.394048,0.812619,0.170238,0.443469,0.245238,0.933435,0.085714,0.66398,0.227381
CKA,0.997449,0.004762,0.972143,0.032143,0.982687,0.030952,0.464558,0.314286,0.360068,0.353571,0.895816,0.119048,0.85068,0.115476,0.743946,0.104762,0.949932,0.07381
ConcentricityDifference,0.640306,0.122619,0.717585,0.214286,0.229694,0.440476,0.609074,0.160714,0.344524,0.469048,0.056769,0.494048,0.387612,0.24881,0.545442,0.325,0.421122,0.413095
DistanceCorrelation,0.998469,0.003571,0.988639,0.005952,0.998299,0.004762,0.431565,0.340476,0.644694,0.232143,0.992483,0.015476,0.887959,0.083333,0.728027,0.115476,0.923673,0.103571
EigenspaceOverlapScore,1.0,0.0,1.0,0.0,1.0,0.0,0.792223,0.089286,0.975816,0.015476,0.994218,0.010714,0.906219,0.082143,0.785884,0.052381,0.989694,0.021429
Gulp,0.719048,0.091667,0.930612,0.028571,1.0,0.0,0.23898,0.397619,0.441429,0.289286,0.802619,0.077381,0.348707,0.369048,0.855374,0.113095,0.994558,0.014286
HardCorrelationMatch,0.905782,0.066667,0.914456,0.047619,0.929592,0.078571,0.642925,0.204762,0.515204,0.291667,0.836667,0.167857,0.898435,0.114286,0.929252,0.082143,0.877993,0.125
JaccardSimilarity,0.998299,0.005952,1.0,0.0,0.99966,0.00119,0.942211,0.059524,0.985238,0.02381,0.964626,0.055952,0.986054,0.020238,0.983844,0.027381,0.947279,0.07619
LinearRegression,0.878776,0.045238,0.996803,0.007143,1.0,0.0,0.237517,0.39881,0.359184,0.344048,0.693469,0.090476,0.24932,0.383333,0.967925,0.02619,0.99966,0.00119
MagnitudeDifference,0.930306,0.083333,0.345,0.409524,0.573129,0.344048,0.58585,0.361905,0.673367,0.264286,0.498095,0.358333,0.324592,0.313095,0.477415,0.305952,0.568435,0.163095


In [5]:
# Shortcut test: mean "value" per similarity measure over every dataset in DATASETS.
get_agg_pivot_table("shortcut_test", DATASETS)

representation_dataset,cora,cora,cora,cora,cora,cora,flickr,flickr,flickr,flickr,flickr,flickr,ogbn-arxiv,ogbn-arxiv,ogbn-arxiv,ogbn-arxiv,ogbn-arxiv,ogbn-arxiv
architecture,GAT,GAT,GCN,GCN,GraphSAGE,GraphSAGE,GAT,GAT,GCN,GCN,GraphSAGE,GraphSAGE,GAT,GAT,GCN,GCN,GraphSAGE,GraphSAGE
quality_measure,AUPRC,violation_rate,AUPRC,violation_rate,AUPRC,violation_rate,AUPRC,violation_rate,AUPRC,violation_rate,AUPRC,violation_rate,AUPRC,violation_rate,AUPRC,violation_rate,AUPRC,violation_rate
similarity_measure,Unnamed: 1_level_3,Unnamed: 2_level_3,Unnamed: 3_level_3,Unnamed: 4_level_3,Unnamed: 5_level_3,Unnamed: 6_level_3,Unnamed: 7_level_3,Unnamed: 8_level_3,Unnamed: 9_level_3,Unnamed: 10_level_3,Unnamed: 11_level_3,Unnamed: 12_level_3,Unnamed: 13_level_3,Unnamed: 14_level_3,Unnamed: 15_level_3,Unnamed: 16_level_3,Unnamed: 17_level_3,Unnamed: 18_level_3
AlignedCosineSimilarity,0.116701,0.4952,0.144859,0.4022,0.210714,0.2494,0.35997,0.338,0.299808,0.2008,0.527227,0.0864,0.566886,0.1088,0.383656,0.1406,0.944316,0.0084
CKA,0.226215,0.4034,0.134421,0.4016,0.303313,0.198,0.117855,0.4684,0.123737,0.4634,0.46545,0.1062,0.579315,0.0796,0.444151,0.1314,0.873149,0.0322
ConcentricityDifference,0.095087,0.5468,0.151224,0.5348,0.094332,0.573,0.154738,0.3804,0.137792,0.522,0.458561,0.1086,0.391127,0.1934,0.303171,0.327,0.711618,0.0552
DistanceCorrelation,0.221667,0.4104,0.142364,0.3862,0.370273,0.177,0.128919,0.4312,0.175935,0.33,0.460491,0.1126,0.564012,0.0904,0.44317,0.132,0.884731,0.0266
EigenspaceOverlapScore,0.084755,0.5932,0.107221,0.4662,0.187584,0.3808,0.281368,0.404,0.140166,0.3292,0.319582,0.2624,0.411037,0.1702,0.244117,0.2108,0.527321,0.0588
Gulp,0.08826,0.5852,0.103083,0.4828,0.187679,0.3768,0.16114,0.356,0.110683,0.533,0.277657,0.4064,0.411573,0.1682,0.225199,0.2304,0.462335,0.103
HardCorrelationMatch,0.107221,0.4652,0.095984,0.5066,0.180108,0.2854,0.332267,0.2788,0.208394,0.2648,0.546456,0.0892,0.442824,0.1052,0.216439,0.2564,0.703211,0.0278
JaccardSimilarity,0.172286,0.346,0.144966,0.3994,0.346899,0.2174,0.308633,0.285,0.430379,0.119,0.385761,0.1678,0.508573,0.1324,0.455164,0.1236,0.971198,0.0032
LinearRegression,0.157208,0.418,0.13934,0.4376,0.363778,0.175,0.159012,0.4262,0.192686,0.3388,0.356119,0.2138,0.500928,0.1018,0.343531,0.2012,0.561853,0.069
MagnitudeDifference,0.091114,0.5432,0.137015,0.5326,0.090777,0.5716,0.13329,0.4308,0.127935,0.4626,0.569959,0.1374,0.383388,0.1804,0.162774,0.3482,0.296801,0.1894


In [6]:
# Shortcut test again, this time requesting the reduced result files (reduced=True).
get_agg_pivot_table("shortcut_test", DATASETS, reduced=True)

representation_dataset,cora,cora,cora,cora,cora,cora,flickr,flickr,flickr,flickr,flickr,flickr,ogbn-arxiv,ogbn-arxiv,ogbn-arxiv,ogbn-arxiv,ogbn-arxiv,ogbn-arxiv
architecture,GAT,GAT,GCN,GCN,GraphSAGE,GraphSAGE,GAT,GAT,GCN,GCN,GraphSAGE,GraphSAGE,GAT,GAT,GCN,GCN,GraphSAGE,GraphSAGE
quality_measure,AUPRC,violation_rate,AUPRC,violation_rate,AUPRC,violation_rate,AUPRC,violation_rate,AUPRC,violation_rate,AUPRC,violation_rate,AUPRC,violation_rate,AUPRC,violation_rate,AUPRC,violation_rate
similarity_measure,Unnamed: 1_level_3,Unnamed: 2_level_3,Unnamed: 3_level_3,Unnamed: 4_level_3,Unnamed: 5_level_3,Unnamed: 6_level_3,Unnamed: 7_level_3,Unnamed: 8_level_3,Unnamed: 9_level_3,Unnamed: 10_level_3,Unnamed: 11_level_3,Unnamed: 12_level_3,Unnamed: 13_level_3,Unnamed: 14_level_3,Unnamed: 15_level_3,Unnamed: 16_level_3,Unnamed: 17_level_3,Unnamed: 18_level_3
AlignedCosineSimilarity,0.302898,0.411333,0.318647,0.305333,0.598752,0.118667,0.479826,0.231333,0.894714,0.019333,1.0,0.0,1.0,0.0,1.0,0.0,1.0,0.0
CKA,0.46266,0.364,0.272784,0.338667,0.776866,0.096667,0.330272,0.348,0.281582,0.428,1.0,0.0,1.0,0.0,1.0,0.0,0.981104,0.004
ConcentricityDifference,0.204222,0.502,0.182471,0.532,0.168895,0.573333,0.324453,0.392667,0.182249,0.503333,0.176244,0.536667,1.0,0.0,0.814892,0.036667,0.961912,0.009333
DistanceCorrelation,0.459166,0.378,0.283945,0.312,0.819571,0.084,0.31707,0.282,0.332822,0.313333,1.0,0.0,1.0,0.0,1.0,0.0,0.994444,0.001333
EigenspaceOverlapScore,0.163367,0.575333,0.216938,0.426,0.495157,0.26,0.544425,0.190667,0.460572,0.128,0.432888,0.4,0.968069,0.007333,1.0,0.0,0.724314,0.166667
Gulp,0.172056,0.560667,0.197004,0.474667,0.495904,0.260667,0.451336,0.189333,0.196031,0.508,0.432888,0.4,0.964558,0.008667,0.985766,0.002667,0.724314,0.166667
HardCorrelationMatch,0.219276,0.418667,0.200268,0.441333,0.347125,0.232,0.518523,0.192,0.549104,0.171333,1.0,0.0,0.834909,0.030667,0.798304,0.038667,0.724314,0.166667
JaccardSimilarity,0.379688,0.286,0.305227,0.303333,0.782344,0.070667,0.544567,0.16,1.0,0.0,0.827864,0.037333,1.0,0.0,1.0,0.0,1.0,0.0
LinearRegression,0.333709,0.376,0.299139,0.383333,0.741737,0.053333,0.356838,0.277333,0.365108,0.297333,0.609064,0.188667,1.0,0.0,1.0,0.0,1.0,0.0
MagnitudeDifference,0.187117,0.511333,0.267258,0.519333,0.151357,0.585333,0.197894,0.523333,0.265917,0.330667,0.782998,0.114,1.0,0.0,0.549767,0.18,0.534647,0.176


In [9]:
# Augmentation test: mean "value" per similarity measure over every dataset in DATASETS.
get_agg_pivot_table("augmentation_test", DATASETS)

representation_dataset,cora,cora,cora,cora,cora,cora,flickr,flickr,flickr,flickr,flickr,flickr,ogbn-arxiv,ogbn-arxiv,ogbn-arxiv,ogbn-arxiv,ogbn-arxiv,ogbn-arxiv
architecture,GAT,GAT,GCN,GCN,GraphSAGE,GraphSAGE,GAT,GAT,GCN,GCN,GraphSAGE,GraphSAGE,GAT,GAT,GCN,GCN,GraphSAGE,GraphSAGE
quality_measure,AUPRC,violation_rate,AUPRC,violation_rate,AUPRC,violation_rate,AUPRC,violation_rate,AUPRC,violation_rate,AUPRC,violation_rate,AUPRC,violation_rate,AUPRC,violation_rate,AUPRC,violation_rate
similarity_measure,Unnamed: 1_level_3,Unnamed: 2_level_3,Unnamed: 3_level_3,Unnamed: 4_level_3,Unnamed: 5_level_3,Unnamed: 6_level_3,Unnamed: 7_level_3,Unnamed: 8_level_3,Unnamed: 9_level_3,Unnamed: 10_level_3,Unnamed: 11_level_3,Unnamed: 12_level_3,Unnamed: 13_level_3,Unnamed: 14_level_3,Unnamed: 15_level_3,Unnamed: 16_level_3,Unnamed: 17_level_3,Unnamed: 18_level_3
AlignedCosineSimilarity,0.293559,0.1662,0.158459,0.3958,0.292466,0.3202,0.436004,0.253,0.735944,0.0508,0.229736,0.2046,0.666762,0.0694,0.300382,0.1798,0.169973,0.5124
CKA,0.390306,0.123,0.22338,0.2852,0.294391,0.2318,0.249924,0.285,0.710209,0.0584,0.335225,0.155,0.612986,0.0808,0.52979,0.0798,0.632456,0.0496
ConcentricityDifference,0.228318,0.2942,0.106856,0.488,0.28711,0.3454,0.216544,0.325,0.214372,0.3152,0.158231,0.3714,0.35459,0.2336,0.185267,0.2982,0.211294,0.2976
DistanceCorrelation,0.409174,0.1104,0.289524,0.2332,0.326323,0.223,0.310938,0.2406,0.690684,0.0598,0.351039,0.1776,0.641077,0.0742,0.563156,0.0818,0.610865,0.06
EigenspaceOverlapScore,0.118466,0.392,0.132337,0.3552,0.195475,0.2688,0.297408,0.3308,0.356336,0.1908,0.194295,0.3844,0.353438,0.1134,0.214642,0.2152,0.174435,0.4306
Gulp,0.120187,0.3842,0.132054,0.362,0.203648,0.2598,0.481254,0.202,0.114814,0.4834,0.193566,0.3832,0.391706,0.1222,0.124858,0.3992,0.174545,0.4314
HardCorrelationMatch,0.12555,0.3862,0.131358,0.3606,0.178539,0.2918,0.421316,0.2028,0.640959,0.08,0.276204,0.2526,0.182568,0.4018,0.13759,0.5164,0.144221,0.456
JaccardSimilarity,0.425655,0.0876,0.29521,0.2038,0.343669,0.1912,0.556184,0.1352,0.815834,0.0358,0.402013,0.1626,0.725944,0.034,0.553446,0.054,0.334755,0.1334
LinearRegression,0.317356,0.123,0.341739,0.1158,0.350219,0.1574,0.25313,0.2814,0.177172,0.4874,0.296811,0.2286,0.454151,0.114,0.225098,0.2746,0.20329,0.288
MagnitudeDifference,0.346935,0.2634,0.128563,0.4412,0.201762,0.3622,0.236253,0.3344,0.421046,0.206,0.100563,0.5016,0.363517,0.1952,0.332625,0.2066,0.994667,0.0006


In [10]:
# Augmentation test again, this time requesting the reduced result files (reduced=True).
get_agg_pivot_table("augmentation_test", DATASETS, reduced=True)

representation_dataset,cora,cora,cora,cora,cora,cora,flickr,flickr,flickr,flickr,flickr,flickr,ogbn-arxiv,ogbn-arxiv,ogbn-arxiv,ogbn-arxiv,ogbn-arxiv,ogbn-arxiv
architecture,GAT,GAT,GCN,GCN,GraphSAGE,GraphSAGE,GAT,GAT,GCN,GCN,GraphSAGE,GraphSAGE,GAT,GAT,GCN,GCN,GraphSAGE,GraphSAGE
quality_measure,AUPRC,violation_rate,AUPRC,violation_rate,AUPRC,violation_rate,AUPRC,violation_rate,AUPRC,violation_rate,AUPRC,violation_rate,AUPRC,violation_rate,AUPRC,violation_rate,AUPRC,violation_rate
similarity_measure,Unnamed: 1_level_3,Unnamed: 2_level_3,Unnamed: 3_level_3,Unnamed: 4_level_3,Unnamed: 5_level_3,Unnamed: 6_level_3,Unnamed: 7_level_3,Unnamed: 8_level_3,Unnamed: 9_level_3,Unnamed: 10_level_3,Unnamed: 11_level_3,Unnamed: 12_level_3,Unnamed: 13_level_3,Unnamed: 14_level_3,Unnamed: 15_level_3,Unnamed: 16_level_3,Unnamed: 17_level_3,Unnamed: 18_level_3
AlignedCosineSimilarity,0.786291,0.034667,0.359539,0.314667,0.547878,0.188,0.524542,0.26,0.586179,0.134667,0.675858,0.133333,1.0,0.0,0.728084,0.147333,0.420883,0.468
CKA,0.692267,0.093333,0.526463,0.190667,0.652736,0.120667,0.438866,0.358,0.571211,0.147333,0.731956,0.108,0.968782,0.004667,0.877425,0.020667,0.98468,0.003333
ConcentricityDifference,0.553624,0.165333,0.175102,0.508,0.487404,0.203333,0.376105,0.326,0.418151,0.221333,0.304516,0.295333,0.623267,0.115333,0.490097,0.227333,0.41341,0.273333
DistanceCorrelation,0.719894,0.078667,0.59755,0.135333,0.698952,0.107333,0.5332,0.253333,0.55963,0.158,0.757476,0.084,0.985766,0.002667,0.954316,0.008667,0.964203,0.006667
EigenspaceOverlapScore,0.25358,0.328,0.285511,0.256,0.415019,0.146,0.452518,0.333333,0.521768,0.197333,0.476489,0.262,0.655035,0.066667,0.599038,0.101333,0.46509,0.283333
Gulp,0.258547,0.317333,0.293003,0.252,0.415199,0.15,0.667131,0.19,0.202852,0.465333,0.476891,0.26,0.655035,0.066667,0.306402,0.291333,0.462602,0.288
HardCorrelationMatch,0.255907,0.312,0.308416,0.277333,0.397374,0.192,0.554407,0.186,0.604909,0.127333,0.597125,0.133333,0.491916,0.244,0.441535,0.446,0.47035,0.282667
JaccardSimilarity,0.768198,0.036667,0.619864,0.142,0.762113,0.075333,0.695215,0.156667,0.693057,0.119333,0.703485,0.06,0.946856,0.008667,0.97958,0.004667,0.655035,0.066667
LinearRegression,0.609928,0.099333,0.644813,0.082,0.772596,0.060667,0.30705,0.334,0.257079,0.504667,0.685969,0.096,0.747042,0.109333,0.555347,0.186,0.560379,0.167333
MagnitudeDifference,0.535091,0.172667,0.196374,0.468,0.489759,0.210667,0.313769,0.316667,0.600202,0.161333,0.17811,0.517333,0.557636,0.164,0.71963,0.094,1.0,0.0


### Results of Output Correlations

In [11]:
def get_output_correlation_table(experiment, dataset):
    """Load the "output_correlation" result CSV of an experiment and pivot it.

    The file is located under EXPERIMENT_RESULTS_PATH using FULL_DF_FILE_NAME
    with the fixed comparison type "output_correlation".

    Returns:
        A DataFrame indexed by "similarity_measure" whose columns are the
        (architecture, functional_similarity_measure, quality_measure)
        combinations and whose cells are the mean of the "corr" column over
        all matching rows.
    """
    file_name = FULL_DF_FILE_NAME(experiment, "output_correlation", dataset)
    correlations = pd.read_csv(os.path.join(EXPERIMENT_RESULTS_PATH, file_name))

    kept_columns = ["similarity_measure", "functional_similarity_measure", "quality_measure", "corr", "architecture"]
    column_levels = ["architecture", "functional_similarity_measure", "quality_measure"]

    selected = correlations.loc[:, kept_columns]
    return selected.pivot_table(
        index="similarity_measure",
        columns=column_levels,
        values="corr",
        aggfunc="mean",
    )

In [12]:
# Mean "corr" per similarity measure for the label test on cora.
get_output_correlation_table(experiment="label_test", dataset="cora")

architecture,GAT,GAT,GAT,GAT,GAT,GAT,GCN,GCN,GCN,GCN,GCN,GCN,GraphSAGE,GraphSAGE,GraphSAGE,GraphSAGE,GraphSAGE,GraphSAGE
functional_similarity_measure,Disagreement,Disagreement,Disagreement,JSD,JSD,JSD,Disagreement,Disagreement,Disagreement,JSD,JSD,JSD,Disagreement,Disagreement,Disagreement,JSD,JSD,JSD
quality_measure,kendalltau,pearsonr,spearmanr,kendalltau,pearsonr,spearmanr,kendalltau,pearsonr,spearmanr,kendalltau,pearsonr,spearmanr,kendalltau,pearsonr,spearmanr,kendalltau,pearsonr,spearmanr
similarity_measure,Unnamed: 1_level_3,Unnamed: 2_level_3,Unnamed: 3_level_3,Unnamed: 4_level_3,Unnamed: 5_level_3,Unnamed: 6_level_3,Unnamed: 7_level_3,Unnamed: 8_level_3,Unnamed: 9_level_3,Unnamed: 10_level_3,Unnamed: 11_level_3,Unnamed: 12_level_3,Unnamed: 13_level_3,Unnamed: 14_level_3,Unnamed: 15_level_3,Unnamed: 16_level_3,Unnamed: 17_level_3,Unnamed: 18_level_3
AlignedCosineSimilarity,-0.509585,-0.916551,-0.670872,-0.535206,-0.884646,-0.688909,-0.379181,-0.810322,-0.525891,-0.371817,-0.793789,-0.516602,-0.412152,-0.898169,-0.574975,-0.443389,-0.83809,-0.610212
CKA,-0.473548,-0.900428,-0.617185,-0.448027,-0.857739,-0.601184,-0.479349,-0.892242,-0.643784,-0.464571,-0.869538,-0.6297,-0.42791,-0.915825,-0.596623,-0.381761,-0.848918,-0.55253
ConcentricityDifference,-0.1059,-0.204555,-0.163648,-0.07728,-0.164305,-0.122245,-0.035688,-0.075679,-0.054454,-0.005663,-0.038142,-0.008911,0.073547,0.138064,0.10538,0.063724,0.174908,0.090975
DistanceCorrelation,-0.468591,-0.923049,-0.611785,-0.45311,-0.880671,-0.603781,-0.500508,-0.915534,-0.668181,-0.511349,-0.897737,-0.678854,-0.392152,-0.922677,-0.555918,-0.468049,-0.872551,-0.630083
EigenspaceOverlapScore,-0.272375,-0.448225,-0.397818,-0.301583,-0.47892,-0.436154,-0.333739,-0.65612,-0.476177,-0.323255,-0.645285,-0.467559,-0.452374,-0.885703,-0.618154,-0.45146,-0.835498,-0.619921
Gulp,0.261033,0.439794,0.382707,0.28981,0.469977,0.421743,0.3299,0.653494,0.474486,0.332352,0.649085,0.480472,0.45474,0.885594,0.619666,0.460691,0.837419,0.628334
HardCorrelationMatch,-0.488105,-0.919895,-0.629989,-0.460468,-0.876687,-0.612355,-0.474618,-0.916649,-0.639947,-0.453556,-0.894043,-0.617839,-0.451972,-0.93031,-0.614179,-0.380647,-0.856009,-0.550111
JaccardSimilarity,-0.534502,-0.764992,-0.697462,-0.535964,-0.728527,-0.697987,-0.498901,-0.853067,-0.666494,-0.460245,-0.825347,-0.624777,-0.461748,-0.857814,-0.623993,-0.364727,-0.786898,-0.522653
LinearRegression,-0.438986,-0.83875,-0.598718,-0.424974,-0.785515,-0.577432,-0.356597,-0.767644,-0.491908,-0.335762,-0.736117,-0.464767,-0.434756,-0.864312,-0.590146,-0.380986,-0.768851,-0.518028
MagnitudeDifference,-0.12537,-0.230291,-0.185317,-0.098729,-0.198162,-0.149061,0.012878,0.015327,0.018682,0.031349,0.034729,0.048306,0.048726,0.143004,0.067037,0.036254,0.126279,0.045031


In [13]:
# Mean "corr" per similarity measure for the label test on flickr.
get_output_correlation_table(experiment="label_test", dataset="flickr")

architecture,GAT,GAT,GAT,GAT,GAT,GAT,GCN,GCN,GCN,GCN,GCN,GCN,GraphSAGE,GraphSAGE,GraphSAGE,GraphSAGE,GraphSAGE,GraphSAGE
functional_similarity_measure,Disagreement,Disagreement,Disagreement,JSD,JSD,JSD,Disagreement,Disagreement,Disagreement,JSD,JSD,JSD,Disagreement,Disagreement,Disagreement,JSD,JSD,JSD
quality_measure,kendalltau,pearsonr,spearmanr,kendalltau,pearsonr,spearmanr,kendalltau,pearsonr,spearmanr,kendalltau,pearsonr,spearmanr,kendalltau,pearsonr,spearmanr,kendalltau,pearsonr,spearmanr
similarity_measure,Unnamed: 1_level_3,Unnamed: 2_level_3,Unnamed: 3_level_3,Unnamed: 4_level_3,Unnamed: 5_level_3,Unnamed: 6_level_3,Unnamed: 7_level_3,Unnamed: 8_level_3,Unnamed: 9_level_3,Unnamed: 10_level_3,Unnamed: 11_level_3,Unnamed: 12_level_3,Unnamed: 13_level_3,Unnamed: 14_level_3,Unnamed: 15_level_3,Unnamed: 16_level_3,Unnamed: 17_level_3,Unnamed: 18_level_3
AlignedCosineSimilarity,-0.075699,-0.117805,-0.106484,-0.082096,-0.083086,-0.119403,-0.174759,-0.216776,-0.254891,-0.475942,-0.671375,-0.660939,-0.590132,-0.914541,-0.793491,-0.504526,-0.756979,-0.692169
CKA,-0.007603,0.007734,-0.005532,-0.174493,-0.244961,-0.262611,-0.107193,-0.159039,-0.155703,-0.409944,-0.613291,-0.595409,-0.406779,-0.639896,-0.561853,-0.570078,-0.785473,-0.773238
ConcentricityDifference,-0.037214,-0.08921,-0.060974,0.093556,0.07817,0.141156,0.00747,0.048733,0.012054,0.048652,0.064524,0.071572,0.45303,0.59349,0.647121,0.473088,0.67006,0.673326
DistanceCorrelation,-0.052733,-0.004947,-0.06558,-0.194872,-0.256748,-0.291142,0.022768,-0.051486,0.034173,-0.521249,-0.74373,-0.729528,-0.553247,-0.929313,-0.722766,-0.677458,-0.855416,-0.845032
EigenspaceOverlapScore,0.030971,0.057493,0.041775,-0.011237,0.020557,-0.016646,-0.280057,-0.456417,-0.430112,0.20388,0.111038,0.298193,-0.593611,-0.915811,-0.776732,-0.617703,-0.819038,-0.793591
Gulp,-0.026957,-0.05936,-0.04552,0.251996,0.356353,0.36235,0.053541,0.15721,0.077798,-0.010747,0.020992,-0.013569,0.593656,0.916107,0.777057,0.620245,0.820363,0.795847
HardCorrelationMatch,-0.183752,-0.197044,-0.269195,-0.334181,-0.406197,-0.472265,-0.004304,-0.032861,-0.004773,-0.516165,-0.698386,-0.724729,-0.574165,-0.906239,-0.744398,-0.718172,-0.873563,-0.885004
JaccardSimilarity,-0.145534,-0.081065,-0.221831,-0.238261,-0.293316,-0.350141,-0.272921,-0.376476,-0.417438,-0.164504,-0.103163,-0.266037,-0.536701,-0.84206,-0.711371,-0.615385,-0.744901,-0.794102
LinearRegression,0.006494,0.026687,0.010612,-0.145586,-0.182693,-0.217637,-0.011408,-0.090679,-0.011654,0.01389,-0.038739,0.02185,-0.533701,-0.863957,-0.716297,-0.599421,-0.816182,-0.781338
MagnitudeDifference,-0.051663,-0.092329,-0.076602,-0.1101,-0.166321,-0.164365,0.009165,-0.005925,0.014309,0.310858,0.406163,0.456052,0.182974,0.260688,0.26755,0.312508,0.506858,0.450695


In [14]:
# Mean "corr" per similarity measure for the label test on ogbn-arxiv.
get_output_correlation_table(experiment="label_test", dataset="ogbn-arxiv")

architecture,GAT,GAT,GAT,GAT,GAT,GAT,GCN,GCN,GCN,GCN,GCN,GCN,GraphSAGE,GraphSAGE,GraphSAGE,GraphSAGE,GraphSAGE,GraphSAGE
functional_similarity_measure,Disagreement,Disagreement,Disagreement,JSD,JSD,JSD,Disagreement,Disagreement,Disagreement,JSD,JSD,JSD,Disagreement,Disagreement,Disagreement,JSD,JSD,JSD
quality_measure,kendalltau,pearsonr,spearmanr,kendalltau,pearsonr,spearmanr,kendalltau,pearsonr,spearmanr,kendalltau,pearsonr,spearmanr,kendalltau,pearsonr,spearmanr,kendalltau,pearsonr,spearmanr
similarity_measure,Unnamed: 1_level_3,Unnamed: 2_level_3,Unnamed: 3_level_3,Unnamed: 4_level_3,Unnamed: 5_level_3,Unnamed: 6_level_3,Unnamed: 7_level_3,Unnamed: 8_level_3,Unnamed: 9_level_3,Unnamed: 10_level_3,Unnamed: 11_level_3,Unnamed: 12_level_3,Unnamed: 13_level_3,Unnamed: 14_level_3,Unnamed: 15_level_3,Unnamed: 16_level_3,Unnamed: 17_level_3,Unnamed: 18_level_3
AlignedCosineSimilarity,-0.650813,-0.834448,-0.862018,-0.560401,-0.766566,-0.736649,-0.753501,-0.880757,-0.927873,-0.412219,-0.585844,-0.559938,-0.712526,-0.921798,-0.906427,-0.276878,-0.494089,-0.391566
CKA,-0.564533,-0.73785,-0.774701,-0.721828,-0.881106,-0.902226,-0.447358,-0.525307,-0.628396,-0.764236,-0.920409,-0.941568,-0.534372,-0.723384,-0.745787,-0.623278,-0.824721,-0.827975
ConcentricityDifference,0.073137,-0.025403,0.105955,0.461984,0.678243,0.639569,0.02233,-0.073952,0.028141,0.343902,0.32108,0.534598,0.046871,-0.023777,0.065604,0.48058,0.528894,0.692705
DistanceCorrelation,-0.648444,-0.844284,-0.858611,-0.629387,-0.80351,-0.822918,-0.537571,-0.64899,-0.732817,-0.669208,-0.853633,-0.886629,-0.624052,-0.802178,-0.841245,-0.535964,-0.757683,-0.738618
EigenspaceOverlapScore,-0.6847,-0.88354,-0.890176,-0.323969,-0.506115,-0.474025,-0.600184,-0.73999,-0.836244,-0.102876,-0.235597,-0.146856,-0.747612,-0.847237,-0.922562,-0.116789,-0.295089,-0.18326
Gulp,0.683359,0.881338,0.888764,0.391394,0.553236,0.542778,0.515911,0.122537,0.727048,0.133512,0.041163,0.181463,0.757254,0.848638,0.927237,0.130301,0.302382,0.203274
HardCorrelationMatch,-0.687471,-0.910824,-0.891366,-0.505507,-0.644775,-0.669688,-0.757744,-0.829691,-0.930964,-0.446778,-0.661899,-0.621862,-0.768101,-0.873212,-0.938249,-0.368963,-0.60368,-0.525924
JaccardSimilarity,-0.692925,-0.836132,-0.895709,-0.470903,-0.633999,-0.675379,-0.753054,-0.834614,-0.928918,-0.402185,-0.580846,-0.589277,-0.760379,-0.916531,-0.926862,-0.185686,-0.338541,-0.26603
LinearRegression,-0.635418,-0.852553,-0.856289,-0.277126,-0.408234,-0.42512,-0.536497,-0.721674,-0.745902,-0.092932,-0.178525,-0.126143,-0.740721,-0.867739,-0.918763,-0.152192,-0.290474,-0.229648
MagnitudeDifference,0.007555,-0.084838,0.009174,0.025909,-0.087285,0.035644,-0.082576,-0.14941,-0.120976,0.05369,0.011906,0.087,0.254308,0.475428,0.394629,0.106622,0.1348,0.163667


In [15]:
# Mean "corr" per similarity measure for the shortcut test on cora.
get_output_correlation_table(experiment="shortcut_test", dataset="cora")

architecture,GAT,GAT,GAT,GAT,GAT,GAT,GCN,GCN,GCN,GCN,GCN,GCN,GraphSAGE,GraphSAGE,GraphSAGE,GraphSAGE,GraphSAGE,GraphSAGE
functional_similarity_measure,Disagreement,Disagreement,Disagreement,JSD,JSD,JSD,Disagreement,Disagreement,Disagreement,JSD,JSD,JSD,Disagreement,Disagreement,Disagreement,JSD,JSD,JSD
quality_measure,kendalltau,pearsonr,spearmanr,kendalltau,pearsonr,spearmanr,kendalltau,pearsonr,spearmanr,kendalltau,pearsonr,spearmanr,kendalltau,pearsonr,spearmanr,kendalltau,pearsonr,spearmanr
similarity_measure,Unnamed: 1_level_3,Unnamed: 2_level_3,Unnamed: 3_level_3,Unnamed: 4_level_3,Unnamed: 5_level_3,Unnamed: 6_level_3,Unnamed: 7_level_3,Unnamed: 8_level_3,Unnamed: 9_level_3,Unnamed: 10_level_3,Unnamed: 11_level_3,Unnamed: 12_level_3,Unnamed: 13_level_3,Unnamed: 14_level_3,Unnamed: 15_level_3,Unnamed: 16_level_3,Unnamed: 17_level_3,Unnamed: 18_level_3
AlignedCosineSimilarity,0.084346,0.142265,0.113742,0.035452,0.04724,0.039324,-0.241805,-0.350989,-0.348876,-0.249008,-0.346518,-0.356693,0.092716,0.140225,0.142874,0.015028,0.031096,0.028863
CKA,-0.061072,-0.087849,-0.088566,-0.097748,-0.170038,-0.140643,-0.335741,-0.497786,-0.476726,-0.355897,-0.506638,-0.504341,-0.231388,-0.35258,-0.343904,-0.29262,-0.430762,-0.427375
ConcentricityDifference,-0.111916,-0.165641,-0.165593,-0.073534,-0.075348,-0.109595,0.176583,0.213249,0.266522,0.205931,0.241613,0.312791,-0.065875,-0.101735,-0.097933,-0.021093,-0.040942,-0.030195
DistanceCorrelation,-0.059953,-0.084395,-0.088791,-0.096499,-0.168136,-0.140059,-0.349135,-0.51068,-0.493765,-0.377525,-0.52802,-0.532597,-0.243804,-0.366627,-0.364798,-0.294627,-0.425513,-0.43229
EigenspaceOverlapScore,-0.029473,-0.278845,-0.05495,-0.076477,-0.280811,-0.126497,-0.086813,-0.173359,-0.133231,-0.062074,-0.148223,-0.098712,0.024697,0.027379,0.034852,-0.034916,-0.077886,-0.048109
Gulp,0.02437,0.277664,0.047559,0.074381,0.280183,0.12262,0.063072,0.132466,0.097678,0.049855,0.115011,0.08195,-0.006922,-0.01124,-0.006718,0.052174,0.094337,0.074544
HardCorrelationMatch,-0.269552,-0.391527,-0.380577,-0.317547,-0.401708,-0.448451,-0.245971,-0.303149,-0.353785,-0.255786,-0.298706,-0.371868,-0.216293,-0.326298,-0.317133,-0.280847,-0.406139,-0.406429
JaccardSimilarity,-0.08439,-0.207227,-0.127164,-0.127982,-0.234752,-0.193739,-0.305101,-0.418021,-0.43514,-0.315229,-0.411818,-0.455192,-0.098254,-0.149201,-0.151059,-0.160758,-0.264918,-0.242593
LinearRegression,-0.09787,-0.138093,-0.143012,-0.133601,-0.178021,-0.197584,-0.180475,-0.259206,-0.260681,-0.166271,-0.217019,-0.242733,-0.105501,-0.127213,-0.157488,-0.186689,-0.256215,-0.274516
MagnitudeDifference,-0.024639,-0.032036,-0.034505,0.007982,0.049213,0.008663,0.219228,0.303063,0.326785,0.271037,0.362033,0.402784,0.082399,0.116923,0.125951,0.105463,0.149789,0.156968


In [16]:
# Mean "corr" per similarity measure for the shortcut test on flickr.
get_output_correlation_table(experiment="shortcut_test", dataset="flickr")

architecture,GAT,GAT,GAT,GAT,GAT,GAT,GCN,GCN,GCN,GCN,GCN,GCN,GraphSAGE,GraphSAGE,GraphSAGE,GraphSAGE,GraphSAGE,GraphSAGE
functional_similarity_measure,Disagreement,Disagreement,Disagreement,JSD,JSD,JSD,Disagreement,Disagreement,Disagreement,JSD,JSD,JSD,Disagreement,Disagreement,Disagreement,JSD,JSD,JSD
quality_measure,kendalltau,pearsonr,spearmanr,kendalltau,pearsonr,spearmanr,kendalltau,pearsonr,spearmanr,kendalltau,pearsonr,spearmanr,kendalltau,pearsonr,spearmanr,kendalltau,pearsonr,spearmanr
similarity_measure,Unnamed: 1_level_3,Unnamed: 2_level_3,Unnamed: 3_level_3,Unnamed: 4_level_3,Unnamed: 5_level_3,Unnamed: 6_level_3,Unnamed: 7_level_3,Unnamed: 8_level_3,Unnamed: 9_level_3,Unnamed: 10_level_3,Unnamed: 11_level_3,Unnamed: 12_level_3,Unnamed: 13_level_3,Unnamed: 14_level_3,Unnamed: 15_level_3,Unnamed: 16_level_3,Unnamed: 17_level_3,Unnamed: 18_level_3
AlignedCosineSimilarity,-0.191678,-0.310566,-0.280539,-0.177079,-0.288528,-0.261045,-0.086544,-0.132072,-0.132732,-0.123032,-0.141067,-0.187099,-0.513029,-0.80114,-0.681401,-0.542386,-0.765174,-0.702198
CKA,0.080498,0.112315,0.118377,0.051327,0.064812,0.072535,-0.057376,-0.089652,-0.085364,-0.084994,-0.074027,-0.130309,-0.360403,-0.496312,-0.504378,-0.382787,-0.429925,-0.524492
ConcentricityDifference,-0.007983,-0.063764,-0.02328,0.018239,-0.005721,0.02127,0.005196,-0.009772,0.008768,0.012263,-0.031034,0.020808,0.717572,0.928839,0.894009,0.72495,0.954498,0.900782
DistanceCorrelation,0.028364,0.087908,0.042061,-0.007581,0.026023,-0.016858,-0.088283,-0.155947,-0.138578,-0.085084,-0.09823,-0.133558,-0.344525,-0.562446,-0.483358,-0.367447,-0.512464,-0.503502
EigenspaceOverlapScore,-0.049191,-0.121116,-0.071692,-0.03175,-0.104547,-0.046357,-0.045022,-0.074239,-0.070266,-0.086778,-0.106176,-0.132185,-0.413389,-0.481281,-0.556337,-0.433846,-0.424546,-0.574597
Gulp,0.316238,0.475386,0.48307,0.335072,0.503631,0.506488,0.03026,0.026846,0.043074,0.012174,-0.014188,0.017807,-0.060814,0.223891,-0.195507,-0.040089,0.112763,-0.17781
HardCorrelationMatch,-0.316416,-0.520786,-0.483867,-0.354337,-0.573153,-0.527278,-0.095642,-0.147096,-0.148683,-0.121382,-0.159825,-0.193319,-0.47494,-0.742214,-0.654679,-0.499844,-0.679264,-0.673611
JaccardSimilarity,-0.454489,-0.711051,-0.658291,-0.446555,-0.706316,-0.653904,-0.070845,-0.12904,-0.10895,-0.099844,-0.181103,-0.15698,-0.273564,-0.445484,-0.378247,-0.297614,-0.319966,-0.398857
LinearRegression,-0.008879,0.014951,-0.009993,-0.027313,-0.011334,-0.039584,-0.003231,0.099121,-0.005681,0.028304,0.1419,0.041821,-0.15944,-0.265828,-0.22553,-0.182712,-0.181173,-0.250872
MagnitudeDifference,-0.044998,-0.107515,-0.070391,-0.030591,-0.053344,-0.050638,0.049527,0.074236,0.070813,0.066667,0.087092,0.096026,0.637066,0.873031,0.841242,0.628629,0.925754,0.832511


In [17]:
# Display the shortcut_test / ogbn-arxiv table: one row per similarity measure,
# columns grouped by architecture, functional similarity measure
# (Disagreement, JSD) and statistic (kendalltau, pearsonr, spearmanr).
get_output_correlation_table("shortcut_test", "ogbn-arxiv")

architecture,GAT,GAT,GAT,GAT,GAT,GAT,GCN,GCN,GCN,GCN,GCN,GCN,GraphSAGE,GraphSAGE,GraphSAGE,GraphSAGE,GraphSAGE,GraphSAGE
functional_similarity_measure,Disagreement,Disagreement,Disagreement,JSD,JSD,JSD,Disagreement,Disagreement,Disagreement,JSD,JSD,JSD,Disagreement,Disagreement,Disagreement,JSD,JSD,JSD
quality_measure,kendalltau,pearsonr,spearmanr,kendalltau,pearsonr,spearmanr,kendalltau,pearsonr,spearmanr,kendalltau,pearsonr,spearmanr,kendalltau,pearsonr,spearmanr,kendalltau,pearsonr,spearmanr
similarity_measure,Unnamed: 1_level_3,Unnamed: 2_level_3,Unnamed: 3_level_3,Unnamed: 4_level_3,Unnamed: 5_level_3,Unnamed: 6_level_3,Unnamed: 7_level_3,Unnamed: 8_level_3,Unnamed: 9_level_3,Unnamed: 10_level_3,Unnamed: 11_level_3,Unnamed: 12_level_3,Unnamed: 13_level_3,Unnamed: 14_level_3,Unnamed: 15_level_3,Unnamed: 16_level_3,Unnamed: 17_level_3,Unnamed: 18_level_3
AlignedCosineSimilarity,-0.494406,-0.705029,-0.687399,-0.606867,-0.829893,-0.804341,-0.478893,-0.70505,-0.668754,-0.523032,-0.784156,-0.705931,-0.485821,-0.594536,-0.654684,-0.454582,-0.605572,-0.625864
CKA,-0.491417,-0.68437,-0.688332,-0.602051,-0.821893,-0.802772,-0.604834,-0.815317,-0.80293,-0.657258,-0.903695,-0.840611,-0.367393,-0.214818,-0.459029,-0.339041,-0.217113,-0.427015
ConcentricityDifference,0.102192,0.106593,0.165442,0.161962,0.134704,0.253512,0.363123,0.546285,0.53986,0.408339,0.604903,0.598688,0.81385,0.9553,0.955258,0.781182,0.953046,0.9401
DistanceCorrelation,-0.46438,-0.655172,-0.655421,-0.565307,-0.792375,-0.765802,-0.608091,-0.81421,-0.805405,-0.657659,-0.905582,-0.841552,-0.356554,-0.272685,-0.453674,-0.327001,-0.277578,-0.42035
EigenspaceOverlapScore,-0.489677,-0.713961,-0.677148,-0.605619,-0.830569,-0.795505,-0.498344,-0.580287,-0.695839,-0.547871,-0.665981,-0.74379,-0.708849,-0.886309,-0.887684,-0.682542,-0.892117,-0.864802
Gulp,0.488205,0.713027,0.675828,0.602809,0.829105,0.79298,0.436109,0.530252,0.621216,0.482319,0.608299,0.662838,0.463831,0.409743,0.624452,0.438796,0.403046,0.593152
HardCorrelationMatch,-0.523406,-0.746359,-0.716494,-0.618149,-0.853872,-0.808571,-0.365666,-0.429009,-0.532186,-0.409944,-0.50435,-0.572619,-0.466596,-0.442217,-0.599404,-0.434337,-0.446342,-0.566279
JaccardSimilarity,-0.497574,-0.703004,-0.683402,-0.601873,-0.824198,-0.78558,-0.602157,-0.821936,-0.803491,-0.64981,-0.883104,-0.837334,-0.445275,-0.366385,-0.611193,-0.41204,-0.362234,-0.579861
LinearRegression,-0.426012,-0.553682,-0.60308,-0.509229,-0.645272,-0.703691,-0.4279,-0.599427,-0.607009,-0.45242,-0.670941,-0.629959,-0.100613,0.005919,-0.143357,-0.073896,-0.005419,-0.104285
MagnitudeDifference,0.245229,0.31046,0.375611,0.32223,0.386105,0.488033,0.203321,0.295021,0.306208,0.198261,0.270803,0.298448,0.207037,0.007953,0.310186,0.193712,-0.002602,0.287822


In [18]:
# Display the augmentation_test / cora table: one row per similarity measure,
# columns grouped by architecture, functional similarity measure
# (Disagreement, JSD) and statistic (kendalltau, pearsonr, spearmanr).
get_output_correlation_table("augmentation_test", "cora")

architecture,GAT,GAT,GAT,GAT,GAT,GAT,GCN,GCN,GCN,GCN,GCN,GCN,GraphSAGE,GraphSAGE,GraphSAGE,GraphSAGE,GraphSAGE,GraphSAGE
functional_similarity_measure,Disagreement,Disagreement,Disagreement,JSD,JSD,JSD,Disagreement,Disagreement,Disagreement,JSD,JSD,JSD,Disagreement,Disagreement,Disagreement,JSD,JSD,JSD
quality_measure,kendalltau,pearsonr,spearmanr,kendalltau,pearsonr,spearmanr,kendalltau,pearsonr,spearmanr,kendalltau,pearsonr,spearmanr,kendalltau,pearsonr,spearmanr,kendalltau,pearsonr,spearmanr
similarity_measure,Unnamed: 1_level_3,Unnamed: 2_level_3,Unnamed: 3_level_3,Unnamed: 4_level_3,Unnamed: 5_level_3,Unnamed: 6_level_3,Unnamed: 7_level_3,Unnamed: 8_level_3,Unnamed: 9_level_3,Unnamed: 10_level_3,Unnamed: 11_level_3,Unnamed: 12_level_3,Unnamed: 13_level_3,Unnamed: 14_level_3,Unnamed: 15_level_3,Unnamed: 16_level_3,Unnamed: 17_level_3,Unnamed: 18_level_3
AlignedCosineSimilarity,0.204598,0.234288,0.250005,-0.022222,-0.085014,0.042424,-0.26968,-0.444145,-0.328269,-0.288889,-0.401172,-0.369697,0.179787,0.407533,0.25532,-0.377778,-0.261401,-0.563636
CKA,0.159132,0.156891,0.152442,-0.333333,-0.4505,-0.454545,-0.179787,-0.432928,-0.267478,-0.244444,-0.544134,-0.393939,0.089893,0.173408,0.151976,-0.466667,-0.42031,-0.612121
ConcentricityDifference,-0.295531,-0.459046,-0.475619,-0.066667,-0.028583,-0.090909,0.0,0.038238,0.012158,-0.111111,-0.024804,-0.163636,0.044947,-0.030425,0.079028,-0.155556,-0.236169,-0.309091
DistanceCorrelation,0.159132,0.11588,0.152442,-0.333333,-0.476871,-0.454545,-0.224733,-0.517919,-0.291795,-0.333333,-0.596473,-0.418182,-0.044947,0.0316,-0.006079,-0.511111,-0.559428,-0.648485
EigenspaceOverlapScore,0.068199,0.01087,0.067074,-0.244444,-0.528755,-0.284848,0.179787,0.103494,0.218846,0.288889,0.322481,0.393939,-0.224733,-0.234075,-0.376901,-0.688889,-0.796131,-0.781818
Gulp,-0.113666,-0.003025,-0.07927,0.288889,0.60044,0.381818,-0.179787,-0.050501,-0.224925,-0.288889,-0.262299,-0.418182,0.314627,0.286335,0.504562,0.777778,0.85935,0.866667
HardCorrelationMatch,-0.204598,-0.398758,-0.310981,-0.288889,-0.38243,-0.357576,-0.179787,-0.524525,-0.346506,-0.244444,-0.524963,-0.357576,-0.13484,-0.152698,-0.164134,-0.422222,-0.577564,-0.612121
JaccardSimilarity,-0.113666,-0.125135,-0.140247,0.155556,0.010643,0.2,-0.6742,-0.784963,-0.741645,-0.6,-0.728129,-0.781818,0.044947,-0.05827,-0.012158,-0.6,-0.654824,-0.745455
LinearRegression,0.298712,0.270406,0.362964,0.216295,0.238555,0.307927,-0.240613,-0.375924,-0.31492,-0.22711,-0.349925,-0.307927,-0.142181,-0.232277,-0.210452,-0.551553,-0.667256,-0.697363
MagnitudeDifference,-0.340997,-0.415221,-0.451228,-0.288889,-0.193101,-0.369697,-0.044947,-0.055668,-0.036474,-0.155556,-0.141509,-0.236364,0.0,-0.130573,0.006079,-0.288889,-0.372199,-0.345455


In [19]:
# Display the augmentation_test / flickr table: one row per similarity measure,
# columns grouped by architecture, functional similarity measure
# (Disagreement, JSD) and statistic (kendalltau, pearsonr, spearmanr).
get_output_correlation_table("augmentation_test", "flickr")

architecture,GAT,GAT,GAT,GAT,GAT,GAT,GCN,GCN,GCN,GCN,GCN,GCN,GraphSAGE,GraphSAGE,GraphSAGE,GraphSAGE,GraphSAGE,GraphSAGE
functional_similarity_measure,Disagreement,Disagreement,Disagreement,JSD,JSD,JSD,Disagreement,Disagreement,Disagreement,JSD,JSD,JSD,Disagreement,Disagreement,Disagreement,JSD,JSD,JSD
quality_measure,kendalltau,pearsonr,spearmanr,kendalltau,pearsonr,spearmanr,kendalltau,pearsonr,spearmanr,kendalltau,pearsonr,spearmanr,kendalltau,pearsonr,spearmanr,kendalltau,pearsonr,spearmanr
similarity_measure,Unnamed: 1_level_3,Unnamed: 2_level_3,Unnamed: 3_level_3,Unnamed: 4_level_3,Unnamed: 5_level_3,Unnamed: 6_level_3,Unnamed: 7_level_3,Unnamed: 8_level_3,Unnamed: 9_level_3,Unnamed: 10_level_3,Unnamed: 11_level_3,Unnamed: 12_level_3,Unnamed: 13_level_3,Unnamed: 14_level_3,Unnamed: 15_level_3,Unnamed: 16_level_3,Unnamed: 17_level_3,Unnamed: 18_level_3
AlignedCosineSimilarity,-0.271691,-0.377773,-0.40112,-0.410479,-0.574452,-0.582532,-0.246544,-0.168841,-0.369278,-0.276566,-0.175408,-0.396806,-0.558819,-0.774821,-0.738477,-0.64214,-0.829531,-0.838249
CKA,-0.096064,-0.208925,-0.14908,-0.162542,-0.337277,-0.238281,-0.270939,-0.348259,-0.398087,-0.394426,-0.328926,-0.55729,-0.570329,-0.773743,-0.752002,-0.830769,-0.960698,-0.963217
ConcentricityDifference,0.187892,0.240331,0.27538,0.23398,0.255272,0.338894,0.076398,0.056254,0.121207,0.054404,0.061732,0.084828,0.028754,0.050215,0.043245,-0.067826,-0.107853,-0.100758
DistanceCorrelation,-0.22696,-0.283499,-0.338588,-0.324326,-0.447187,-0.476038,-0.199447,-0.208134,-0.293297,-0.307559,-0.215063,-0.414698,-0.583669,-0.796334,-0.765426,-0.814404,-0.953151,-0.955005
EigenspaceOverlapScore,-0.237351,-0.327099,-0.359101,-0.281695,-0.397515,-0.416631,-0.241682,-0.329432,-0.357847,-0.470502,-0.386312,-0.663211,-0.512687,-0.64903,-0.691481,-0.788004,-0.818767,-0.941336
Gulp,0.307771,0.387008,0.430528,0.478172,0.642937,0.648993,-0.012086,-0.056925,-0.019846,-0.048473,-0.108029,-0.070109,0.513758,0.649946,0.692457,0.789253,0.818863,0.941594
HardCorrelationMatch,-0.335734,-0.448182,-0.487163,-0.465596,-0.627715,-0.637693,-0.342967,-0.438603,-0.497091,-0.476031,-0.438001,-0.644055,-0.557168,-0.752962,-0.736323,-0.815117,-0.935311,-0.953469
JaccardSimilarity,-0.360129,-0.394317,-0.487002,-0.476433,-0.598656,-0.641084,-0.300107,-0.371427,-0.450981,-0.422074,-0.375958,-0.589366,-0.589781,-0.752075,-0.768382,-0.753668,-0.879063,-0.918161
LinearRegression,-0.094842,-0.097058,-0.143719,-0.18215,-0.23698,-0.260674,0.034424,-0.025315,0.05537,0.02963,-0.033827,0.058414,-0.461965,-0.658084,-0.639218,-0.724155,-0.887786,-0.903254
MagnitudeDifference,0.13201,0.160847,0.196387,0.109298,0.130463,0.170528,0.057756,-0.031929,0.086353,-0.026934,-0.080743,-0.043596,0.07377,0.119153,0.106635,0.079599,0.118734,0.114531


### CD Plots

In [34]:
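# The autorank package is required to create the critical-difference (CD) plots;
# `cd_diagram` (used below) is pulled in by the wildcard import from the private `autorank._util` module.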
from autorank import autorank, plot_stats, create_report, latex_table
from autorank._util import *
from matplotlib import pyplot as plt

In [39]:
def get_figsize(columnwidth, wf=0.5, hf=(5. ** 0.5 - 1.0) / 2.0):
    r"""Convert a LaTeX column width in points into a matplotlib figure size in inches.

    Credit: https://stackoverflow.com/a/31527287

    Parameters:
      - columnwidth [float]: width of the column in LaTeX, in points. Get this
                             from LaTeX using \showthe\columnwidth
      - wf [float]:  width of the figure as a fraction of ``columnwidth``.
      - hf [float]:  height of the figure as a fraction of the resulting
                     figure *width* (not of ``columnwidth``). The default,
                     (sqrt(5) - 1) / 2 ~= 0.618, gives golden-ratio proportions.
    Returns:
      (fig_width, fig_height) [tuple of float]: size in inches, suitable for
      matplotlib's ``figsize`` / ``Figure.set_size_inches``.
    """
    # NOTE: the docstring is a raw string because it contains LaTeX macros;
    # in a normal string "\s" and "\c" are invalid escape sequences.
    fig_width_pt = columnwidth * wf
    inches_per_pt = 1.0 / 72.27  # 72.27 TeX points per inch
    fig_width = fig_width_pt * inches_per_pt  # width in inches
    fig_height = fig_width * hf  # height in inches, relative to the width
    return fig_width, fig_height

# Base width handed to get_figsize as the column width.
PLOTS_BASE_WIDTH = 433.62  # pt
# CD plots use 1.5x the base width; the height follows get_figsize's default ratio.
PLOTS_CD_WIDTH, PLOTS_CD_HEIGHT = get_figsize(columnwidth=PLOTS_BASE_WIDTH, wf=1.5)

In [28]:
def get_autorank_df(experiments=EXPERIMENTS, datasets=DATASETS, architectures=ARCHITECTURES, quality_measure="violation_rate"):
    """Collect one quality measure across result files into an autorank-ready frame.

    For every (experiment, dataset) pair the corresponding full-results CSV is
    read from EXPERIMENT_RESULTS_PATH, tagged with its experiment name, and
    reduced to the rows whose architecture is in ``architectures`` and whose
    quality measure equals ``quality_measure``.

    Parameters:
      - experiments: iterable of experiment names (keys of COMPARISON_TYPE_DICT).
      - datasets: iterable of dataset names used to build the file names.
      - architectures: architectures to keep.
      - quality_measure [str]: the single quality measure to keep.
    Returns:
      DataFrame with one row per (experiment, representation_dataset,
      architecture) combination and one column per similarity measure; each
      cell is the mean of ``value`` over the matching rows.
    """
    kept_columns = ["similarity_measure", "quality_measure", "value", "architecture", "representation_dataset", "experiment"]

    def _load_filtered(experiment, dataset):
        # Read one result file and keep only the requested rows and columns.
        file_name = FULL_DF_FILE_NAME(experiment, COMPARISON_TYPE_DICT[experiment], dataset)
        raw = pd.read_csv(os.path.join(EXPERIMENT_RESULTS_PATH, file_name))
        raw["experiment"] = experiment
        selected = raw.loc[:, kept_columns]
        wanted = selected["architecture"].isin(architectures) & (selected["quality_measure"] == quality_measure)
        return selected.loc[wanted]

    frames = [
        _load_filtered(experiment, dataset)
        for experiment in experiments
        for dataset in datasets
    ]

    stacked = pd.concat(frames, axis=0)
    per_measure = stacked.pivot_table(
        index="similarity_measure",
        columns=["experiment", "representation_dataset", "architecture"],
        values="value",
        aggfunc="mean",
    )
    # Transpose so that similarity measures become the columns.
    return per_measure.T

In [38]:
# Build the (experiment, dataset, architecture) x similarity-measure table.
res_df = get_autorank_df()

# The values are negated before ranking.
# NOTE(review): presumably because a lower violation rate is better while
# autorank treats larger values as better by default -- confirm.
result = autorank(-res_df, alpha=0.05, verbose=False)

# Draw the CD diagram, then resize the figure it produced to the paper dimensions.
cd_diagram(result, False, None, PLOTS_CD_WIDTH)
fig = plt.gcf()
fig.set_size_inches(PLOTS_CD_WIDTH, PLOTS_CD_HEIGHT)

# Write the figure to disk and release it.
fig.savefig("cd_test.png", bbox_inches="tight")
plt.close(fig)

  if abs(sorted_ranks[i] - sorted_ranks[j]) <= critical_difference:
  plot_line([(rankpos(sorted_ranks[i]), cline),
  (rankpos(sorted_ranks[i]), chei),
  plot_line([(rankpos(sorted_ranks[i]), cline),
  (rankpos(sorted_ranks[i]), chei),
  plot_line([(rankpos(sorted_ranks[l]) - side, start),
  (rankpos(sorted_ranks[r]) + side, start)],
