In [1]:
import pandas as pd
import itertools
import os

### Results for Group Separation and Monotonicity Experiments

In [2]:
# Directory that holds the experiment result CSVs. Set the SIMILARITYBENCH_RESULTS_PATH
# environment variable to point the notebook at another machine's results directory;
# the literal below is only the fallback used when that variable is unset.
EXPERIMENT_RESULTS_PATH = os.environ.get(
    "SIMILARITYBENCH_RESULTS_PATH",
    'C:/Users/Tobias/Eigene Dokumente/Research/similaritybench/experiments/results',
)

# Maps each experiment name to the comparison type used in its result file name.
COMPARISON_TYPE_DICT = {
    "label_test": "group_separation",
    "layer_test": "monotonicity",
    "augmentation_test": "group_separation",
    "shortcut_test": "group_separation",
}

# Experiment names, in the insertion order of COMPARISON_TYPE_DICT.
EXPERIMENTS = list(COMPARISON_TYPE_DICT)
# Dataset names used to build result file names.
DATASETS = ["cora", "flickr", "ogbn-arxiv"]
# Architecture names as they appear in the "architecture" column of the result tables.
ARCHITECTURES = ["GCN", "GraphSAGE", "GAT"]

def FULL_DF_FILE_NAME(experiment, comparison_type, dataset, groups=5):
    """Build the file name of the "full" results CSV for one experiment/dataset pair.

    When ``groups`` is below 5 the name carries a ``_{groups}groups`` tag in front
    of the ``_full.csv`` suffix; for any other value the untagged name is returned.
    """
    groups_tag = f"_{groups}groups" if groups < 5 else ""
    return f"{experiment}_{comparison_type}_{dataset}{groups_tag}_full.csv"

In [3]:
def get_pivot_table(experiment, dataset, groups=5):
    """Load the full results CSV of one experiment/dataset and pivot it by similarity measure.

    Parameters
    ----------
    experiment : str
        Key of ``COMPARISON_TYPE_DICT``; it also selects the comparison type used
        in the file name.
    dataset : str
        Dataset name used in the file name.
    groups : int, default 5
        Forwarded to ``FULL_DF_FILE_NAME`` to select the results file, matching
        the parameter of ``get_agg_pivot_table``.

    Returns
    -------
    pandas.DataFrame
        One row per ``similarity_measure`` and one column per
        (``representation_dataset``, ``architecture``, ``quality_measure``)
        combination, filled with ``value``.

    Raises
    ------
    KeyError
        If ``experiment`` is not in ``COMPARISON_TYPE_DICT`` or an expected
        column is missing from the CSV.
    ValueError
        Raised by ``DataFrame.pivot`` when an index/column combination occurs
        more than once; use ``get_agg_pivot_table`` to average such duplicates.
    """
    file_name = FULL_DF_FILE_NAME(experiment, COMPARISON_TYPE_DICT[experiment], dataset, groups)
    df = pd.read_csv(os.path.join(EXPERIMENT_RESULTS_PATH, file_name))

    data = df.loc[:, ["similarity_measure", "quality_measure", "value", "architecture", "representation_dataset"]]
    return data.pivot(
        index="similarity_measure",
        columns=["representation_dataset", "architecture", "quality_measure"],
        values="value",
    )

In [4]:
def get_agg_pivot_table(experiment, datasets, groups=5):
    """Combine the full results CSVs of several datasets into one averaged pivot table.

    Parameters
    ----------
    experiment : str
        Key of ``COMPARISON_TYPE_DICT``; it also selects the comparison type used
        in the file names.
    datasets : iterable of str, or str
        Dataset names whose result files are read and stacked. A single name
        given as a plain string is treated as a one-element list.
    groups : int, default 5
        Forwarded to ``FULL_DF_FILE_NAME`` to select the results files.

    Returns
    -------
    pandas.DataFrame
        One row per ``similarity_measure`` and one column per
        (``representation_dataset``, ``architecture``, ``quality_measure``)
        combination; repeated combinations are reduced with the mean of ``value``.

    Raises
    ------
    ValueError
        If ``datasets`` is empty.
    KeyError
        If ``experiment`` is not in ``COMPARISON_TYPE_DICT`` or an expected
        column is missing from a CSV.
    """
    # A bare string would otherwise be iterated character by character.
    dataset_names = [datasets] if isinstance(datasets, str) else list(datasets)
    if not dataset_names:
        raise ValueError("datasets must contain at least one dataset name")

    comparison_type = COMPARISON_TYPE_DICT[experiment]
    columns = ["similarity_measure", "quality_measure", "value", "architecture", "representation_dataset"]
    frames = [
        pd.read_csv(
            os.path.join(EXPERIMENT_RESULTS_PATH, FULL_DF_FILE_NAME(experiment, comparison_type, name, groups))
        ).loc[:, columns]
        for name in dataset_names
    ]

    combined = pd.concat(frames, axis=0)
    return combined.pivot_table(
        index="similarity_measure",
        columns=["representation_dataset", "architecture", "quality_measure"],
        values="value",
        aggfunc="mean",
    )

In [5]:
# Mean label_test scores per similarity measure for all three datasets (default groups=5).
get_agg_pivot_table(
    experiment="label_test",
    datasets=["cora", "flickr", "ogbn-arxiv"],
)

representation_dataset,cora,cora,cora,cora,cora,cora,flickr,flickr,flickr,flickr,flickr,flickr,ogbn-arxiv,ogbn-arxiv,ogbn-arxiv,ogbn-arxiv,ogbn-arxiv,ogbn-arxiv
architecture,GAT,GAT,GCN,GCN,GraphSAGE,GraphSAGE,GAT,GAT,GCN,GCN,GraphSAGE,GraphSAGE,GAT,GAT,GCN,GCN,GraphSAGE,GraphSAGE
quality_measure,AUPRC,violation_rate,AUPRC,violation_rate,AUPRC,violation_rate,AUPRC,violation_rate,AUPRC,violation_rate,AUPRC,violation_rate,AUPRC,violation_rate,AUPRC,violation_rate,AUPRC,violation_rate
similarity_measure,Unnamed: 1_level_3,Unnamed: 2_level_3,Unnamed: 3_level_3,Unnamed: 4_level_3,Unnamed: 5_level_3,Unnamed: 6_level_3,Unnamed: 7_level_3,Unnamed: 8_level_3,Unnamed: 9_level_3,Unnamed: 10_level_3,Unnamed: 11_level_3,Unnamed: 12_level_3,Unnamed: 13_level_3,Unnamed: 14_level_3,Unnamed: 15_level_3,Unnamed: 16_level_3,Unnamed: 17_level_3,Unnamed: 18_level_3
AlignedCosineSimilarity,0.278104,0.4274,0.288519,0.4144,0.286776,0.3894,0.183,0.3986,0.512503,0.1452,0.27535,0.4924,0.458743,0.1956,0.46719,0.1984,0.463974,0.3484
CKA,0.274075,0.489,0.27332,0.477,0.27427,0.4728,0.141352,0.4304,0.444654,0.1416,0.414902,0.2218,0.728493,0.0528,0.845622,0.0208,0.800192,0.0264
ConcentricityDifference,0.212224,0.36,0.130831,0.495,0.197968,0.328,0.155735,0.43,0.217569,0.3468,0.234506,0.245,0.505337,0.1244,0.517715,0.1438,0.543354,0.1188
DistanceCorrelation,0.274465,0.4788,0.279556,0.427,0.286791,0.3972,0.116486,0.4538,0.490598,0.1226,0.307658,0.3542,0.722406,0.0606,0.803678,0.0308,0.822388,0.03
EigenspaceOverlapScore,0.132407,0.4564,0.159799,0.4566,0.167978,0.4802,0.122764,0.4708,0.268285,0.4872,0.284428,0.4264,0.222376,0.5052,0.17005,0.4862,0.276237,0.4742
Gulp,0.133022,0.45,0.159822,0.4478,0.168366,0.4784,0.117774,0.4446,0.106238,0.4938,0.284515,0.4282,0.196729,0.4764,0.193893,0.503,0.276737,0.4678
HardCorrelationMatch,0.270146,0.4996,0.271684,0.4832,0.273245,0.4738,0.191036,0.3742,0.388817,0.1482,0.332226,0.2882,0.33392,0.3244,0.520203,0.1628,0.515477,0.1518
JaccardSimilarity,0.27443,0.4624,0.272676,0.4754,0.273044,0.4904,0.131045,0.439,0.325568,0.2498,0.296303,0.3712,0.3849,0.2034,0.565453,0.1096,0.282764,0.4858
LinearRegression,0.285519,0.3986,0.282033,0.411,0.284103,0.4294,0.124955,0.4824,0.129515,0.53,0.326034,0.3,0.297404,0.4372,0.279106,0.431,0.366826,0.3302
MagnitudeDifference,0.185056,0.3594,0.119458,0.5024,0.133759,0.4004,0.110165,0.509,0.410339,0.1926,0.273394,0.214,0.171858,0.3546,0.270191,0.299,0.198566,0.332


In [7]:
# get_agg_pivot_table("label_test", ["cora", "flickr", "ogbn-arxiv"], groups=3)

In [None]:
# get_agg_pivot_table("label_test", ["cora", "flickr", "ogbn-arxiv"], groups=2)

In [6]:
# Mean layer_test (comparison type "monotonicity") scores for all three datasets.
get_agg_pivot_table(
    experiment="layer_test",
    datasets=["cora", "flickr", "ogbn-arxiv"],
)

representation_dataset,cora,cora,cora,cora,cora,cora,flickr,flickr,flickr,flickr,flickr,flickr,ogbn-arxiv,ogbn-arxiv,ogbn-arxiv,ogbn-arxiv,ogbn-arxiv,ogbn-arxiv
architecture,GAT,GAT,GCN,GCN,GraphSAGE,GraphSAGE,GAT,GAT,GCN,GCN,GraphSAGE,GraphSAGE,GAT,GAT,GCN,GCN,GraphSAGE,GraphSAGE
quality_measure,correlation,violation_rate,correlation,violation_rate,correlation,violation_rate,correlation,violation_rate,correlation,violation_rate,correlation,violation_rate,correlation,violation_rate,correlation,violation_rate,correlation,violation_rate
similarity_measure,Unnamed: 1_level_3,Unnamed: 2_level_3,Unnamed: 3_level_3,Unnamed: 4_level_3,Unnamed: 5_level_3,Unnamed: 6_level_3,Unnamed: 7_level_3,Unnamed: 8_level_3,Unnamed: 9_level_3,Unnamed: 10_level_3,Unnamed: 11_level_3,Unnamed: 12_level_3,Unnamed: 13_level_3,Unnamed: 14_level_3,Unnamed: 15_level_3,Unnamed: 16_level_3,Unnamed: 17_level_3,Unnamed: 18_level_3
AlignedCosineSimilarity,0.782823,0.107143,0.962483,0.044048,0.846429,0.094048,0.483333,0.279762,0.507279,0.392857,0.727347,0.195238,0.50915,0.222619,0.924082,0.091667,0.589252,0.259524
CKA,0.983435,0.028571,0.959354,0.057143,0.991667,0.015476,0.52432,0.265476,0.38619,0.338095,0.875918,0.115476,0.870986,0.114286,0.808435,0.107143,0.959252,0.064286
ConcentricityDifference,0.612075,0.122619,0.787925,0.142857,0.021088,0.482143,0.623742,0.186905,0.381701,0.457143,0.015918,0.488095,0.392666,0.236905,0.524626,0.35119,0.393197,0.416667
DistanceCorrelation,0.990578,0.016667,0.99949,0.00119,0.99966,0.00119,0.493435,0.270238,0.615374,0.230952,0.977585,0.025,0.871327,0.103571,0.785204,0.138095,0.932721,0.096429
EigenspaceOverlapScore,1.0,0.0,1.0,0.0,1.0,0.0,0.80646,0.084524,0.983333,0.022619,0.953231,0.021429,0.916167,0.061905,0.783163,0.054762,0.98534,0.016667
Gulp,0.924694,0.022619,0.959966,0.019048,1.0,0.0,0.414456,0.359524,0.539796,0.271429,0.815714,0.077381,0.49915,0.291667,0.827313,0.109524,0.995578,0.011905
HardCorrelationMatch,0.902415,0.065476,0.937143,0.041667,0.947925,0.058333,0.651122,0.179762,0.524966,0.270238,0.74898,0.194048,0.940408,0.072619,0.914048,0.089286,0.874796,0.127381
JaccardSimilarity,0.998299,0.005952,1.0,0.0,0.99966,0.00119,0.918776,0.086905,0.957279,0.021429,0.970068,0.044048,0.979932,0.022619,0.988265,0.022619,0.957483,0.064286
LinearRegression,0.706701,0.113095,0.886088,0.033333,1.0,0.0,0.198537,0.425,0.265306,0.390476,0.8,0.05119,0.224286,0.388095,0.997449,0.008333,0.99932,0.002381
MagnitudeDifference,0.930408,0.079762,0.444524,0.377381,0.543299,0.360714,0.546395,0.371429,0.608639,0.320238,0.296565,0.390476,0.410102,0.294048,0.573163,0.292857,0.679388,0.152381


In [7]:
# Mean shortcut_test scores per similarity measure for all three datasets (default groups=5).
get_agg_pivot_table(
    experiment="shortcut_test",
    datasets=["cora", "flickr", "ogbn-arxiv"],
)

representation_dataset,cora,cora,cora,cora,cora,cora,flickr,flickr,flickr,flickr,flickr,flickr,ogbn-arxiv,ogbn-arxiv,ogbn-arxiv,ogbn-arxiv,ogbn-arxiv,ogbn-arxiv
architecture,GAT,GAT,GCN,GCN,GraphSAGE,GraphSAGE,GAT,GAT,GCN,GCN,GraphSAGE,GraphSAGE,GAT,GAT,GCN,GCN,GraphSAGE,GraphSAGE
quality_measure,AUPRC,violation_rate,AUPRC,violation_rate,AUPRC,violation_rate,AUPRC,violation_rate,AUPRC,violation_rate,AUPRC,violation_rate,AUPRC,violation_rate,AUPRC,violation_rate,AUPRC,violation_rate
similarity_measure,Unnamed: 1_level_3,Unnamed: 2_level_3,Unnamed: 3_level_3,Unnamed: 4_level_3,Unnamed: 5_level_3,Unnamed: 6_level_3,Unnamed: 7_level_3,Unnamed: 8_level_3,Unnamed: 9_level_3,Unnamed: 10_level_3,Unnamed: 11_level_3,Unnamed: 12_level_3,Unnamed: 13_level_3,Unnamed: 14_level_3,Unnamed: 15_level_3,Unnamed: 16_level_3,Unnamed: 17_level_3,Unnamed: 18_level_3
AlignedCosineSimilarity,0.116701,0.4952,0.144859,0.4022,0.210714,0.2494,0.35997,0.338,0.299808,0.2008,0.527227,0.0864,0.566886,0.1088,0.383656,0.1406,0.944316,0.0084
CKA,0.226215,0.4034,0.134421,0.4016,0.303313,0.198,0.117855,0.4684,0.123737,0.4634,0.46545,0.1062,0.579315,0.0796,0.444151,0.1314,0.873149,0.0322
ConcentricityDifference,0.095087,0.5468,0.151224,0.5348,0.094332,0.573,0.154738,0.3804,0.137792,0.522,0.458561,0.1086,0.391127,0.1934,0.303171,0.327,0.711618,0.0552
DistanceCorrelation,0.221667,0.4104,0.142364,0.3862,0.370273,0.177,0.128919,0.4312,0.175935,0.33,0.460491,0.1126,0.564012,0.0904,0.44317,0.132,0.884731,0.0266
EigenspaceOverlapScore,0.084755,0.5932,0.107221,0.4662,0.187584,0.3808,0.281368,0.404,0.140166,0.3292,0.319582,0.2624,0.411037,0.1702,0.244117,0.2108,0.527321,0.0588
Gulp,0.08826,0.5852,0.103083,0.4828,0.187679,0.3768,0.16114,0.356,0.110683,0.533,0.277657,0.4064,0.411573,0.1682,0.225199,0.2304,0.462335,0.103
HardCorrelationMatch,0.107221,0.4652,0.095984,0.5066,0.180108,0.2854,0.332267,0.2788,0.208394,0.2648,0.546456,0.0892,0.442824,0.1052,0.216439,0.2564,0.703211,0.0278
JaccardSimilarity,0.172286,0.346,0.144966,0.3994,0.346899,0.2174,0.308633,0.285,0.430379,0.119,0.385761,0.1678,0.508573,0.1324,0.455164,0.1236,0.971198,0.0032
LinearRegression,0.157208,0.418,0.13934,0.4376,0.363778,0.175,0.159012,0.4262,0.192686,0.3388,0.356119,0.2138,0.500928,0.1018,0.343531,0.2012,0.561853,0.069
MagnitudeDifference,0.091114,0.5432,0.137015,0.5326,0.090777,0.5716,0.13329,0.4308,0.127935,0.4626,0.569959,0.1374,0.383388,0.1804,0.162774,0.3482,0.296801,0.1894


In [8]:
# Same shortcut_test table, read from the "_3groups" result files.
get_agg_pivot_table(
    experiment="shortcut_test",
    datasets=["cora", "flickr", "ogbn-arxiv"],
    groups=3,
)

representation_dataset,cora,cora,cora,cora,cora,cora,flickr,flickr,flickr,flickr,flickr,flickr,ogbn-arxiv,ogbn-arxiv,ogbn-arxiv,ogbn-arxiv,ogbn-arxiv,ogbn-arxiv
architecture,GAT,GAT,GCN,GCN,GraphSAGE,GraphSAGE,GAT,GAT,GCN,GCN,GraphSAGE,GraphSAGE,GAT,GAT,GCN,GCN,GraphSAGE,GraphSAGE
quality_measure,AUPRC,violation_rate,AUPRC,violation_rate,AUPRC,violation_rate,AUPRC,violation_rate,AUPRC,violation_rate,AUPRC,violation_rate,AUPRC,violation_rate,AUPRC,violation_rate,AUPRC,violation_rate
similarity_measure,Unnamed: 1_level_3,Unnamed: 2_level_3,Unnamed: 3_level_3,Unnamed: 4_level_3,Unnamed: 5_level_3,Unnamed: 6_level_3,Unnamed: 7_level_3,Unnamed: 8_level_3,Unnamed: 9_level_3,Unnamed: 10_level_3,Unnamed: 11_level_3,Unnamed: 12_level_3,Unnamed: 13_level_3,Unnamed: 14_level_3,Unnamed: 15_level_3,Unnamed: 16_level_3,Unnamed: 17_level_3,Unnamed: 18_level_3
AlignedCosineSimilarity,0.302898,0.411333,0.318647,0.305333,0.598752,0.118667,0.479826,0.231333,0.894714,0.019333,1.0,0.0,1.0,0.0,1.0,0.0,1.0,0.0
CKA,0.46266,0.364,0.272784,0.338667,0.776866,0.096667,0.330272,0.348,0.281582,0.428,1.0,0.0,1.0,0.0,1.0,0.0,0.981104,0.004
ConcentricityDifference,0.204222,0.502,0.182471,0.532,0.168895,0.573333,0.324453,0.392667,0.182249,0.503333,0.176244,0.536667,1.0,0.0,0.814892,0.036667,0.961912,0.009333
DistanceCorrelation,0.459166,0.378,0.283945,0.312,0.819571,0.084,0.31707,0.282,0.332822,0.313333,1.0,0.0,1.0,0.0,1.0,0.0,0.994444,0.001333
EigenspaceOverlapScore,0.163367,0.575333,0.216938,0.426,0.495157,0.26,0.544425,0.190667,0.460572,0.128,0.432888,0.4,0.968069,0.007333,1.0,0.0,0.724314,0.166667
Gulp,0.172056,0.560667,0.197004,0.474667,0.495904,0.260667,0.451336,0.189333,0.196031,0.508,0.432888,0.4,0.964558,0.008667,0.985766,0.002667,0.724314,0.166667
HardCorrelationMatch,0.219276,0.418667,0.200268,0.441333,0.347125,0.232,0.518523,0.192,0.549104,0.171333,1.0,0.0,0.834909,0.030667,0.798304,0.038667,0.724314,0.166667
JaccardSimilarity,0.379688,0.286,0.305227,0.303333,0.782344,0.070667,0.544567,0.16,1.0,0.0,0.827864,0.037333,1.0,0.0,1.0,0.0,1.0,0.0
LinearRegression,0.333709,0.376,0.299139,0.383333,0.741737,0.053333,0.356838,0.277333,0.365108,0.297333,0.609064,0.188667,1.0,0.0,1.0,0.0,1.0,0.0
MagnitudeDifference,0.187117,0.511333,0.267258,0.519333,0.151357,0.585333,0.197894,0.523333,0.265917,0.330667,0.782998,0.114,1.0,0.0,0.549767,0.18,0.534647,0.176


In [9]:
# Same shortcut_test table, read from the "_2groups" result files.
get_agg_pivot_table(
    experiment="shortcut_test",
    datasets=["cora", "flickr", "ogbn-arxiv"],
    groups=2,
)

representation_dataset,cora,cora,cora,cora,cora,cora,flickr,flickr,flickr,flickr,flickr,flickr,ogbn-arxiv,ogbn-arxiv,ogbn-arxiv,ogbn-arxiv,ogbn-arxiv,ogbn-arxiv
architecture,GAT,GAT,GCN,GCN,GraphSAGE,GraphSAGE,GAT,GAT,GCN,GCN,GraphSAGE,GraphSAGE,GAT,GAT,GCN,GCN,GraphSAGE,GraphSAGE
quality_measure,AUPRC,violation_rate,AUPRC,violation_rate,AUPRC,violation_rate,AUPRC,violation_rate,AUPRC,violation_rate,AUPRC,violation_rate,AUPRC,violation_rate,AUPRC,violation_rate,AUPRC,violation_rate
similarity_measure,Unnamed: 1_level_3,Unnamed: 2_level_3,Unnamed: 3_level_3,Unnamed: 4_level_3,Unnamed: 5_level_3,Unnamed: 6_level_3,Unnamed: 7_level_3,Unnamed: 8_level_3,Unnamed: 9_level_3,Unnamed: 10_level_3,Unnamed: 11_level_3,Unnamed: 12_level_3,Unnamed: 13_level_3,Unnamed: 14_level_3,Unnamed: 15_level_3,Unnamed: 16_level_3,Unnamed: 17_level_3,Unnamed: 18_level_3
AlignedCosineSimilarity,0.66533,0.222,0.874622,0.06,0.990455,0.004,0.742882,0.144,1.0,0.0,1.0,0.0,1.0,0.0,1.0,0.0,1.0,0.0
CKA,0.705339,0.248,0.722758,0.164,1.0,0.0,0.657604,0.268,0.508512,0.366,1.0,0.0,1.0,0.0,1.0,0.0,1.0,0.0
ConcentricityDifference,0.314367,0.488,0.281132,0.572,0.312316,0.56,0.489947,0.424,0.349786,0.47,0.35855,0.522,1.0,0.0,1.0,0.0,1.0,0.0
DistanceCorrelation,0.69799,0.258,0.809019,0.13,1.0,0.0,0.599373,0.184,0.684121,0.214,1.0,0.0,1.0,0.0,1.0,0.0,1.0,0.0
EigenspaceOverlapScore,0.312005,0.534,0.424569,0.298,0.945988,0.02,0.917832,0.03,1.0,0.0,0.586471,0.5,1.0,0.0,1.0,0.0,1.0,0.0
Gulp,0.323929,0.522,0.350839,0.384,0.937426,0.024,0.964513,0.014,0.35089,0.472,0.586471,0.5,1.0,0.0,1.0,0.0,1.0,0.0
HardCorrelationMatch,0.435479,0.262,0.424195,0.306,1.0,0.0,0.991667,0.004,1.0,0.0,1.0,0.0,1.0,0.0,1.0,0.0,1.0,0.0
JaccardSimilarity,0.814496,0.056,0.833766,0.076,1.0,0.0,1.0,0.0,1.0,0.0,1.0,0.0,1.0,0.0,1.0,0.0,1.0,0.0
LinearRegression,0.663351,0.226,0.662758,0.2,1.0,0.0,0.568894,0.176,0.529696,0.298,0.827126,0.066,1.0,0.0,1.0,0.0,1.0,0.0
MagnitudeDifference,0.297931,0.51,0.484281,0.53,0.263754,0.58,0.325976,0.538,0.655344,0.132,1.0,0.0,1.0,0.0,1.0,0.0,1.0,0.0


In [10]:
# Mean augmentation_test scores per similarity measure for all three datasets (default groups=5).
get_agg_pivot_table(
    experiment="augmentation_test",
    datasets=["cora", "flickr", "ogbn-arxiv"],
)

representation_dataset,cora,cora,cora,cora,cora,cora,flickr,flickr,flickr,flickr,flickr,flickr,ogbn-arxiv,ogbn-arxiv,ogbn-arxiv,ogbn-arxiv,ogbn-arxiv,ogbn-arxiv
architecture,GAT,GAT,GCN,GCN,GraphSAGE,GraphSAGE,GAT,GAT,GCN,GCN,GraphSAGE,GraphSAGE,GAT,GAT,GCN,GCN,GraphSAGE,GraphSAGE
quality_measure,AUPRC,violation_rate,AUPRC,violation_rate,AUPRC,violation_rate,AUPRC,violation_rate,AUPRC,violation_rate,AUPRC,violation_rate,AUPRC,violation_rate,AUPRC,violation_rate,AUPRC,violation_rate
similarity_measure,Unnamed: 1_level_3,Unnamed: 2_level_3,Unnamed: 3_level_3,Unnamed: 4_level_3,Unnamed: 5_level_3,Unnamed: 6_level_3,Unnamed: 7_level_3,Unnamed: 8_level_3,Unnamed: 9_level_3,Unnamed: 10_level_3,Unnamed: 11_level_3,Unnamed: 12_level_3,Unnamed: 13_level_3,Unnamed: 14_level_3,Unnamed: 15_level_3,Unnamed: 16_level_3,Unnamed: 17_level_3,Unnamed: 18_level_3
AlignedCosineSimilarity,0.318522,0.1632,0.207385,0.3348,0.312604,0.2764,0.446083,0.1934,0.778233,0.0486,0.268233,0.1868,0.666762,0.0694,0.314428,0.1524,0.170511,0.5114
CKA,0.4606,0.1036,0.317196,0.2336,0.333912,0.2136,0.265392,0.2368,0.709564,0.072,0.344698,0.1488,0.624002,0.0804,0.601516,0.0738,0.641648,0.0486
ConcentricityDifference,0.295782,0.272,0.104738,0.4934,0.302124,0.3558,0.256244,0.2692,0.207509,0.342,0.177893,0.3868,0.28711,0.2508,0.176589,0.2992,0.247733,0.2402
DistanceCorrelation,0.459842,0.0962,0.379922,0.203,0.336485,0.2138,0.335817,0.1934,0.712017,0.0636,0.37051,0.1694,0.64295,0.0744,0.590567,0.0792,0.630703,0.058
EigenspaceOverlapScore,0.13624,0.3412,0.28167,0.276,0.323527,0.233,0.30242,0.3024,0.39682,0.1648,0.230607,0.3414,0.465295,0.093,0.370129,0.1654,0.175369,0.4192
Gulp,0.13772,0.3356,0.208459,0.3316,0.32573,0.2248,0.461513,0.1608,0.120003,0.4862,0.237659,0.3358,0.502276,0.1018,0.147723,0.357,0.176144,0.415
HardCorrelationMatch,0.27659,0.32,0.24261,0.2794,0.321632,0.2398,0.44405,0.168,0.690223,0.0724,0.304996,0.2224,0.183786,0.3892,0.13938,0.502,0.147947,0.4236
JaccardSimilarity,0.473244,0.0814,0.377175,0.1826,0.35417,0.182,0.538607,0.1342,0.845712,0.0346,0.45899,0.1526,0.757831,0.0314,0.565698,0.0526,0.43893,0.1136
LinearRegression,0.406563,0.1034,0.457112,0.0962,0.379176,0.1488,0.284078,0.2612,0.18614,0.4664,0.345037,0.2196,0.495116,0.0976,0.228578,0.2646,0.205284,0.2784
MagnitudeDifference,0.347075,0.2624,0.128169,0.4514,0.172646,0.3912,0.270037,0.342,0.459951,0.165,0.094245,0.5398,0.392566,0.1638,0.403656,0.1916,0.994667,0.0006


In [13]:
# get_agg_pivot_table("augmentation_test", ["cora", "flickr", "ogbn-arxiv"], groups=3)

In [11]:
# Same augmentation_test table, read from the "_2groups" result files.
get_agg_pivot_table(
    experiment="augmentation_test",
    datasets=["cora", "flickr", "ogbn-arxiv"],
    groups=2,
)

representation_dataset,cora,cora,cora,cora,cora,cora,flickr,flickr,flickr,flickr,flickr,flickr,ogbn-arxiv,ogbn-arxiv,ogbn-arxiv,ogbn-arxiv,ogbn-arxiv,ogbn-arxiv
architecture,GAT,GAT,GCN,GCN,GraphSAGE,GraphSAGE,GAT,GAT,GCN,GCN,GraphSAGE,GraphSAGE,GAT,GAT,GCN,GCN,GraphSAGE,GraphSAGE
quality_measure,AUPRC,violation_rate,AUPRC,violation_rate,AUPRC,violation_rate,AUPRC,violation_rate,AUPRC,violation_rate,AUPRC,violation_rate,AUPRC,violation_rate,AUPRC,violation_rate,AUPRC,violation_rate
similarity_measure,Unnamed: 1_level_3,Unnamed: 2_level_3,Unnamed: 3_level_3,Unnamed: 4_level_3,Unnamed: 5_level_3,Unnamed: 6_level_3,Unnamed: 7_level_3,Unnamed: 8_level_3,Unnamed: 9_level_3,Unnamed: 10_level_3,Unnamed: 11_level_3,Unnamed: 12_level_3,Unnamed: 13_level_3,Unnamed: 14_level_3,Unnamed: 15_level_3,Unnamed: 16_level_3,Unnamed: 17_level_3,Unnamed: 18_level_3
AlignedCosineSimilarity,1.0,0.0,0.978916,0.01,0.990455,0.004,0.898626,0.048,1.0,0.0,1.0,0.0,1.0,0.0,1.0,0.0,0.593087,0.438
CKA,1.0,0.0,1.0,0.0,1.0,0.0,0.827348,0.108,0.995455,0.002,1.0,0.0,1.0,0.0,1.0,0.0,1.0,0.0
ConcentricityDifference,0.90603,0.05,0.306338,0.474,0.87978,0.088,0.807932,0.208,0.882173,0.066,0.51673,0.248,0.784275,0.108,0.899343,0.05,0.988462,0.006
DistanceCorrelation,1.0,0.0,1.0,0.0,1.0,0.0,0.924142,0.042,1.0,0.0,1.0,0.0,1.0,0.0,1.0,0.0,1.0,0.0
EigenspaceOverlapScore,0.995455,0.002,0.995455,0.002,1.0,0.0,0.671069,0.186,0.946245,0.03,1.0,0.0,1.0,0.0,1.0,0.0,1.0,0.0
Gulp,0.995455,0.002,0.808423,0.08,1.0,0.0,1.0,0.0,0.360461,0.44,1.0,0.0,1.0,0.0,0.796613,0.074,1.0,0.0
HardCorrelationMatch,0.985714,0.008,1.0,0.0,1.0,0.0,0.990455,0.004,1.0,0.0,1.0,0.0,0.995455,0.002,0.586471,0.5,1.0,0.0
JaccardSimilarity,1.0,0.0,1.0,0.0,1.0,0.0,1.0,0.0,1.0,0.0,1.0,0.0,1.0,0.0,1.0,0.0,1.0,0.0
LinearRegression,1.0,0.0,1.0,0.0,1.0,0.0,0.753612,0.132,0.346558,0.476,1.0,0.0,1.0,0.0,1.0,0.0,1.0,0.0
MagnitudeDifference,1.0,0.0,0.360337,0.516,0.447093,0.298,0.626781,0.308,1.0,0.0,0.320304,0.546,1.0,0.0,1.0,0.0,1.0,0.0


### Results of Output Correlations

In [11]:
def get_output_correlation_table(experiment, dataset):
    """Pivot the output-correlation results of one experiment/dataset by similarity measure.

    Reads the CSV whose name ``FULL_DF_FILE_NAME`` builds for the
    ``"output_correlation"`` comparison type and returns a table with one row
    per ``similarity_measure`` and one column per (``architecture``,
    ``functional_similarity_measure``, ``quality_measure``) combination.
    Repeated combinations are reduced with the mean of ``corr``.
    """
    file_name = FULL_DF_FILE_NAME(experiment, "output_correlation", dataset)
    correlations = pd.read_csv(os.path.join(EXPERIMENT_RESULTS_PATH, file_name))

    selected = correlations[
        ["similarity_measure", "functional_similarity_measure", "quality_measure", "corr", "architecture"]
    ]
    column_levels = ["architecture", "functional_similarity_measure", "quality_measure"]
    return selected.pivot_table(
        index="similarity_measure",
        columns=column_levels,
        values="corr",
        aggfunc="mean",
    )

In [12]:
# Output-correlation table for label_test on cora.
get_output_correlation_table(experiment="label_test", dataset="cora")

architecture,GAT,GAT,GAT,GAT,GAT,GAT,GCN,GCN,GCN,GCN,GCN,GCN,GraphSAGE,GraphSAGE,GraphSAGE,GraphSAGE,GraphSAGE,GraphSAGE
functional_similarity_measure,Disagreement,Disagreement,Disagreement,JSD,JSD,JSD,Disagreement,Disagreement,Disagreement,JSD,JSD,JSD,Disagreement,Disagreement,Disagreement,JSD,JSD,JSD
quality_measure,kendalltau,pearsonr,spearmanr,kendalltau,pearsonr,spearmanr,kendalltau,pearsonr,spearmanr,kendalltau,pearsonr,spearmanr,kendalltau,pearsonr,spearmanr,kendalltau,pearsonr,spearmanr
similarity_measure,Unnamed: 1_level_3,Unnamed: 2_level_3,Unnamed: 3_level_3,Unnamed: 4_level_3,Unnamed: 5_level_3,Unnamed: 6_level_3,Unnamed: 7_level_3,Unnamed: 8_level_3,Unnamed: 9_level_3,Unnamed: 10_level_3,Unnamed: 11_level_3,Unnamed: 12_level_3,Unnamed: 13_level_3,Unnamed: 14_level_3,Unnamed: 15_level_3,Unnamed: 16_level_3,Unnamed: 17_level_3,Unnamed: 18_level_3
AlignedCosineSimilarity,-0.509585,-0.916551,-0.670872,-0.535206,-0.884646,-0.688909,-0.379181,-0.810322,-0.525891,-0.371817,-0.793789,-0.516602,-0.412152,-0.898169,-0.574975,-0.443389,-0.83809,-0.610212
CKA,-0.473548,-0.900428,-0.617185,-0.448027,-0.857739,-0.601184,-0.479349,-0.892242,-0.643784,-0.464571,-0.869538,-0.6297,-0.42791,-0.915825,-0.596623,-0.381761,-0.848918,-0.55253
ConcentricityDifference,-0.1059,-0.204555,-0.163648,-0.07728,-0.164305,-0.122245,-0.035688,-0.075679,-0.054454,-0.005663,-0.038142,-0.008911,0.073547,0.138064,0.10538,0.063724,0.174908,0.090975
DistanceCorrelation,-0.468591,-0.923049,-0.611785,-0.45311,-0.880671,-0.603781,-0.500508,-0.915534,-0.668181,-0.511349,-0.897737,-0.678854,-0.392152,-0.922677,-0.555918,-0.468049,-0.872551,-0.630083
EigenspaceOverlapScore,-0.272375,-0.448225,-0.397818,-0.301583,-0.47892,-0.436154,-0.333739,-0.65612,-0.476177,-0.323255,-0.645285,-0.467559,-0.452374,-0.885703,-0.618154,-0.45146,-0.835498,-0.619921
Gulp,0.261033,0.439794,0.382707,0.28981,0.469977,0.421743,0.3299,0.653494,0.474486,0.332352,0.649085,0.480472,0.45474,0.885594,0.619666,0.460691,0.837419,0.628334
HardCorrelationMatch,-0.488105,-0.919895,-0.629989,-0.460468,-0.876687,-0.612355,-0.474618,-0.916649,-0.639947,-0.453556,-0.894043,-0.617839,-0.451972,-0.93031,-0.614179,-0.380647,-0.856009,-0.550111
JaccardSimilarity,-0.534502,-0.764992,-0.697462,-0.535964,-0.728527,-0.697987,-0.498901,-0.853067,-0.666494,-0.460245,-0.825347,-0.624777,-0.461748,-0.857814,-0.623993,-0.364727,-0.786898,-0.522653
LinearRegression,-0.438986,-0.83875,-0.598718,-0.424974,-0.785515,-0.577432,-0.356597,-0.767644,-0.491908,-0.335762,-0.736117,-0.464767,-0.434756,-0.864312,-0.590146,-0.380986,-0.768851,-0.518028
MagnitudeDifference,-0.12537,-0.230291,-0.185317,-0.098729,-0.198162,-0.149061,0.012878,0.015327,0.018682,0.031349,0.034729,0.048306,0.048726,0.143004,0.067037,0.036254,0.126279,0.045031


In [13]:
# Output-correlation table for label_test on flickr.
get_output_correlation_table(experiment="label_test", dataset="flickr")

architecture,GAT,GAT,GAT,GAT,GAT,GAT,GCN,GCN,GCN,GCN,GCN,GCN,GraphSAGE,GraphSAGE,GraphSAGE,GraphSAGE,GraphSAGE,GraphSAGE
functional_similarity_measure,Disagreement,Disagreement,Disagreement,JSD,JSD,JSD,Disagreement,Disagreement,Disagreement,JSD,JSD,JSD,Disagreement,Disagreement,Disagreement,JSD,JSD,JSD
quality_measure,kendalltau,pearsonr,spearmanr,kendalltau,pearsonr,spearmanr,kendalltau,pearsonr,spearmanr,kendalltau,pearsonr,spearmanr,kendalltau,pearsonr,spearmanr,kendalltau,pearsonr,spearmanr
similarity_measure,Unnamed: 1_level_3,Unnamed: 2_level_3,Unnamed: 3_level_3,Unnamed: 4_level_3,Unnamed: 5_level_3,Unnamed: 6_level_3,Unnamed: 7_level_3,Unnamed: 8_level_3,Unnamed: 9_level_3,Unnamed: 10_level_3,Unnamed: 11_level_3,Unnamed: 12_level_3,Unnamed: 13_level_3,Unnamed: 14_level_3,Unnamed: 15_level_3,Unnamed: 16_level_3,Unnamed: 17_level_3,Unnamed: 18_level_3
AlignedCosineSimilarity,-0.075699,-0.117805,-0.106484,-0.082096,-0.083086,-0.119403,-0.174759,-0.216776,-0.254891,-0.475942,-0.671375,-0.660939,-0.590132,-0.914541,-0.793491,-0.504526,-0.756979,-0.692169
CKA,-0.007603,0.007734,-0.005532,-0.174493,-0.244961,-0.262611,-0.107193,-0.159039,-0.155703,-0.409944,-0.613291,-0.595409,-0.406779,-0.639896,-0.561853,-0.570078,-0.785473,-0.773238
ConcentricityDifference,-0.037214,-0.08921,-0.060974,0.093556,0.07817,0.141156,0.00747,0.048733,0.012054,0.048652,0.064524,0.071572,0.45303,0.59349,0.647121,0.473088,0.67006,0.673326
DistanceCorrelation,-0.052733,-0.004947,-0.06558,-0.194872,-0.256748,-0.291142,0.022768,-0.051486,0.034173,-0.521249,-0.74373,-0.729528,-0.553247,-0.929313,-0.722766,-0.677458,-0.855416,-0.845032
EigenspaceOverlapScore,0.030971,0.057493,0.041775,-0.011237,0.020557,-0.016646,-0.280057,-0.456417,-0.430112,0.20388,0.111038,0.298193,-0.593611,-0.915811,-0.776732,-0.617703,-0.819038,-0.793591
Gulp,-0.026957,-0.05936,-0.04552,0.251996,0.356353,0.36235,0.053541,0.15721,0.077798,-0.010747,0.020992,-0.013569,0.593656,0.916107,0.777057,0.620245,0.820363,0.795847
HardCorrelationMatch,-0.183752,-0.197044,-0.269195,-0.334181,-0.406197,-0.472265,-0.004304,-0.032861,-0.004773,-0.516165,-0.698386,-0.724729,-0.574165,-0.906239,-0.744398,-0.718172,-0.873563,-0.885004
JaccardSimilarity,-0.145534,-0.081065,-0.221831,-0.238261,-0.293316,-0.350141,-0.272921,-0.376476,-0.417438,-0.164504,-0.103163,-0.266037,-0.536701,-0.84206,-0.711371,-0.615385,-0.744901,-0.794102
LinearRegression,0.006494,0.026687,0.010612,-0.145586,-0.182693,-0.217637,-0.011408,-0.090679,-0.011654,0.01389,-0.038739,0.02185,-0.533701,-0.863957,-0.716297,-0.599421,-0.816182,-0.781338
MagnitudeDifference,-0.051663,-0.092329,-0.076602,-0.1101,-0.166321,-0.164365,0.009165,-0.005925,0.014309,0.310858,0.406163,0.456052,0.182974,0.260688,0.26755,0.312508,0.506858,0.450695


In [14]:
# Output-correlation table for label_test on ogbn-arxiv.
get_output_correlation_table(experiment="label_test", dataset="ogbn-arxiv")

architecture,GAT,GAT,GAT,GAT,GAT,GAT,GCN,GCN,GCN,GCN,GCN,GCN,GraphSAGE,GraphSAGE,GraphSAGE,GraphSAGE,GraphSAGE,GraphSAGE
functional_similarity_measure,Disagreement,Disagreement,Disagreement,JSD,JSD,JSD,Disagreement,Disagreement,Disagreement,JSD,JSD,JSD,Disagreement,Disagreement,Disagreement,JSD,JSD,JSD
quality_measure,kendalltau,pearsonr,spearmanr,kendalltau,pearsonr,spearmanr,kendalltau,pearsonr,spearmanr,kendalltau,pearsonr,spearmanr,kendalltau,pearsonr,spearmanr,kendalltau,pearsonr,spearmanr
similarity_measure,Unnamed: 1_level_3,Unnamed: 2_level_3,Unnamed: 3_level_3,Unnamed: 4_level_3,Unnamed: 5_level_3,Unnamed: 6_level_3,Unnamed: 7_level_3,Unnamed: 8_level_3,Unnamed: 9_level_3,Unnamed: 10_level_3,Unnamed: 11_level_3,Unnamed: 12_level_3,Unnamed: 13_level_3,Unnamed: 14_level_3,Unnamed: 15_level_3,Unnamed: 16_level_3,Unnamed: 17_level_3,Unnamed: 18_level_3
AlignedCosineSimilarity,-0.650813,-0.834448,-0.862018,-0.560401,-0.766566,-0.736649,-0.753501,-0.880757,-0.927873,-0.412219,-0.585844,-0.559938,-0.712526,-0.921798,-0.906427,-0.276878,-0.494089,-0.391566
CKA,-0.564533,-0.73785,-0.774701,-0.721828,-0.881106,-0.902226,-0.447358,-0.525307,-0.628396,-0.764236,-0.920409,-0.941568,-0.534372,-0.723384,-0.745787,-0.623278,-0.824721,-0.827975
ConcentricityDifference,0.073137,-0.025403,0.105955,0.461984,0.678243,0.639569,0.02233,-0.073952,0.028141,0.343902,0.32108,0.534598,0.046871,-0.023777,0.065604,0.48058,0.528894,0.692705
DistanceCorrelation,-0.648444,-0.844284,-0.858611,-0.629387,-0.80351,-0.822918,-0.537571,-0.64899,-0.732817,-0.669208,-0.853633,-0.886629,-0.624052,-0.802178,-0.841245,-0.535964,-0.757683,-0.738618
EigenspaceOverlapScore,-0.6847,-0.88354,-0.890176,-0.323969,-0.506115,-0.474025,-0.600184,-0.73999,-0.836244,-0.102876,-0.235597,-0.146856,-0.747612,-0.847237,-0.922562,-0.116789,-0.295089,-0.18326
Gulp,0.683359,0.881338,0.888764,0.391394,0.553236,0.542778,0.515911,0.122537,0.727048,0.133512,0.041163,0.181463,0.757254,0.848638,0.927237,0.130301,0.302382,0.203274
HardCorrelationMatch,-0.687471,-0.910824,-0.891366,-0.505507,-0.644775,-0.669688,-0.757744,-0.829691,-0.930964,-0.446778,-0.661899,-0.621862,-0.768101,-0.873212,-0.938249,-0.368963,-0.60368,-0.525924
JaccardSimilarity,-0.692925,-0.836132,-0.895709,-0.470903,-0.633999,-0.675379,-0.753054,-0.834614,-0.928918,-0.402185,-0.580846,-0.589277,-0.760379,-0.916531,-0.926862,-0.185686,-0.338541,-0.26603
LinearRegression,-0.635418,-0.852553,-0.856289,-0.277126,-0.408234,-0.42512,-0.536497,-0.721674,-0.745902,-0.092932,-0.178525,-0.126143,-0.740721,-0.867739,-0.918763,-0.152192,-0.290474,-0.229648
MagnitudeDifference,0.007555,-0.084838,0.009174,0.025909,-0.087285,0.035644,-0.082576,-0.14941,-0.120976,0.05369,0.011906,0.087,0.254308,0.475428,0.394629,0.106622,0.1348,0.163667


In [15]:
# Output-correlation table for shortcut_test on cora.
get_output_correlation_table(experiment="shortcut_test", dataset="cora")

architecture,GAT,GAT,GAT,GAT,GAT,GAT,GCN,GCN,GCN,GCN,GCN,GCN,GraphSAGE,GraphSAGE,GraphSAGE,GraphSAGE,GraphSAGE,GraphSAGE
functional_similarity_measure,Disagreement,Disagreement,Disagreement,JSD,JSD,JSD,Disagreement,Disagreement,Disagreement,JSD,JSD,JSD,Disagreement,Disagreement,Disagreement,JSD,JSD,JSD
quality_measure,kendalltau,pearsonr,spearmanr,kendalltau,pearsonr,spearmanr,kendalltau,pearsonr,spearmanr,kendalltau,pearsonr,spearmanr,kendalltau,pearsonr,spearmanr,kendalltau,pearsonr,spearmanr
similarity_measure,Unnamed: 1_level_3,Unnamed: 2_level_3,Unnamed: 3_level_3,Unnamed: 4_level_3,Unnamed: 5_level_3,Unnamed: 6_level_3,Unnamed: 7_level_3,Unnamed: 8_level_3,Unnamed: 9_level_3,Unnamed: 10_level_3,Unnamed: 11_level_3,Unnamed: 12_level_3,Unnamed: 13_level_3,Unnamed: 14_level_3,Unnamed: 15_level_3,Unnamed: 16_level_3,Unnamed: 17_level_3,Unnamed: 18_level_3
AlignedCosineSimilarity,0.084346,0.142265,0.113742,0.035452,0.04724,0.039324,-0.241805,-0.350989,-0.348876,-0.249008,-0.346518,-0.356693,0.092716,0.140225,0.142874,0.015028,0.031096,0.028863
CKA,-0.061072,-0.087849,-0.088566,-0.097748,-0.170038,-0.140643,-0.335741,-0.497786,-0.476726,-0.355897,-0.506638,-0.504341,-0.231388,-0.35258,-0.343904,-0.29262,-0.430762,-0.427375
ConcentricityDifference,-0.111916,-0.165641,-0.165593,-0.073534,-0.075348,-0.109595,0.176583,0.213249,0.266522,0.205931,0.241613,0.312791,-0.065875,-0.101735,-0.097933,-0.021093,-0.040942,-0.030195
DistanceCorrelation,-0.059953,-0.084395,-0.088791,-0.096499,-0.168136,-0.140059,-0.349135,-0.51068,-0.493765,-0.377525,-0.52802,-0.532597,-0.243804,-0.366627,-0.364798,-0.294627,-0.425513,-0.43229
EigenspaceOverlapScore,-0.029473,-0.278845,-0.05495,-0.076477,-0.280811,-0.126497,-0.086813,-0.173359,-0.133231,-0.062074,-0.148223,-0.098712,0.024697,0.027379,0.034852,-0.034916,-0.077886,-0.048109
Gulp,0.02437,0.277664,0.047559,0.074381,0.280183,0.12262,0.063072,0.132466,0.097678,0.049855,0.115011,0.08195,-0.006922,-0.01124,-0.006718,0.052174,0.094337,0.074544
HardCorrelationMatch,-0.269552,-0.391527,-0.380577,-0.317547,-0.401708,-0.448451,-0.245971,-0.303149,-0.353785,-0.255786,-0.298706,-0.371868,-0.216293,-0.326298,-0.317133,-0.280847,-0.406139,-0.406429
JaccardSimilarity,-0.08439,-0.207227,-0.127164,-0.127982,-0.234752,-0.193739,-0.305101,-0.418021,-0.43514,-0.315229,-0.411818,-0.455192,-0.098254,-0.149201,-0.151059,-0.160758,-0.264918,-0.242593
LinearRegression,-0.09787,-0.138093,-0.143012,-0.133601,-0.178021,-0.197584,-0.180475,-0.259206,-0.260681,-0.166271,-0.217019,-0.242733,-0.105501,-0.127213,-0.157488,-0.186689,-0.256215,-0.274516
MagnitudeDifference,-0.024639,-0.032036,-0.034505,0.007982,0.049213,0.008663,0.219228,0.303063,0.326785,0.271037,0.362033,0.402784,0.082399,0.116923,0.125951,0.105463,0.149789,0.156968


In [16]:
# Output-correlation table for shortcut_test on flickr.
get_output_correlation_table(experiment="shortcut_test", dataset="flickr")

architecture,GAT,GAT,GAT,GAT,GAT,GAT,GCN,GCN,GCN,GCN,GCN,GCN,GraphSAGE,GraphSAGE,GraphSAGE,GraphSAGE,GraphSAGE,GraphSAGE
functional_similarity_measure,Disagreement,Disagreement,Disagreement,JSD,JSD,JSD,Disagreement,Disagreement,Disagreement,JSD,JSD,JSD,Disagreement,Disagreement,Disagreement,JSD,JSD,JSD
quality_measure,kendalltau,pearsonr,spearmanr,kendalltau,pearsonr,spearmanr,kendalltau,pearsonr,spearmanr,kendalltau,pearsonr,spearmanr,kendalltau,pearsonr,spearmanr,kendalltau,pearsonr,spearmanr
similarity_measure,Unnamed: 1_level_3,Unnamed: 2_level_3,Unnamed: 3_level_3,Unnamed: 4_level_3,Unnamed: 5_level_3,Unnamed: 6_level_3,Unnamed: 7_level_3,Unnamed: 8_level_3,Unnamed: 9_level_3,Unnamed: 10_level_3,Unnamed: 11_level_3,Unnamed: 12_level_3,Unnamed: 13_level_3,Unnamed: 14_level_3,Unnamed: 15_level_3,Unnamed: 16_level_3,Unnamed: 17_level_3,Unnamed: 18_level_3
AlignedCosineSimilarity,-0.191678,-0.310566,-0.280539,-0.177079,-0.288528,-0.261045,-0.086544,-0.132072,-0.132732,-0.123032,-0.141067,-0.187099,-0.513029,-0.80114,-0.681401,-0.542386,-0.765174,-0.702198
CKA,0.080498,0.112315,0.118377,0.051327,0.064812,0.072535,-0.057376,-0.089652,-0.085364,-0.084994,-0.074027,-0.130309,-0.360403,-0.496312,-0.504378,-0.382787,-0.429925,-0.524492
ConcentricityDifference,-0.007983,-0.063764,-0.02328,0.018239,-0.005721,0.02127,0.005196,-0.009772,0.008768,0.012263,-0.031034,0.020808,0.717572,0.928839,0.894009,0.72495,0.954498,0.900782
DistanceCorrelation,0.028364,0.087908,0.042061,-0.007581,0.026023,-0.016858,-0.088283,-0.155947,-0.138578,-0.085084,-0.09823,-0.133558,-0.344525,-0.562446,-0.483358,-0.367447,-0.512464,-0.503502
EigenspaceOverlapScore,-0.049191,-0.121116,-0.071692,-0.03175,-0.104547,-0.046357,-0.045022,-0.074239,-0.070266,-0.086778,-0.106176,-0.132185,-0.413389,-0.481281,-0.556337,-0.433846,-0.424546,-0.574597
Gulp,0.316238,0.475386,0.48307,0.335072,0.503631,0.506488,0.03026,0.026846,0.043074,0.012174,-0.014188,0.017807,-0.060814,0.223891,-0.195507,-0.040089,0.112763,-0.17781
HardCorrelationMatch,-0.316416,-0.520786,-0.483867,-0.354337,-0.573153,-0.527278,-0.095642,-0.147096,-0.148683,-0.121382,-0.159825,-0.193319,-0.47494,-0.742214,-0.654679,-0.499844,-0.679264,-0.673611
JaccardSimilarity,-0.454489,-0.711051,-0.658291,-0.446555,-0.706316,-0.653904,-0.070845,-0.12904,-0.10895,-0.099844,-0.181103,-0.15698,-0.273564,-0.445484,-0.378247,-0.297614,-0.319966,-0.398857
LinearRegression,-0.008879,0.014951,-0.009993,-0.027313,-0.011334,-0.039584,-0.003231,0.099121,-0.005681,0.028304,0.1419,0.041821,-0.15944,-0.265828,-0.22553,-0.182712,-0.181173,-0.250872
MagnitudeDifference,-0.044998,-0.107515,-0.070391,-0.030591,-0.053344,-0.050638,0.049527,0.074236,0.070813,0.066667,0.087092,0.096026,0.637066,0.873031,0.841242,0.628629,0.925754,0.832511


In [17]:
# Shortcut test on ogbn-arxiv. The displayed table has one row per similarity measure and one
# column per (architecture, functional similarity measure, correlation statistic) triple.
get_output_correlation_table("shortcut_test", "ogbn-arxiv")

architecture,GAT,GAT,GAT,GAT,GAT,GAT,GCN,GCN,GCN,GCN,GCN,GCN,GraphSAGE,GraphSAGE,GraphSAGE,GraphSAGE,GraphSAGE,GraphSAGE
functional_similarity_measure,Disagreement,Disagreement,Disagreement,JSD,JSD,JSD,Disagreement,Disagreement,Disagreement,JSD,JSD,JSD,Disagreement,Disagreement,Disagreement,JSD,JSD,JSD
quality_measure,kendalltau,pearsonr,spearmanr,kendalltau,pearsonr,spearmanr,kendalltau,pearsonr,spearmanr,kendalltau,pearsonr,spearmanr,kendalltau,pearsonr,spearmanr,kendalltau,pearsonr,spearmanr
similarity_measure,Unnamed: 1_level_3,Unnamed: 2_level_3,Unnamed: 3_level_3,Unnamed: 4_level_3,Unnamed: 5_level_3,Unnamed: 6_level_3,Unnamed: 7_level_3,Unnamed: 8_level_3,Unnamed: 9_level_3,Unnamed: 10_level_3,Unnamed: 11_level_3,Unnamed: 12_level_3,Unnamed: 13_level_3,Unnamed: 14_level_3,Unnamed: 15_level_3,Unnamed: 16_level_3,Unnamed: 17_level_3,Unnamed: 18_level_3
AlignedCosineSimilarity,-0.494406,-0.705029,-0.687399,-0.606867,-0.829893,-0.804341,-0.478893,-0.70505,-0.668754,-0.523032,-0.784156,-0.705931,-0.485821,-0.594536,-0.654684,-0.454582,-0.605572,-0.625864
CKA,-0.491417,-0.68437,-0.688332,-0.602051,-0.821893,-0.802772,-0.604834,-0.815317,-0.80293,-0.657258,-0.903695,-0.840611,-0.367393,-0.214818,-0.459029,-0.339041,-0.217113,-0.427015
ConcentricityDifference,0.102192,0.106593,0.165442,0.161962,0.134704,0.253512,0.363123,0.546285,0.53986,0.408339,0.604903,0.598688,0.81385,0.9553,0.955258,0.781182,0.953046,0.9401
DistanceCorrelation,-0.46438,-0.655172,-0.655421,-0.565307,-0.792375,-0.765802,-0.608091,-0.81421,-0.805405,-0.657659,-0.905582,-0.841552,-0.356554,-0.272685,-0.453674,-0.327001,-0.277578,-0.42035
EigenspaceOverlapScore,-0.489677,-0.713961,-0.677148,-0.605619,-0.830569,-0.795505,-0.498344,-0.580287,-0.695839,-0.547871,-0.665981,-0.74379,-0.708849,-0.886309,-0.887684,-0.682542,-0.892117,-0.864802
Gulp,0.488205,0.713027,0.675828,0.602809,0.829105,0.79298,0.436109,0.530252,0.621216,0.482319,0.608299,0.662838,0.463831,0.409743,0.624452,0.438796,0.403046,0.593152
HardCorrelationMatch,-0.523406,-0.746359,-0.716494,-0.618149,-0.853872,-0.808571,-0.365666,-0.429009,-0.532186,-0.409944,-0.50435,-0.572619,-0.466596,-0.442217,-0.599404,-0.434337,-0.446342,-0.566279
JaccardSimilarity,-0.497574,-0.703004,-0.683402,-0.601873,-0.824198,-0.78558,-0.602157,-0.821936,-0.803491,-0.64981,-0.883104,-0.837334,-0.445275,-0.366385,-0.611193,-0.41204,-0.362234,-0.579861
LinearRegression,-0.426012,-0.553682,-0.60308,-0.509229,-0.645272,-0.703691,-0.4279,-0.599427,-0.607009,-0.45242,-0.670941,-0.629959,-0.100613,0.005919,-0.143357,-0.073896,-0.005419,-0.104285
MagnitudeDifference,0.245229,0.31046,0.375611,0.32223,0.386105,0.488033,0.203321,0.295021,0.306208,0.198261,0.270803,0.298448,0.207037,0.007953,0.310186,0.193712,-0.002602,0.287822


In [18]:
# Augmentation test on cora. The displayed table has one row per similarity measure and one
# column per (architecture, functional similarity measure, correlation statistic) triple.
get_output_correlation_table("augmentation_test", "cora")

architecture,GAT,GAT,GAT,GAT,GAT,GAT,GCN,GCN,GCN,GCN,GCN,GCN,GraphSAGE,GraphSAGE,GraphSAGE,GraphSAGE,GraphSAGE,GraphSAGE
functional_similarity_measure,Disagreement,Disagreement,Disagreement,JSD,JSD,JSD,Disagreement,Disagreement,Disagreement,JSD,JSD,JSD,Disagreement,Disagreement,Disagreement,JSD,JSD,JSD
quality_measure,kendalltau,pearsonr,spearmanr,kendalltau,pearsonr,spearmanr,kendalltau,pearsonr,spearmanr,kendalltau,pearsonr,spearmanr,kendalltau,pearsonr,spearmanr,kendalltau,pearsonr,spearmanr
similarity_measure,Unnamed: 1_level_3,Unnamed: 2_level_3,Unnamed: 3_level_3,Unnamed: 4_level_3,Unnamed: 5_level_3,Unnamed: 6_level_3,Unnamed: 7_level_3,Unnamed: 8_level_3,Unnamed: 9_level_3,Unnamed: 10_level_3,Unnamed: 11_level_3,Unnamed: 12_level_3,Unnamed: 13_level_3,Unnamed: 14_level_3,Unnamed: 15_level_3,Unnamed: 16_level_3,Unnamed: 17_level_3,Unnamed: 18_level_3
AlignedCosineSimilarity,0.204598,0.234288,0.250005,-0.022222,-0.085014,0.042424,-0.26968,-0.444145,-0.328269,-0.288889,-0.401172,-0.369697,0.179787,0.407533,0.25532,-0.377778,-0.261401,-0.563636
CKA,0.159132,0.156891,0.152442,-0.333333,-0.4505,-0.454545,-0.179787,-0.432928,-0.267478,-0.244444,-0.544134,-0.393939,0.089893,0.173408,0.151976,-0.466667,-0.42031,-0.612121
ConcentricityDifference,-0.295531,-0.459046,-0.475619,-0.066667,-0.028583,-0.090909,0.0,0.038238,0.012158,-0.111111,-0.024804,-0.163636,0.044947,-0.030425,0.079028,-0.155556,-0.236169,-0.309091
DistanceCorrelation,0.159132,0.11588,0.152442,-0.333333,-0.476871,-0.454545,-0.224733,-0.517919,-0.291795,-0.333333,-0.596473,-0.418182,-0.044947,0.0316,-0.006079,-0.511111,-0.559428,-0.648485
EigenspaceOverlapScore,0.068199,0.01087,0.067074,-0.244444,-0.528755,-0.284848,0.179787,0.103494,0.218846,0.288889,0.322481,0.393939,-0.224733,-0.234075,-0.376901,-0.688889,-0.796131,-0.781818
Gulp,-0.113666,-0.003025,-0.07927,0.288889,0.60044,0.381818,-0.179787,-0.050501,-0.224925,-0.288889,-0.262299,-0.418182,0.314627,0.286335,0.504562,0.777778,0.85935,0.866667
HardCorrelationMatch,-0.204598,-0.398758,-0.310981,-0.288889,-0.38243,-0.357576,-0.179787,-0.524525,-0.346506,-0.244444,-0.524963,-0.357576,-0.13484,-0.152698,-0.164134,-0.422222,-0.577564,-0.612121
JaccardSimilarity,-0.113666,-0.125135,-0.140247,0.155556,0.010643,0.2,-0.6742,-0.784963,-0.741645,-0.6,-0.728129,-0.781818,0.044947,-0.05827,-0.012158,-0.6,-0.654824,-0.745455
LinearRegression,0.298712,0.270406,0.362964,0.216295,0.238555,0.307927,-0.240613,-0.375924,-0.31492,-0.22711,-0.349925,-0.307927,-0.142181,-0.232277,-0.210452,-0.551553,-0.667256,-0.697363
MagnitudeDifference,-0.340997,-0.415221,-0.451228,-0.288889,-0.193101,-0.369697,-0.044947,-0.055668,-0.036474,-0.155556,-0.141509,-0.236364,0.0,-0.130573,0.006079,-0.288889,-0.372199,-0.345455


In [19]:
# Augmentation test on flickr. The displayed table has one row per similarity measure and one
# column per (architecture, functional similarity measure, correlation statistic) triple.
get_output_correlation_table("augmentation_test", "flickr")

architecture,GAT,GAT,GAT,GAT,GAT,GAT,GCN,GCN,GCN,GCN,GCN,GCN,GraphSAGE,GraphSAGE,GraphSAGE,GraphSAGE,GraphSAGE,GraphSAGE
functional_similarity_measure,Disagreement,Disagreement,Disagreement,JSD,JSD,JSD,Disagreement,Disagreement,Disagreement,JSD,JSD,JSD,Disagreement,Disagreement,Disagreement,JSD,JSD,JSD
quality_measure,kendalltau,pearsonr,spearmanr,kendalltau,pearsonr,spearmanr,kendalltau,pearsonr,spearmanr,kendalltau,pearsonr,spearmanr,kendalltau,pearsonr,spearmanr,kendalltau,pearsonr,spearmanr
similarity_measure,Unnamed: 1_level_3,Unnamed: 2_level_3,Unnamed: 3_level_3,Unnamed: 4_level_3,Unnamed: 5_level_3,Unnamed: 6_level_3,Unnamed: 7_level_3,Unnamed: 8_level_3,Unnamed: 9_level_3,Unnamed: 10_level_3,Unnamed: 11_level_3,Unnamed: 12_level_3,Unnamed: 13_level_3,Unnamed: 14_level_3,Unnamed: 15_level_3,Unnamed: 16_level_3,Unnamed: 17_level_3,Unnamed: 18_level_3
AlignedCosineSimilarity,-0.271691,-0.377773,-0.40112,-0.410479,-0.574452,-0.582532,-0.246544,-0.168841,-0.369278,-0.276566,-0.175408,-0.396806,-0.558819,-0.774821,-0.738477,-0.64214,-0.829531,-0.838249
CKA,-0.096064,-0.208925,-0.14908,-0.162542,-0.337277,-0.238281,-0.270939,-0.348259,-0.398087,-0.394426,-0.328926,-0.55729,-0.570329,-0.773743,-0.752002,-0.830769,-0.960698,-0.963217
ConcentricityDifference,0.187892,0.240331,0.27538,0.23398,0.255272,0.338894,0.076398,0.056254,0.121207,0.054404,0.061732,0.084828,0.028754,0.050215,0.043245,-0.067826,-0.107853,-0.100758
DistanceCorrelation,-0.22696,-0.283499,-0.338588,-0.324326,-0.447187,-0.476038,-0.199447,-0.208134,-0.293297,-0.307559,-0.215063,-0.414698,-0.583669,-0.796334,-0.765426,-0.814404,-0.953151,-0.955005
EigenspaceOverlapScore,-0.237351,-0.327099,-0.359101,-0.281695,-0.397515,-0.416631,-0.241682,-0.329432,-0.357847,-0.470502,-0.386312,-0.663211,-0.512687,-0.64903,-0.691481,-0.788004,-0.818767,-0.941336
Gulp,0.307771,0.387008,0.430528,0.478172,0.642937,0.648993,-0.012086,-0.056925,-0.019846,-0.048473,-0.108029,-0.070109,0.513758,0.649946,0.692457,0.789253,0.818863,0.941594
HardCorrelationMatch,-0.335734,-0.448182,-0.487163,-0.465596,-0.627715,-0.637693,-0.342967,-0.438603,-0.497091,-0.476031,-0.438001,-0.644055,-0.557168,-0.752962,-0.736323,-0.815117,-0.935311,-0.953469
JaccardSimilarity,-0.360129,-0.394317,-0.487002,-0.476433,-0.598656,-0.641084,-0.300107,-0.371427,-0.450981,-0.422074,-0.375958,-0.589366,-0.589781,-0.752075,-0.768382,-0.753668,-0.879063,-0.918161
LinearRegression,-0.094842,-0.097058,-0.143719,-0.18215,-0.23698,-0.260674,0.034424,-0.025315,0.05537,0.02963,-0.033827,0.058414,-0.461965,-0.658084,-0.639218,-0.724155,-0.887786,-0.903254
MagnitudeDifference,0.13201,0.160847,0.196387,0.109298,0.130463,0.170528,0.057756,-0.031929,0.086353,-0.026934,-0.080743,-0.043596,0.07377,0.119153,0.106635,0.079599,0.118734,0.114531


### Critical Difference (CD) Plots

In [16]:
# autorank package needed for creation of CD plots 
from autorank import autorank, plot_stats, create_report, latex_table
from autorank._util import *
from matplotlib import pyplot as plt

In [17]:
def get_figsize(columnwidth, wf=0.5, hf=(5. ** 0.5 - 1.0) / 2.0):
    r"""Convert a LaTeX column width (in pt) into a matplotlib figure size (in inches).

    Credit: https://stackoverflow.com/a/31527287

    The docstring is a raw string so that the LaTeX command quoted below is not
    parsed as (invalid) Python escape sequences.

    Parameters:
      - columnwidth [float]: width of the column in LaTeX, in pt. Get this from
                             LaTeX using \showthe\columnwidth
      - wf [float]:  figure width as a fraction of ``columnwidth``.
      - hf [float]:  figure height as a fraction of the resulting figure width.
                     Set by default to the golden ratio.
    Returns:  (fig_width, fig_height): tuple in inches, suitable for matplotlib's
              ``figsize`` / ``Figure.set_size_inches``.
    """
    fig_width_pt = columnwidth * wf
    inches_per_pt = 1.0 / 72.27  # Convert pt to inch (72.27 pt per inch)
    fig_width = fig_width_pt * inches_per_pt  # width in inches
    fig_height = fig_width * hf  # height in inches
    return fig_width, fig_height

# Reference width, in pt, that all plot sizes are derived from.
PLOTS_BASE_WIDTH = 433.62  # pt
# CD plots use 1.5x the reference width and the default (golden ratio) height fraction.
PLOTS_CD_WIDTH, PLOTS_CD_HEIGHT = get_figsize(PLOTS_BASE_WIDTH, wf=1.5)

In [18]:
def get_autorank_df(experiments=EXPERIMENTS, datasets=DATASETS, architectures=ARCHITECTURES, quality_measure = "violation_rate"):
    """Assemble the score table that is handed to autorank.

    For every (experiment, dataset) pair the corresponding "full" results CSV is
    read, tagged with the experiment name, and reduced to the rows matching the
    requested architectures and quality measure. All rows are then stacked and
    pivoted (mean over duplicates).

    Returns a DataFrame with one row per (experiment, representation_dataset,
    architecture) combination and one column per similarity measure.
    """
    keep_cols = ["similarity_measure", "quality_measure", "value", "architecture", "representation_dataset", "experiment"]
    frames = []
    for experiment in experiments:
        comparison_type = COMPARISON_TYPE_DICT[experiment]
        for dataset in datasets:
            file_name = FULL_DF_FILE_NAME(experiment, comparison_type, dataset)
            raw = pd.read_csv(os.path.join(EXPERIMENT_RESULTS_PATH, file_name))
            raw["experiment"] = experiment
            subset = raw[keep_cols]
            # Keep only the requested architectures and the single quality measure.
            wanted = subset["architecture"].isin(architectures) & (subset["quality_measure"] == quality_measure)
            frames.append(subset.loc[wanted])

    stacked = pd.concat(frames, axis=0)
    per_measure = stacked.pivot_table(
        index="similarity_measure",
        columns=["experiment", "representation_dataset", "architecture"],
        values="value",
        aggfunc="mean",
    )
    # Flip so that similarity measures become the columns.
    return per_measure.T

In [19]:
# Build the score table with default arguments: violation rates, one row per
# (experiment, dataset, architecture), one column per similarity measure.
res_df = get_autorank_df()
# The scores are negated before ranking -- presumably because autorank treats larger
# values as better while a lower violation rate is better; TODO confirm.
result = autorank(-res_df, alpha=0.05, verbose=False)
# cd_diagram is not defined in the visible cells; it presumably comes from the
# star import of autorank._util (a private module) -- verify.
cd_diagram(result, False, None, PLOTS_CD_WIDTH)
# Relies on pyplot's implicit "current figure" (assumed to be the one cd_diagram
# just drew on), so the statement order here matters.
fig = plt.gcf()
fig.set_size_inches(PLOTS_CD_WIDTH, PLOTS_CD_HEIGHT)
# Relative path: the PNG is written to the kernel's current working directory.
plt.savefig(f"cd_test.png", bbox_inches="tight")
plt.close()

  if abs(sorted_ranks[i] - sorted_ranks[j]) <= critical_difference:
  plot_line([(rankpos(sorted_ranks[i]), cline),
  (rankpos(sorted_ranks[i]), chei),
  plot_line([(rankpos(sorted_ranks[i]), cline),
  (rankpos(sorted_ranks[i]), chei),
  plot_line([(rankpos(sorted_ranks[l]) - side, start),
  (rankpos(sorted_ranks[r]) + side, start)],


In [20]:
# Show the table that was passed to autorank: one row per (experiment,
# representation_dataset, architecture), one column per similarity measure.
get_autorank_df()

Unnamed: 0_level_0,Unnamed: 1_level_0,similarity_measure,AlignedCosineSimilarity,CKA,ConcentricityDifference,DistanceCorrelation,EigenspaceOverlapScore,Gulp,HardCorrelationMatch,JaccardSimilarity,LinearRegression,MagnitudeDifference,...,OrthogonalProcrustesCenteredAndNormalized,PermutationProcrustes,ProcrustesSizeAndShapeDistance,RSA,RSMNormDifference,RankSimilarity,SVCCA,SecondOrderCosineSimilarity,SoftCorrelationMatch,UniformityDifference
experiment,representation_dataset,architecture,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1,Unnamed: 22_level_1,Unnamed: 23_level_1
augmentation_test,cora,GAT,0.1632,0.1036,0.272,0.0962,0.3412,0.3356,0.32,0.0814,0.1034,0.2624,...,0.1166,0.5296,0.1658,0.1902,,0.1024,0.4796,0.0722,0.3112,0.0164
augmentation_test,cora,GCN,0.3348,0.2336,0.4934,0.203,0.276,0.3316,0.2794,0.1826,0.0962,0.4514,...,0.1994,0.3126,0.232,0.4042,,0.324,0.5056,0.1982,0.2568,0.2376
augmentation_test,cora,GraphSAGE,0.2764,0.2136,0.3558,0.2138,0.233,0.2248,0.2398,0.182,0.1488,0.3912,...,0.1936,0.2984,0.2272,0.321,,0.2342,0.4818,0.1812,0.2204,0.2352
augmentation_test,flickr,GAT,0.1934,0.2368,0.2692,0.1934,0.3024,0.1608,0.168,0.1342,0.2612,0.342,...,0.2244,0.3522,0.323,0.1602,,0.1416,0.267,0.1368,0.1688,0.34
augmentation_test,flickr,GCN,0.0486,0.072,0.342,0.0636,0.1648,0.4862,0.0724,0.0346,0.4664,0.165,...,0.0608,0.071,0.0428,0.0478,,0.0332,0.0646,0.0276,0.0744,0.0456
augmentation_test,flickr,GraphSAGE,0.1868,0.1488,0.3868,0.1694,0.3414,0.3358,0.2224,0.1526,0.2196,0.5398,...,0.2148,0.1722,0.1006,0.2182,,0.1466,0.2322,0.1196,0.286,0.4978
augmentation_test,ogbn-arxiv,GAT,0.0694,0.0804,0.2508,0.0744,0.093,0.1018,0.3892,0.0314,0.0976,0.1638,...,0.099,0.1122,0.0026,0.207,,0.031,0.2578,0.0224,0.4754,0.2452
augmentation_test,ogbn-arxiv,GCN,0.1524,0.0738,0.2992,0.0792,0.1654,0.357,0.502,0.0526,0.2646,0.1916,...,0.2428,0.162,0.0962,0.1242,,0.0502,0.2068,0.047,0.5412,0.1518
augmentation_test,ogbn-arxiv,GraphSAGE,0.5114,0.0486,0.2402,0.058,0.4192,0.415,0.4236,0.1136,0.2784,0.0006,...,0.295,0.2262,0.0446,0.3812,,0.0772,0.1688,0.0688,0.4738,0.2374
label_test,cora,GAT,0.4274,0.489,0.36,0.4788,0.4564,0.45,0.4996,0.4624,0.3986,0.3594,...,0.4812,0.4134,0.4138,0.4822,0.249,0.393,0.4292,0.2208,0.4942,0.421
