# GAE benchmark results

In [1]:
import numpy as np
%matplotlib inline
import pandas as pd
import matplotlib.pyplot as plt
import seaborn as sb

## AN2VEC

In [2]:
# Load the AN2VEC benchmark log. The file name spells out the parameter grid
# of the run: bias, sharedl1, decadjdeep, dataset, overlap, testprop, nsamples.
results = pd.read_csv('../data/behaviour/gae-benchmarks/lp-bias=[true, false]-sharedl1=[true, false]-'
                      'decadjdeep=[true, false]-dataset=[cora, citeseer, pubmed]-'
                      'overlap=[0, 8, 16]-testprop=[0.15, 0.30]-nsamples=10.csv.gz',
                      compression='gzip')
# Keep only the rows recorded at the highest epoch value present in the log.
# `Series.max()` replaces `sorted(np.unique(...))[-1]`: no redundant double sort,
# and a missing (NaN) epoch value can no longer be picked as the "last" epoch,
# which would make the equality filter below return an empty frame.
last_epoch = results['epoch'].max()
results = results[results['epoch'] == last_epoch]

In [3]:
# Aggregate the last-epoch rows per parameter combination. The grouping keys
# become the row MultiIndex levels, in this order, of both summary frames.
config_keys = ['bias', 'sharedl1', 'decadjdeep', 'dataset', 'overlap', 'blurring']
runs_by_config = results.groupby(config_keys)
averages = runs_by_config.mean()  # per-configuration mean of every remaining column
stds = runs_by_config.std()       # per-configuration standard deviation (pandas default ddof=1)

### Shared l1

In [4]:
# Mean AUC / AP for the configurations with bias=False and sharedl1=True.
# The cross-section key is a tuple: list keys for `.xs` were deprecated in
# pandas 1.4 and raise a TypeError from pandas 2.0 onwards.
(
    averages
    .xs((False, True), level=['bias', 'sharedl1'])
    [['auc', 'ap']]
    # After .xs the row levels are decadjdeep(0), dataset(1), overlap(2),
    # blurring(3); stack() appends the metric name as level 4, and
    # unstack([1, 4]) pivots dataset and metric into the columns.
    .stack()
    .unstack([1, 4])
    .reorder_levels(['blurring', 'decadjdeep', 'overlap'])
    .sort_index()
    [['cora', 'citeseer', 'pubmed']]
)

Unnamed: 0_level_0,Unnamed: 1_level_0,dataset,cora,cora,citeseer,citeseer,pubmed,pubmed
Unnamed: 0_level_1,Unnamed: 1_level_1,Unnamed: 2_level_1,auc,ap,auc,ap,auc,ap
blurring,decadjdeep,overlap,Unnamed: 3_level_2,Unnamed: 4_level_2,Unnamed: 5_level_2,Unnamed: 6_level_2,Unnamed: 7_level_2,Unnamed: 8_level_2
0.15,False,0,0.928669,0.932253,0.940158,0.94551,0.950613,0.953707
0.15,False,8,0.930294,0.935635,0.944549,0.948189,0.946433,0.948626
0.15,False,16,0.932945,0.936042,0.94822,0.951456,0.930713,0.930576
0.15,True,0,0.883429,0.894645,0.908322,0.913254,0.917656,0.931821
0.15,True,8,0.887484,0.896085,0.902848,0.909423,0.918967,0.930725
0.15,True,16,0.892824,0.903344,0.904231,0.911761,0.920825,0.927513
0.3,False,0,0.916112,0.92412,0.934943,0.938995,0.948759,0.950269
0.3,False,8,0.918903,0.926251,0.935658,0.939858,0.941399,0.943468
0.3,False,16,0.921719,0.92889,0.943262,0.948098,0.924663,0.92399
0.3,True,0,0.868274,0.880303,0.892681,0.90044,0.910215,0.924337


In [5]:
# Standard deviation of AUC / AP for the configurations with bias=False and
# sharedl1=True. The cross-section key is a tuple: list keys for `.xs` were
# deprecated in pandas 1.4 and raise a TypeError from pandas 2.0 onwards.
(
    stds
    .xs((False, True), level=['bias', 'sharedl1'])
    [['auc', 'ap']]
    # After .xs the row levels are decadjdeep(0), dataset(1), overlap(2),
    # blurring(3); stack() appends the metric name as level 4, and
    # unstack([1, 4]) pivots dataset and metric into the columns.
    .stack()
    .unstack([1, 4])
    .reorder_levels(['blurring', 'decadjdeep', 'overlap'])
    .sort_index()
    [['cora', 'citeseer', 'pubmed']]
)

Unnamed: 0_level_0,Unnamed: 1_level_0,dataset,cora,cora,citeseer,citeseer,pubmed,pubmed
Unnamed: 0_level_1,Unnamed: 1_level_1,Unnamed: 2_level_1,auc,ap,auc,ap,auc,ap
blurring,decadjdeep,overlap,Unnamed: 3_level_2,Unnamed: 4_level_2,Unnamed: 5_level_2,Unnamed: 6_level_2,Unnamed: 7_level_2,Unnamed: 8_level_2
0.15,False,0,0.004995,0.007034,0.005996,0.005695,0.006221,0.005054
0.15,False,8,0.003856,0.005355,0.007048,0.007055,0.005213,0.004407
0.15,False,16,0.007901,0.007053,0.004446,0.004953,0.006167,0.005951
0.15,True,0,0.008031,0.008416,0.014037,0.015891,0.006894,0.00581
0.15,True,8,0.016852,0.01873,0.013327,0.012892,0.004525,0.004613
0.15,True,16,0.008851,0.010439,0.013957,0.012869,0.00961,0.009229
0.3,False,0,0.007145,0.006813,0.003441,0.003182,0.003814,0.003474
0.3,False,8,0.003457,0.003879,0.006418,0.007233,0.00961,0.009046
0.3,False,16,0.006675,0.006816,0.006928,0.007518,0.006093,0.007091
0.3,True,0,0.012494,0.011262,0.012345,0.01142,0.003784,0.003233


### Unshared l1

In [6]:
# Mean AUC / AP for the configurations with bias=False and sharedl1=False.
# The cross-section key is a tuple: list keys for `.xs` were deprecated in
# pandas 1.4 and raise a TypeError from pandas 2.0 onwards.
(
    averages
    .xs((False, False), level=['bias', 'sharedl1'])
    [['auc', 'ap']]
    # After .xs the row levels are decadjdeep(0), dataset(1), overlap(2),
    # blurring(3); stack() appends the metric name as level 4, and
    # unstack([1, 4]) pivots dataset and metric into the columns.
    .stack()
    .unstack([1, 4])
    .reorder_levels(['blurring', 'decadjdeep', 'overlap'])
    .sort_index()
    [['cora', 'citeseer', 'pubmed']]
)

Unnamed: 0_level_0,Unnamed: 1_level_0,dataset,cora,cora,citeseer,citeseer,pubmed,pubmed
Unnamed: 0_level_1,Unnamed: 1_level_1,Unnamed: 2_level_1,auc,ap,auc,ap,auc,ap
blurring,decadjdeep,overlap,Unnamed: 3_level_2,Unnamed: 4_level_2,Unnamed: 5_level_2,Unnamed: 6_level_2,Unnamed: 7_level_2,Unnamed: 8_level_2
0.15,False,0,0.916601,0.923915,0.919691,0.927372,0.96568,0.969072
0.15,False,8,0.92887,0.935104,0.943409,0.947078,0.957962,0.959257
0.15,False,16,0.932651,0.938988,0.951359,0.954687,0.935675,0.937016
0.15,True,0,0.880535,0.891037,0.883291,0.891384,0.911545,0.928493
0.15,True,8,0.885794,0.895053,0.909604,0.916489,0.924394,0.936358
0.15,True,16,0.889915,0.900254,0.904428,0.908407,0.927221,0.934089
0.3,False,0,0.908178,0.917985,0.913309,0.921215,0.960803,0.964172
0.3,False,8,0.919074,0.928667,0.937642,0.94444,0.951806,0.953308
0.3,False,16,0.925996,0.934058,0.94839,0.953407,0.93146,0.930151
0.3,True,0,0.852377,0.863708,0.887003,0.895765,0.90238,0.919668


In [7]:
# Standard deviation of AUC / AP for the configurations with bias=False and
# sharedl1=False. The cross-section key is a tuple: list keys for `.xs` were
# deprecated in pandas 1.4 and raise a TypeError from pandas 2.0 onwards.
(
    stds
    .xs((False, False), level=['bias', 'sharedl1'])
    [['auc', 'ap']]
    # After .xs the row levels are decadjdeep(0), dataset(1), overlap(2),
    # blurring(3); stack() appends the metric name as level 4, and
    # unstack([1, 4]) pivots dataset and metric into the columns.
    .stack()
    .unstack([1, 4])
    .reorder_levels(['blurring', 'decadjdeep', 'overlap'])
    .sort_index()
    [['cora', 'citeseer', 'pubmed']]
)

Unnamed: 0_level_0,Unnamed: 1_level_0,dataset,cora,cora,citeseer,citeseer,pubmed,pubmed
Unnamed: 0_level_1,Unnamed: 1_level_1,Unnamed: 2_level_1,auc,ap,auc,ap,auc,ap
blurring,decadjdeep,overlap,Unnamed: 3_level_2,Unnamed: 4_level_2,Unnamed: 5_level_2,Unnamed: 6_level_2,Unnamed: 7_level_2,Unnamed: 8_level_2
0.15,False,0,0.007002,0.006596,0.006838,0.007313,0.002308,0.00226
0.15,False,8,0.005474,0.006348,0.005143,0.006403,0.003672,0.003106
0.15,False,16,0.007582,0.006859,0.00559,0.005295,0.006327,0.007203
0.15,True,0,0.01175,0.012127,0.012768,0.012948,0.006618,0.005229
0.15,True,8,0.015177,0.015717,0.01037,0.009894,0.002993,0.002054
0.15,True,16,0.013341,0.012045,0.017095,0.020589,0.005223,0.005234
0.3,False,0,0.007715,0.007088,0.008522,0.006905,0.001426,0.001344
0.3,False,8,0.003609,0.004005,0.006929,0.006274,0.003647,0.003475
0.3,False,16,0.003889,0.004303,0.004287,0.003986,0.006295,0.006671
0.3,True,0,0.007811,0.00946,0.014551,0.014217,0.006107,0.004534


## VGAE

In [8]:
# Load the VGAE benchmark log. The file name spells out the parameter grid
# of the run: dataset, testprop, nsamples.
results_vgae = pd.read_csv('../data/behaviour/gae-benchmarks/lp-vgae-'
                           'dataset=[cora, citeseer, pubmed]-testprop=[0.15, 0.30]-nsamples=10.csv.gz',
                           compression='gzip')
# Keep only the rows recorded at the highest epoch value present in the log.
# `Series.max()` replaces `sorted(np.unique(...))[-1]`: no redundant double sort,
# and a missing (NaN) epoch value can no longer be picked as the "last" epoch,
# which would make the equality filter below return an empty frame.
# NOTE: this rebinds `last_epoch`, which now refers to the VGAE log.
last_epoch = results_vgae['epoch'].max()
results_vgae = results_vgae[results_vgae['epoch'] == last_epoch]

In [9]:
# Aggregate the last-epoch VGAE rows per (dataset, blurring) pair; those two
# keys become the row MultiIndex levels, in this order, of both summary frames.
vgae_keys = ['dataset', 'blurring']
vgae_runs = results_vgae.groupby(vgae_keys)
averages_vgae = vgae_runs.mean()  # per-group mean of every remaining column
stds_vgae = vgae_runs.std()       # per-group standard deviation (pandas default ddof=1)

In [10]:
# Mean AUC / AP of VGAE, one row per blurring value and one column pair per dataset.
(
    averages_vgae[['auc', 'ap']]
    # Row levels are dataset(0), blurring(1); stack() appends the metric name
    # as level 2, and unstack([0, 2]) pivots dataset and metric into the columns.
    .stack()
    .unstack([0, 2])
    [['cora', 'citeseer', 'pubmed']]
)

dataset,cora,cora,citeseer,citeseer,pubmed,pubmed
Unnamed: 0_level_1,auc,ap,auc,ap,auc,ap
blurring,Unnamed: 1_level_2,Unnamed: 2_level_2,Unnamed: 3_level_2,Unnamed: 4_level_2,Unnamed: 5_level_2,Unnamed: 6_level_2
0.15,0.922591,0.928798,0.921745,0.930244,0.965447,0.968721
0.3,0.902977,0.913436,0.911954,0.919151,0.961535,0.96456


In [11]:
# Standard deviation of AUC / AP of VGAE, one row per blurring value and one
# column pair per dataset.
(
    stds_vgae[['auc', 'ap']]
    # Row levels are dataset(0), blurring(1); stack() appends the metric name
    # as level 2, and unstack([0, 2]) pivots dataset and metric into the columns.
    .stack()
    .unstack([0, 2])
    [['cora', 'citeseer', 'pubmed']]
)

dataset,cora,cora,citeseer,citeseer,pubmed,pubmed
Unnamed: 0_level_1,auc,ap,auc,ap,auc,ap
blurring,Unnamed: 1_level_2,Unnamed: 2_level_2,Unnamed: 3_level_2,Unnamed: 4_level_2,Unnamed: 5_level_2,Unnamed: 6_level_2
0.15,0.00555,0.005833,0.006499,0.006631,0.001501,0.001229
0.3,0.004795,0.004589,0.005465,0.005182,0.001503,0.001434
