In [1]:
# Domain distance arrays
tvo = [0.1739, 0.2027, 0.1629, 0.1884, 0.3129 ]
kld = [2.3341, 2.1348, 1.9357, 1.9758, 2.2342]
jsd = [0.3896, 0.3692, 0.3412, 0.3832, 0.4403]
rd = [2.3125, 2.1151, 1.9176, 1.9633, 2.2239]

# Model scores (unsupervised setting)
zs = [20.13, 15.74, 25.71, 23.27, 62.95]
la = [18.30, 21.69, 28.02, 27.76, 70.31]
pl = [22.60, 8.28, 31.52, 18.17, 55.06]
pt = [20.70, 19.11, 27.30, 16.57, 61.19]
iw = [20.23, 17.91, 24.43, 26.62, 63.08]

# Model scores (supervised setting)
tg = [88.57, 76.50, 84.75, 87.98]
fa = [79.38, 74.78, 75.96, 88.40]
la = [85.56, 79.66, 83.31, 87.99]
iw = [82.03, 78.35, 84.88, 88.39]

In [5]:
# Compute percentage change in model scores over baseline (zero-shot or max of TG, SC->TG, SC+TG)
def perc_change(base, model):
    return [((y-x)/float(x)) * 100 for x,y in zip(base, model)]

unsup_la = perc_change(zs, la)
unsup_pl = perc_change(zs, pl)
unsup_pt = perc_change(zs, pt)
unsup_iw = perc_change(zs, iw)

sup_fa = perc_change(tg, fa)
sup_la = perc_change(tg, la)
sup_iw = perc_change(tg, iw)

In [7]:
# Unsupervised setting analysis
# Compute pearson correlation between each distance metric and model score change
from scipy.stats import pearsonr

def compute_corr(scores):
    tvo_corr, _ = pearsonr(tvo[:len(scores)], scores)
    kld_corr, _ = pearsonr(kld[:len(scores)], scores)
    jsd_corr, _ = pearsonr(jsd[:len(scores)], scores)
    rd_corr, _ = pearsonr(rd[:len(scores)], scores)
    print('Correlation with TVO: {}'.format(tvo_corr))
    print('Correlation with KLD: {}'.format(kld_corr))
    print('Correlation with JSD: {}'.format(jsd_corr))
    print('Correlation with RD: {}'.format(rd_corr))

print('Correlation for LA')
compute_corr(unsup_la)
print('Correlation for PL')
compute_corr(unsup_pl)
print('Correlation for PT')
compute_corr(unsup_pt)
print('Correlation for IW')
compute_corr(unsup_iw)

Correlation for LA
Correlation with TVO: 0.8245560726972885
Correlation with KLD: 0.5945629261773661
Correlation with JSD: 0.45797107883013555
Correlation with RD: 0.5948180067993223
Correlation for PL
Correlation with TVO: -0.3064999943236373
Correlation with KLD: -0.019848269226881123
Correlation with JSD: -0.21113577824114504
Correlation with RD: -0.025833102653059645
Correlation for PT
Correlation with TVO: -0.04917813651216771
Correlation with KLD: 0.2929358118883449
Correlation with JSD: -0.2635171629766521
Correlation with RD: 0.27632717941324153
Correlation for IW
Correlation with TVO: 0.8670277237945417
Correlation with KLD: 0.5028959416572347
Correlation with JSD: 0.3973771770844403
Correlation with RD: 0.5030773567997168


In [8]:
print('Correlation for FA')
compute_corr(sup_fa)
print('Correlation for LA')
compute_corr(sup_la)
print('Correlation for IW')
compute_corr(sup_iw)

Correlation for FA
Correlation with TVO: 0.8197696225211281
Correlation with KLD: -0.32040789157781613
Correlation with JSD: 0.3369453861865519
Correlation with RD: -0.31036985333143285
Correlation for LA
Correlation with TVO: 0.8675749071279878
Correlation with KLD: -0.21598626611566804
Correlation with JSD: -0.09638305185906468
Correlation with RD: -0.2162932856906837
Correlation for IW
Correlation with TVO: 0.4896655431369238
Correlation with KLD: -0.7459629359440898
Correlation with JSD: -0.508239680277131
Correlation with RD: -0.7470760879452625
