In [156]:
import matplotlib.pyplot as plt
from IPython.display import display, Markdown, Latex
import numpy as np
import json
import pandas as pd
from scipy import stats

with open('transfer_experiment.json', 'r') as fp:
    data = json.load(fp)

In [157]:
experiments = [
            {'id': '1', 'source':'imdb', 'target':'uwcse', 'predicate':'workedunder', 'to_predicate':'advisedby'},
            {'id': '2', 'source':'uwcse', 'target':'imdb', 'predicate':'advisedby', 'to_predicate':'workedunder'},
            {'id': '3', 'source':'imdb', 'target':'uwcse', 'predicate':'movie', 'to_predicate':'publication'},
            {'id': '4', 'source':'uwcse', 'target':'imdb', 'predicate':'publication', 'to_predicate':'movie'},
            {'id': '5', 'source':'imdb', 'target':'uwcse', 'predicate':'genre', 'to_predicate':'inphase'},
            {'id': '6', 'source':'uwcse', 'target':'imdb', 'predicate':'inphase', 'to_predicate':'genre'},
            {'id': '7', 'source':'imdb', 'target':'cora', 'predicate':'workedunder', 'to_predicate':'samevenue'},
            {'id': '8', 'source':'imdb', 'target':'cora', 'predicate':'workedunder', 'to_predicate':'samebib'},
            {'id': '9', 'source':'imdb', 'target':'cora', 'predicate':'workedunder', 'to_predicate':'sameauthor'},
            {'id': '10', 'source':'imdb', 'target':'cora', 'predicate':'workedunder', 'to_predicate':'sametitle'},
            {'id': '11', 'source':'uwcse', 'target':'cora', 'predicate':'advisedby', 'to_predicate':'samevenue'},
            {'id': '12', 'source':'uwcse', 'target':'cora', 'predicate':'advisedby', 'to_predicate':'samebib'},
            {'id': '13', 'source':'uwcse', 'target':'cora', 'predicate':'advisedby', 'to_predicate':'sameauthor'},
            {'id': '14', 'source':'uwcse', 'target':'cora', 'predicate':'advisedby', 'to_predicate':'sametitle'},
            {'id': '15', 'source':'yeast', 'target':'twitter', 'predicate':'proteinclass', 'to_predicate':'accounttype'},
            {'id': '16', 'source':'yeast', 'target':'twitter', 'predicate':'interaction', 'to_predicate':'follows'},
            {'id': '17', 'source':'yeast', 'target':'twitter', 'predicate':'location', 'to_predicate':'tweets'},
            {'id': '18', 'source':'yeast', 'target':'twitter', 'predicate':'enzyme', 'to_predicate':'tweets'},
            {'id': '19', 'source':'yeast', 'target':'twitter', 'predicate':'function', 'to_predicate':'tweets'},
            {'id': '20', 'source':'yeast', 'target':'twitter', 'predicate':'phenotype', 'to_predicate':'tweets'},
            {'id': '21', 'source':'yeast', 'target':'twitter', 'predicate':'complex', 'to_predicate':'tweets'},
            {'id': '22', 'source':'twitter', 'target':'yeast', 'predicate':'accounttype', 'to_predicate':'proteinclass'},
            {'id': '23', 'source':'twitter', 'target':'yeast', 'predicate':'follows', 'to_predicate':'interaction'},
            {'id': '24', 'source':'twitter', 'target':'yeast', 'predicate':'tweets', 'to_predicate':'location'},
            {'id': '25', 'source':'twitter', 'target':'yeast', 'predicate':'tweets', 'to_predicate':'enzyme'},
            {'id': '26', 'source':'twitter', 'target':'yeast', 'predicate':'tweets', 'to_predicate':'function'},
            {'id': '27', 'source':'twitter', 'target':'yeast', 'predicate':'tweets', 'to_predicate':'phenotype'},
            {'id': '28', 'source':'twitter', 'target':'yeast', 'predicate':'tweets', 'to_predicate':'complex'},
            ]

for metric in ['AUC ROC', 'AUC PR', 'CLL', 'Recall', 'F1', 'Precision', 'Learning and Revision time', 'Inference time']:
    display(Markdown('# Results for ' + metric))
    table = []
    for j in range(len(experiments)):
        dataset = experiments[j]['id'] + '_' + experiments[j]['source'] + '_' + experiments[j]['target']
        if dataset in data['results']: 
            #for metric in ['AUC ROC', 'AUC PR']:
                #display(Markdown('## ' + metric))
            if metric == 'Precision':
                scratch = np.array([item['scratch']['Precision'][0] for sublist in data['results'][str(dataset)] for item in sublist])
                parameter = np.array([item['transfer']['Parameter Learning results']['Precision'][0] for sublist in data['results'][str(dataset)] for item in sublist])
                transfer = np.array([item['transfer']['Precision'][0] for sublist in data['results'][str(dataset)] for item in sublist])
            elif metric == 'Learning and Revision time':
                scratch = np.array([item['scratch']['Learning time'] for sublist in data['results'][str(dataset)] for item in sublist])
                parameter = np.array([item['transfer']['Parameter Learning results']['Learning time'] for sublist in data['results'][str(dataset)] for item in sublist])
                transfer = np.array([item['transfer']['Learning time'] for sublist in data['results'][str(dataset)] for item in sublist])
            elif metric == 'Inference time':
                scratch = np.array([item['scratch']['Inference time'] for sublist in data['results'][str(dataset)] for item in sublist])
                parameter = np.array([item['transfer']['Parameter Learning results']['Learning time'] for sublist in data['results'][str(dataset)] for item in sublist])
                transfer = np.array([item['transfer']['Inference time'] for sublist in data['results'][str(dataset)] for item in sublist])
            else:
                scratch = np.array([item['scratch'][metric] for sublist in data['results'][str(dataset)] for item in sublist])
                parameter = np.array([item['transfer']['Parameter Learning results'][metric] for sublist in data['results'][str(dataset)] for item in sublist])
                transfer = np.array([item['transfer'][metric] for sublist in data['results'][str(dataset)] for item in sublist])
            table.append([dataset, '%.3f +/- %.3f' % (parameter.mean(), 2 * parameter.std()),
            '%.3f +/- %.3f' % (transfer.mean(), 2 * transfer.std()),
            '%.3f +/- %.3f' % (scratch.mean(), 2 * scratch.std())])
    display(pd.DataFrame(table, columns=['Experiment', 'Transfer Learning', 'Transfer Learning with Revision Theory', 'Learning from scratch']))

# Results for AUC ROC

Unnamed: 0,Experiment,Transfer Learning,Transfer Learning with Revision Theory,Learning from scratch
0,1_imdb_uwcse,0.956 +/- 0.007,0.948 +/- 0.023,0.934 +/- 0.072
1,2_uwcse_imdb,1.000 +/- 0.000,1.000 +/- 0.000,0.981 +/- 0.077
2,3_imdb_uwcse,0.625 +/- 0.130,0.624 +/- 0.126,0.604 +/- 0.118
3,4_uwcse_imdb,0.497 +/- 0.003,0.495 +/- 0.014,0.490 +/- 0.014
4,5_imdb_uwcse,0.500 +/- 0.000,0.499 +/- 0.014,0.501 +/- 0.025
5,6_uwcse_imdb,0.907 +/- 0.063,0.907 +/- 0.063,0.827 +/- 0.333
6,7_imdb_cora,0.525 +/- 0.089,0.613 +/- 0.248,0.678 +/- 0.291
7,8_imdb_cora,0.655 +/- 0.309,0.928 +/- 0.031,0.936 +/- 0.007
8,9_imdb_cora,0.675 +/- 0.063,0.659 +/- 0.198,0.533 +/- 0.241
9,10_imdb_cora,0.506 +/- 0.004,0.688 +/- 0.176,0.763 +/- 0.139


# Results for AUC PR

Unnamed: 0,Experiment,Transfer Learning,Transfer Learning with Revision Theory,Learning from scratch
0,1_imdb_uwcse,0.939 +/- 0.015,0.911 +/- 0.042,0.888 +/- 0.121
1,2_uwcse_imdb,1.000 +/- 0.000,1.000 +/- 0.000,0.968 +/- 0.130
2,3_imdb_uwcse,0.597 +/- 0.103,0.603 +/- 0.113,0.595 +/- 0.109
3,4_uwcse_imdb,0.497 +/- 0.009,0.494 +/- 0.005,0.493 +/- 0.008
4,5_imdb_uwcse,0.500 +/- 0.000,0.503 +/- 0.012,0.505 +/- 0.016
5,6_uwcse_imdb,0.845 +/- 0.095,0.845 +/- 0.095,0.779 +/- 0.294
6,7_imdb_cora,0.532 +/- 0.089,0.606 +/- 0.221,0.662 +/- 0.244
7,8_imdb_cora,0.760 +/- 0.284,0.955 +/- 0.032,0.965 +/- 0.013
8,9_imdb_cora,0.944 +/- 0.008,0.942 +/- 0.038,0.919 +/- 0.066
9,10_imdb_cora,0.565 +/- 0.041,0.724 +/- 0.151,0.781 +/- 0.089


# Results for CLL

Unnamed: 0,Experiment,Transfer Learning,Transfer Learning with Revision Theory,Learning from scratch
0,1_imdb_uwcse,-0.229 +/- 0.007,-0.242 +/- 0.045,-0.257 +/- 0.098
1,2_uwcse_imdb,-0.116 +/- 0.021,-0.112 +/- 0.031,-0.174 +/- 0.148
2,3_imdb_uwcse,-0.660 +/- 0.042,-0.692 +/- 0.069,-0.701 +/- 0.059
3,4_uwcse_imdb,-0.701 +/- 0.020,-0.708 +/- 0.020,-0.707 +/- 0.017
4,5_imdb_uwcse,-0.695 +/- 0.000,-0.715 +/- 0.020,-0.718 +/- 0.025
5,6_uwcse_imdb,-0.312 +/- 0.052,-0.307 +/- 0.058,-0.458 +/- 0.598
6,7_imdb_cora,-0.690 +/- 0.020,-0.640 +/- 0.193,-0.603 +/- 0.215
7,8_imdb_cora,-0.622 +/- 0.354,-0.348 +/- 0.145,-0.344 +/- 0.146
8,9_imdb_cora,-0.256 +/- 0.002,-0.310 +/- 0.170,-0.315 +/- 0.095
9,10_imdb_cora,-0.705 +/- 0.030,-0.625 +/- 0.074,-0.584 +/- 0.177


# Results for Recall

Unnamed: 0,Experiment,Transfer Learning,Transfer Learning with Revision Theory,Learning from scratch
0,1_imdb_uwcse,1.000 +/- 0.000,0.992 +/- 0.020,0.984 +/- 0.043
1,2_uwcse_imdb,1.000 +/- 0.000,1.000 +/- 0.000,1.000 +/- 0.000
2,3_imdb_uwcse,0.543 +/- 0.543,0.508 +/- 0.133,0.494 +/- 0.126
3,4_uwcse_imdb,0.039 +/- 0.102,0.298 +/- 0.432,0.285 +/- 0.394
4,5_imdb_uwcse,0.000 +/- 0.000,0.451 +/- 0.169,0.407 +/- 0.163
5,6_uwcse_imdb,1.000 +/- 0.000,1.000 +/- 0.000,0.800 +/- 0.800
6,7_imdb_cora,0.768 +/- 0.769,0.758 +/- 0.706,0.773 +/- 0.670
7,8_imdb_cora,0.727 +/- 0.556,0.894 +/- 0.082,0.899 +/- 0.078
8,9_imdb_cora,1.000 +/- 0.000,0.979 +/- 0.084,0.978 +/- 0.088
9,10_imdb_cora,0.400 +/- 0.980,0.702 +/- 0.554,0.701 +/- 0.552


# Results for F1

Unnamed: 0,Experiment,Transfer Learning,Transfer Learning with Revision Theory,Learning from scratch
0,1_imdb_uwcse,0.942 +/- 0.004,0.941 +/- 0.008,0.930 +/- 0.024
1,2_uwcse_imdb,1.000 +/- 0.000,1.000 +/- 0.000,0.949 +/- 0.084
2,3_imdb_uwcse,nan +/- nan,0.554 +/- 0.102,0.546 +/- 0.097
3,4_uwcse_imdb,nan +/- nan,nan +/- nan,nan +/- nan
4,5_imdb_uwcse,nan +/- nan,0.469 +/- 0.108,0.443 +/- 0.102
5,6_uwcse_imdb,0.915 +/- 0.054,0.915 +/- 0.054,nan +/- nan
6,7_imdb_cora,nan +/- nan,0.608 +/- 0.532,0.660 +/- 0.508
7,8_imdb_cora,0.706 +/- 0.275,0.891 +/- 0.115,0.892 +/- 0.116
8,9_imdb_cora,0.971 +/- 0.004,0.961 +/- 0.042,0.952 +/- 0.040
9,10_imdb_cora,nan +/- nan,0.656 +/- 0.240,0.690 +/- 0.329


# Results for Precision

Unnamed: 0,Experiment,Transfer Learning,Transfer Learning with Revision Theory,Learning from scratch
0,1_imdb_uwcse,0.889 +/- 0.008,0.895 +/- 0.014,0.882 +/- 0.052
1,2_uwcse_imdb,1.000 +/- 0.000,1.000 +/- 0.000,0.905 +/- 0.155
2,3_imdb_uwcse,nan +/- nan,0.618 +/- 0.114,0.618 +/- 0.111
3,4_uwcse_imdb,nan +/- nan,nan +/- nan,nan +/- nan
4,5_imdb_uwcse,nan +/- nan,0.500 +/- 0.009,0.499 +/- 0.019
5,6_uwcse_imdb,0.845 +/- 0.095,0.845 +/- 0.095,nan +/- nan
6,7_imdb_cora,nan +/- nan,0.603 +/- 0.233,0.674 +/- 0.251
7,8_imdb_cora,0.822 +/- 0.367,0.906 +/- 0.260,0.903 +/- 0.257
8,9_imdb_cora,0.944 +/- 0.008,0.944 +/- 0.008,0.930 +/- 0.035
9,10_imdb_cora,nan +/- nan,0.722 +/- 0.218,0.783 +/- 0.272


# Results for Learning and Revision time

Unnamed: 0,Experiment,Transfer Learning,Transfer Learning with Revision Theory,Learning from scratch
0,1_imdb_uwcse,3.491 +/- 2.285,8.312 +/- 6.245,5.540 +/- 4.090
1,2_uwcse_imdb,2.135 +/- 2.042,4.392 +/- 3.867,2.479 +/- 1.407
2,3_imdb_uwcse,9.211 +/- 16.222,25.251 +/- 42.025,18.635 +/- 27.361
3,4_uwcse_imdb,1.521 +/- 0.452,4.563 +/- 2.177,1.890 +/- 0.479
4,5_imdb_uwcse,4.063 +/- 3.638,15.342 +/- 9.945,10.989 +/- 7.418
5,6_uwcse_imdb,1.041 +/- 0.409,2.107 +/- 1.146,1.192 +/- 0.604
6,7_imdb_cora,67.706 +/- 102.821,197.865 +/- 259.196,162.324 +/- 123.765
7,8_imdb_cora,121.834 +/- 98.690,330.410 +/- 321.972,225.673 +/- 195.755
8,9_imdb_cora,3.910 +/- 1.723,12.307 +/- 6.040,8.387 +/- 3.911
9,10_imdb_cora,5.638 +/- 4.162,85.507 +/- 247.698,27.506 +/- 56.096


# Results for Inference time

Unnamed: 0,Experiment,Transfer Learning,Transfer Learning with Revision Theory,Learning from scratch
0,1_imdb_uwcse,3.491 +/- 2.285,0.776 +/- 0.047,0.780 +/- 0.071
1,2_uwcse_imdb,2.135 +/- 2.042,0.854 +/- 0.068,0.785 +/- 0.024
2,3_imdb_uwcse,9.211 +/- 16.222,1.217 +/- 0.069,1.195 +/- 0.230
3,4_uwcse_imdb,1.521 +/- 0.452,1.564 +/- 0.875,0.719 +/- 0.067
4,5_imdb_uwcse,4.063 +/- 3.638,0.881 +/- 0.101,0.939 +/- 0.203
5,6_uwcse_imdb,1.041 +/- 0.409,0.550 +/- 0.019,0.523 +/- 0.018
6,7_imdb_cora,67.706 +/- 102.821,29.422 +/- 70.333,16.017 +/- 26.629
7,8_imdb_cora,121.834 +/- 98.690,6.224 +/- 1.988,5.357 +/- 1.249
8,9_imdb_cora,3.910 +/- 1.723,6.538 +/- 11.322,2.370 +/- 1.108
9,10_imdb_cora,5.638 +/- 4.162,5.766 +/- 5.287,4.450 +/- 8.920


In [155]:
for j in range(len(experiments)):
    dataset = experiments[j]['id'] + '_' + experiments[j]['source'] + '_' + experiments[j]['target']
    display(Markdown('# Results for ' + dataset))
    table = []
    for metric in ['AUC ROC', 'AUC PR', 'CLL', 'Recall', 'F1', 'Precision', 'Learning and Revision time', 'Inference time']:
    #for metric in ['AUC ROC', 'AUC PR']:
        if dataset in data['results']: 
            #for metric in ['AUC ROC', 'AUC PR']:
            display(Markdown('## ' + metric))
            if metric == 'Precision':
                scratch = np.array([item['scratch']['Precision'][0] for sublist in data['results'][str(dataset)] for item in sublist])
                parameter = np.array([item['transfer']['Parameter Learning results']['Precision'][0] for sublist in data['results'][str(dataset)] for item in sublist])
                transfer = np.array([item['transfer']['Precision'][0] for sublist in data['results'][str(dataset)] for item in sublist])
            elif metric == 'Learning and Revision time':
                scratch = np.array([item['scratch']['Learning time'] for sublist in data['results'][str(dataset)] for item in sublist])
                parameter = np.array([item['transfer']['Parameter Learning results']['Learning time'] for sublist in data['results'][str(dataset)] for item in sublist])
                transfer = np.array([item['transfer']['Learning time'] for sublist in data['results'][str(dataset)] for item in sublist])
            elif metric == 'Inference time':
                scratch = np.array([item['scratch']['Inference time'] for sublist in data['results'][str(dataset)] for item in sublist])
                parameter = np.array([item['transfer']['Parameter Learning results']['Learning time'] for sublist in data['results'][str(dataset)] for item in sublist])
                transfer = np.array([item['transfer']['Inference time'] for sublist in data['results'][str(dataset)] for item in sublist])
            else:
                scratch = np.array([item['scratch'][metric] for sublist in data['results'][str(dataset)] for item in sublist])
                parameter = np.array([item['transfer']['Parameter Learning results'][metric] for sublist in data['results'][str(dataset)] for item in sublist])
                transfer = np.array([item['transfer'][metric] for sublist in data['results'][str(dataset)] for item in sublist])
                for m in range(len(data['results'][str(dataset)])):
                    experiment = data['results'][str(dataset)][m]
                    print('T-test for experiment %s' % (m+1))
                    print(stats.ttest_rel([item['transfer'][metric] for item in experiment],[item['scratch'][metric] for item in experiment]))
            print('\n')
            print('Scratch: %s' % scratch)
            print('Transfer: %s' % parameter)
            print('Transfer & Revision: %s' % transfer)

# Results for 1_imdb_uwcse

## AUC ROC

T-test for experiment 1
Ttest_relResult(statistic=1.0624844844094459, pvalue=0.3479054985886356)


Scratch: [0.963429 0.96225  0.866355 0.948125 0.930758]
Transfer: [0.951677 0.952307 0.959689 0.959375 0.956584]
Transfer & Revision: [0.9631   0.959591 0.933617 0.945703 0.94027 ]


## AUC PR

T-test for experiment 1
Ttest_relResult(statistic=1.130816092033762, pvalue=0.32133967916366135)


Scratch: [0.937107 0.929803 0.774746 0.922869 0.873466]
Transfer: [0.929498 0.931984 0.943146 0.95045  0.939   ]
Transfer & Revision: [0.936386 0.927045 0.880096 0.918773 0.893929]


## CLL

T-test for experiment 1
Ttest_relResult(statistic=0.957348796631256, pvalue=0.392604812907962)


Scratch: [-0.210682 -0.238293 -0.351726 -0.236094 -0.250571]
Transfer: [-0.232353 -0.231667 -0.225631 -0.231815 -0.224265]
Transfer & Revision: [-0.211256 -0.223627 -0.271719 -0.239393 -0.262004]


## Recall

T-test for experiment 1
Ttest_relResult(statistic=0.7022025956586048, pvalue=0.5212637710319327)


Scratch: [1.       0.946237 1.       0.975    1.      ]
Transfer: [1. 1. 1. 1. 1.]
Transfer & Revision: [0.987179 1.       1.       0.975    1.      ]


## F1

T-test for experiment 1
Ttest_relResult(statistic=1.5901219601064347, pvalue=0.18701305773992652)


Scratch: [0.939759 0.926316 0.908297 0.934132 0.941748]
Transfer: [0.939759 0.939394 0.945455 0.941176 0.941748]
Transfer & Revision: [0.944785 0.939394 0.945455 0.934132 0.941748]


## Precision



Scratch: [0.886364 0.907216 0.832    0.896552 0.889908]
Transfer: [0.886364 0.885714 0.896552 0.888889 0.889908]
Transfer & Revision: [0.905882 0.885714 0.896552 0.896552 0.889908]


## Learning and Revision time



Scratch: [6.145 5.745 3.3   8.944 3.566]
Transfer: [3.381 3.62  2.13  5.53  2.793]
Transfer & Revision: [ 7.741  8.719  5.258 14.029  5.814]


## Inference time



Scratch: [0.8   0.79  0.729 0.828 0.751]
Transfer: [3.381 3.62  2.13  5.53  2.793]
Transfer & Revision: [0.773 0.772 0.76  0.821 0.755]


# Results for 2_uwcse_imdb

## AUC ROC

T-test for experiment 1
Ttest_relResult(statistic=0.9999999999999998, pvalue=0.373900966300059)


Scratch: [0.903675 1.       1.       1.       1.      ]
Transfer: [1. 1. 1. 1. 1.]
Transfer & Revision: [1. 1. 1. 1. 1.]


## AUC PR

T-test for experiment 1
Ttest_relResult(statistic=0.9999999999999998, pvalue=0.373900966300059)


Scratch: [0.837662 1.       1.       1.       1.      ]
Transfer: [1. 1. 1. 1. 1.]
Transfer & Revision: [1. 1. 1. 1. 1.]


## CLL

T-test for experiment 1
Ttest_relResult(statistic=1.9242268029265577, pvalue=0.12665381637307352)


Scratch: [-0.289355 -0.179521 -0.094637 -0.094637 -0.213649]
Transfer: [-0.120488 -0.120865 -0.094991 -0.121892 -0.122481]
Transfer & Revision: [-0.131448 -0.131246 -0.097349 -0.100829 -0.099876]


## Recall

T-test for experiment 1
Ttest_relResult(statistic=nan, pvalue=nan)


Scratch: [1. 1. 1. 1. 1.]
Transfer: [1. 1. 1. 1. 1.]
Transfer & Revision: [1. 1. 1. 1. 1.]


## F1

T-test for experiment 1
Ttest_relResult(statistic=2.4489985172744877, pvalue=0.0705212895221997)


Scratch: [0.913165 0.913963 1.       1.       0.915761]
Transfer: [1. 1. 1. 1. 1.]
Transfer & Revision: [1. 1. 1. 1. 1.]


## Precision



Scratch: [0.840206 0.841558 1.       1.       0.844612]
Transfer: [1. 1. 1. 1. 1.]
Transfer & Revision: [1. 1. 1. 1. 1.]


## Learning and Revision time



Scratch: [2.131 2.256 3.878 2.024 2.104]
Transfer: [1.412 1.532 4.151 1.678 1.904]
Transfer & Revision: [3.244 3.289 8.248 3.598 3.583]


## Inference time



Scratch: [0.777 0.777 0.776 0.787 0.808]
Transfer: [1.412 1.532 4.151 1.678 1.904]
Transfer & Revision: [0.834 0.875 0.8   0.899 0.86 ]


# Results for 3_imdb_uwcse

## AUC ROC

T-test for experiment 1
Ttest_relResult(statistic=1.4520439837491346, pvalue=0.22013029574648438)


Scratch: [0.608518 0.59946  0.513122 0.601276 0.699091]
Transfer: [0.625566 0.659607 0.5      0.674538 0.666399]
Transfer & Revision: [0.604264 0.660124 0.513122 0.642957 0.697868]


## AUC PR

T-test for experiment 1
Ttest_relResult(statistic=1.6029638229984553, pvalue=0.18420494755472522)


Scratch: [0.590933 0.617461 0.509288 0.581197 0.677573]
Transfer: [0.591121 0.622102 0.5      0.640797 0.631753]
Transfer & Revision: [0.595975 0.643038 0.509288 0.591847 0.675766]


## CLL

T-test for experiment 1
Ttest_relResult(statistic=0.8428792747000576, pvalue=0.4467470277222079)


Scratch: [-0.723354 -0.708331 -0.709482 -0.720718 -0.642895]
Transfer: [-0.672444 -0.641436 -0.695026 -0.641755 -0.648465]
Transfer & Revision: [-0.745315 -0.681802 -0.709482 -0.683896 -0.640451]


## Recall

T-test for experiment 1
Ttest_relResult(statistic=1.541215846608618, pvalue=0.19811780685432764)


Scratch: [0.504525 0.388805 0.502762 0.488706 0.586817]
Transfer: [0.68552  0.691377 0.       0.667351 0.670418]
Transfer & Revision: [0.547511 0.388805 0.502762 0.513347 0.586817]


## F1

T-test for experiment 1
Ttest_relResult(statistic=1.6291679838866016, pvalue=0.1786096868735445)


Scratch: [0.55335  0.483992 0.508025 0.559342 0.625536]
Transfer: [0.646745 0.670088      nan 0.672182 0.667734]
Transfer & Revision: [0.57414  0.483992 0.508025 0.578035 0.625536]


## Precision



Scratch: [0.612637 0.640898 0.513399 0.653846 0.669725]
Transfer: [0.612121 0.650071      nan 0.677083 0.665072]
Transfer & Revision: [0.603491 0.640898 0.513399 0.661376 0.669725]


## Learning and Revision time



Scratch: [41.302 11.536  2.695 26.485 11.158]
Transfer: [24.781  6.07   1.614  8.704  4.888]
Transfer & Revision: [63.451 14.686  3.443 30.83  13.847]


## Inference time



Scratch: [1.211 1.331 1.029 1.103 1.301]
Transfer: [24.781  6.07   1.614  8.704  4.888]
Transfer & Revision: [1.173 1.243 1.249 1.244 1.178]


# Results for 4_uwcse_imdb

## AUC ROC

T-test for experiment 1
Ttest_relResult(statistic=2.021458999083978, pvalue=0.11330925401556155)


Scratch: [0.491661 0.484614 0.480489 0.493003 0.500828]
Transfer: [0.495009 0.49719  0.50014  0.497258 0.49635 ]
Transfer & Revision: [0.493426 0.495735 0.483937 0.504647 0.499288]


## AUC PR

T-test for experiment 1
Ttest_relResult(statistic=0.49343147501913087, pvalue=0.6475716911775729)


Scratch: [0.495022 0.489343 0.487267 0.494273 0.499097]
Transfer: [0.496868 0.498056 0.502391 0.498147 0.488913]
Transfer & Revision: [0.495492 0.493126 0.493919 0.498581 0.490479]


## CLL

T-test for experiment 1
Ttest_relResult(statistic=-0.3396733792342669, pvalue=0.7511886311248439)


Scratch: [-0.699092 -0.69806  -0.703178 -0.718411 -0.716119]
Transfer: [-0.697378 -0.694501 -0.696145 -0.69453  -0.720515]
Transfer & Revision: [-0.699609 -0.697473 -0.704065 -0.712621 -0.725125]


## Recall

T-test for experiment 1
Ttest_relResult(statistic=1.0, pvalue=0.373900966300059)


Scratch: [0.342342 0.       0.549107 0.405063 0.126582]
Transfer: [0.       0.       0.066964 0.       0.126582]
Transfer & Revision: [0.342342 0.       0.616071 0.405063 0.126582]


## F1

T-test for experiment 1
Ttest_relResult(statistic=nan, pvalue=nan)


Scratch: [0.404255      nan 0.51357  0.443418 0.201342]
Transfer: [     nan      nan 0.118577      nan 0.201342]
Transfer & Revision: [0.404255      nan 0.543307 0.443418 0.201342]


## Precision



Scratch: [0.493506      nan 0.482353 0.489796 0.491803]
Transfer: [     nan      nan 0.517241      nan 0.491803]
Transfer & Revision: [0.493506      nan 0.485915 0.489796 0.491803]


## Learning and Revision time



Scratch: [1.752 1.813 2.365 1.725 1.794]
Transfer: [1.758 1.157 1.678 1.649 1.362]
Transfer & Revision: [4.996 3.867 6.332 4.515 3.106]


## Inference time



Scratch: [0.744 0.743 0.673 0.683 0.751]
Transfer: [1.758 1.157 1.678 1.649 1.362]
Transfer & Revision: [1.975 1.972 1.413 1.662 0.797]


# Results for 5_imdb_uwcse

## AUC ROC

T-test for experiment 1
Ttest_relResult(statistic=-0.45510204754833655, pvalue=0.6726429020204927)


Scratch: [0.483293 0.518781 0.500118 0.50925  0.491703]
Transfer: [0.5 0.5 0.5 0.5 0.5]
Transfer & Revision: [0.493294 0.511096 0.500947 0.49835  0.491173]


## AUC PR

T-test for experiment 1
Ttest_relResult(statistic=-0.7550711961393666, pvalue=0.4922278896841665)


Scratch: [0.491081 0.50829  0.508873 0.514292 0.501426]
Transfer: [0.5 0.5 0.5 0.5 0.5]
Transfer & Revision: [0.492195 0.5032   0.509704 0.504048 0.505231]


## CLL

T-test for experiment 1
Ttest_relResult(statistic=2.294453932932237, pvalue=0.08344678590612374)


Scratch: [-0.715178 -0.705998 -0.714844 -0.710959 -0.741741]
Transfer: [-0.695026 -0.695026 -0.695026 -0.695026 -0.695026]
Transfer & Revision: [-0.711561 -0.705846 -0.71281  -0.709257 -0.733649]


## Recall

T-test for experiment 1
Ttest_relResult(statistic=1.5525419762174137, pvalue=0.1954871628573297)


Scratch: [0.505376 0.347458 0.415385 0.48     0.285714]
Transfer: [0. 0. 0. 0. 0.]
Transfer & Revision: [0.516129 0.5      0.461538 0.49     0.285714]


## F1

T-test for experiment 1
Ttest_relResult(statistic=1.5739913401498271, pvalue=0.19060310531380512)


Scratch: [0.497354 0.41206  0.448133 0.494845 0.363636]
Transfer: [nan nan nan nan nan]
Transfer & Revision: [0.507937 0.502128 0.47619  0.497462 0.363636]


## Precision



Scratch: [0.489583 0.506173 0.486486 0.510638 0.5     ]
Transfer: [nan nan nan nan nan]
Transfer & Revision: [0.5      0.504274 0.491803 0.505155 0.5     ]


## Learning and Revision time



Scratch: [11.395 12.695  3.807 12.721 14.326]
Transfer: [3.381 2.738 2.103 4.9   7.191]
Transfer & Revision: [19.983 17.591  5.725 16.068 17.345]


## Inference time



Scratch: [0.855 1.046 0.823 0.896 1.073]
Transfer: [3.381 2.738 2.103 4.9   7.191]
Transfer & Revision: [0.855 0.928 0.8   0.885 0.938]


# Results for 6_uwcse_imdb

## AUC ROC

T-test for experiment 1
Ttest_relResult(statistic=1.0, pvalue=0.373900966300059)


Scratch: [0.875    0.885714 0.965517 0.906977 0.5     ]
Transfer: [0.875    0.885714 0.965517 0.906977 0.9     ]
Transfer & Revision: [0.875    0.885714 0.965517 0.906977 0.9     ]


## AUC PR

T-test for experiment 1
Ttest_relResult(statistic=1.0, pvalue=0.373900966300059)


Scratch: [0.8      0.813953 0.935484 0.843137 0.5     ]
Transfer: [0.8      0.813953 0.935484 0.843137 0.833333]
Transfer & Revision: [0.8      0.813953 0.935484 0.843137 0.833333]


## CLL

T-test for experiment 1
Ttest_relResult(statistic=1.0, pvalue=0.373900966300059)


Scratch: [-0.352709 -0.320018 -0.264596 -0.300536 -1.052978]
Transfer: [-0.35253  -0.323511 -0.273236 -0.307206 -0.303054]
Transfer & Revision: [-0.352709 -0.320018 -0.264596 -0.300536 -0.299463]


## Recall

T-test for experiment 1
Ttest_relResult(statistic=1.0, pvalue=0.373900966300059)


Scratch: [1. 1. 1. 1. 0.]
Transfer: [1. 1. 1. 1. 1.]
Transfer & Revision: [1. 1. 1. 1. 1.]


## F1

T-test for experiment 1
Ttest_relResult(statistic=nan, pvalue=nan)


Scratch: [0.888889 0.897436 0.966667 0.914894      nan]
Transfer: [0.888889 0.897436 0.966667 0.914894 0.909091]
Transfer & Revision: [0.888889 0.897436 0.966667 0.914894 0.909091]


## Precision



Scratch: [0.8      0.813953 0.935484 0.843137      nan]
Transfer: [0.8      0.813953 0.935484 0.843137 0.833333]
Transfer & Revision: [0.8      0.813953 0.935484 0.843137 0.833333]


## Learning and Revision time



Scratch: [1.211 1.357 1.624 1.044 0.723]
Transfer: [1.074 1.059 1.393 0.877 0.803]
Transfer & Revision: [1.933 2.39  3.073 1.667 1.472]


## Inference time



Scratch: [0.509 0.524 0.522 0.538 0.523]
Transfer: [1.074 1.059 1.393 0.877 0.803]
Transfer & Revision: [0.539 0.562 0.551 0.56  0.54 ]


# Results for 7_imdb_cora

## AUC ROC

T-test for experiment 1
Ttest_relResult(statistic=-1.0924589889945526, pvalue=0.33601639375602715)


Scratch: [0.853829 0.554561 0.858227 0.58278  0.542732]
Transfer: [0.546475 0.437142 0.547299 0.558035 0.535236]
Transfer & Revision: [0.861173 0.546298 0.555388 0.562968 0.540767]


## AUC PR

T-test for experiment 1
Ttest_relResult(statistic=-1.1390907300496613, pvalue=0.3182514610040248)


Scratch: [0.806379 0.528199 0.8113   0.596506 0.56526 ]
Transfer: [0.552575 0.443375 0.555563 0.56414  0.542776]
Transfer & Revision: [0.823759 0.516014 0.564292 0.563819 0.563018]


## CLL

T-test for experiment 1
Ttest_relResult(statistic=-0.9661334850677126, pvalue=0.3886879861450788)


Scratch: [-0.461551 -0.704582 -0.482109 -0.675534 -0.689584]
Transfer: [-0.684943 -0.710286 -0.684914 -0.686242 -0.685676]
Transfer & Revision: [-0.448797 -0.707285 -0.673539 -0.679388 -0.691016]


## Recall

T-test for experiment 1
Ttest_relResult(statistic=-1.6664307302499766, pvalue=0.1709560816741884)


Scratch: [0.919215 0.956812 0.945813 0.104405 0.941224]
Transfer: [0.94413  1.       0.944992 0.       0.952169]
Transfer & Revision: [0.9094   0.954586 0.945402 0.051982 0.927037]


## F1

T-test for experiment 1
Ttest_relResult(statistic=-1.5350177170980004, pvalue=0.19957272893964093)


Scratch: [0.869488 0.68702  0.874549 0.179954 0.689737]
Transfer: [0.697726 0.671651 0.700335      nan 0.691798]
Transfer & Revision: [0.871248 0.687179 0.701706 0.094893 0.683298]


## Precision



Scratch: [0.824864 0.53591  0.813272 0.651099 0.544304]
Transfer: [0.553319 0.505628 0.556307      nan 0.543247]
Transfer & Revision: [0.836168 0.536805 0.557897 0.543779 0.541046]


## Learning and Revision time



Scratch: [269.387 150.995 111.778 184.341  95.117]
Transfer: [163.855  51.02   12.692  69.021  41.941]
Transfer & Revision: [435.206 199.211  46.544 175.758 132.605]


## Inference time



Scratch: [40.527  5.953 19.929  7.364  6.312]
Transfer: [163.855  51.02   12.692  69.021  41.941]
Transfer & Revision: [96.125  6.374  4.559  5.739 34.311]


# Results for 8_imdb_cora

# Results for 9_imdb_cora

# Results for 10_imdb_cora

# Results for 11_uwcse_cora

# Results for 12_uwcse_cora

# Results for 13_uwcse_cora

# Results for 14_uwcse_cora

# Results for 15_yeast_twitter

# Results for 16_yeast_twitter

# Results for 17_yeast_twitter

# Results for 18_yeast_twitter

# Results for 19_yeast_twitter

# Results for 20_yeast_twitter

# Results for 21_yeast_twitter

# Results for 22_twitter_yeast

# Results for 23_twitter_yeast

# Results for 24_twitter_yeast

# Results for 25_twitter_yeast

# Results for 26_twitter_yeast

# Results for 27_twitter_yeast

# Results for 28_twitter_yeast