In [9]:
import matplotlib.pyplot as plt
from IPython.display import display, Markdown, Latex
import numpy as np
import json
import pandas as pd
from scipy import stats

with open('transfer_experiment.json', 'r') as fp:
    data = json.load(fp)

In [10]:
experiments = [
            {'id': '1', 'source':'imdb', 'target':'uwcse', 'predicate':'workedunder', 'to_predicate':'advisedby'},
            {'id': '2', 'source':'uwcse', 'target':'imdb', 'predicate':'advisedby', 'to_predicate':'workedunder'},
            {'id': '3', 'source':'imdb', 'target':'uwcse', 'predicate':'movie', 'to_predicate':'publication'},
            {'id': '4', 'source':'uwcse', 'target':'imdb', 'predicate':'publication', 'to_predicate':'movie'},
            {'id': '5', 'source':'imdb', 'target':'uwcse', 'predicate':'genre', 'to_predicate':'inphase'},
            {'id': '6', 'source':'uwcse', 'target':'imdb', 'predicate':'inphase', 'to_predicate':'genre'},
            {'id': '7', 'source':'imdb', 'target':'cora', 'predicate':'workedunder', 'to_predicate':'samevenue'},
            {'id': '8', 'source':'imdb', 'target':'cora', 'predicate':'workedunder', 'to_predicate':'samebib'},
            {'id': '9', 'source':'imdb', 'target':'cora', 'predicate':'workedunder', 'to_predicate':'sameauthor'},
            {'id': '10', 'source':'imdb', 'target':'cora', 'predicate':'workedunder', 'to_predicate':'sametitle'},
            {'id': '11', 'source':'uwcse', 'target':'cora', 'predicate':'advisedby', 'to_predicate':'samevenue'},
            {'id': '12', 'source':'uwcse', 'target':'cora', 'predicate':'advisedby', 'to_predicate':'samebib'},
            {'id': '13', 'source':'uwcse', 'target':'cora', 'predicate':'advisedby', 'to_predicate':'sameauthor'},
            {'id': '14', 'source':'uwcse', 'target':'cora', 'predicate':'advisedby', 'to_predicate':'sametitle'},
            {'id': '15', 'source':'yeast', 'target':'twitter', 'predicate':'proteinclass', 'to_predicate':'accounttype'},
            {'id': '16', 'source':'yeast', 'target':'twitter', 'predicate':'interaction', 'to_predicate':'follows'},
            {'id': '17', 'source':'yeast', 'target':'twitter', 'predicate':'location', 'to_predicate':'tweets'},
            {'id': '18', 'source':'yeast', 'target':'twitter', 'predicate':'enzyme', 'to_predicate':'tweets'},
            {'id': '19', 'source':'yeast', 'target':'twitter', 'predicate':'function', 'to_predicate':'tweets'},
            {'id': '20', 'source':'yeast', 'target':'twitter', 'predicate':'phenotype', 'to_predicate':'tweets'},
            {'id': '21', 'source':'yeast', 'target':'twitter', 'predicate':'complex', 'to_predicate':'tweets'},
            {'id': '22', 'source':'twitter', 'target':'yeast', 'predicate':'accounttype', 'to_predicate':'proteinclass'},
            {'id': '23', 'source':'twitter', 'target':'yeast', 'predicate':'follows', 'to_predicate':'interaction'},
            {'id': '24', 'source':'twitter', 'target':'yeast', 'predicate':'tweets', 'to_predicate':'location'},
            {'id': '25', 'source':'twitter', 'target':'yeast', 'predicate':'tweets', 'to_predicate':'enzyme'},
            {'id': '26', 'source':'twitter', 'target':'yeast', 'predicate':'tweets', 'to_predicate':'function'},
            {'id': '27', 'source':'twitter', 'target':'yeast', 'predicate':'tweets', 'to_predicate':'phenotype'},
            {'id': '28', 'source':'twitter', 'target':'yeast', 'predicate':'tweets', 'to_predicate':'complex'},
            {'id': '29', 'source':'nell_sports', 'target':'nell_finances', 'predicate':'teamalsoknownas', 'to_predicate':'companyalsoknownas'},
            {'id': '30', 'source':'nell_sports', 'target':'nell_finances', 'predicate':'teamplaysagainstteam', 'to_predicate':'companyalsoknownas'},
            {'id': '31', 'source':'nell_sports', 'target':'nell_finances', 'predicate':'teamplaysagainstteam', 'to_predicate':'acquired'},
            {'id': '32', 'source':'nell_sports', 'target':'nell_finances', 'predicate':'teamplaysagainstteam', 'to_predicate':'bankboughtbank'},
            {'id': '33', 'source':'nell_sports', 'target':'nell_finances', 'predicate':'athleteplayssport', 'to_predicate':'companyceo'},
            {'id': '34', 'source':'nell_sports', 'target':'nell_finances', 'predicate':'athleteplayssport', 'to_predicate':'bankchiefexecutiveceo'},
            {'id': '35', 'source':'nell_sports', 'target':'nell_finances', 'predicate':'athleteplaysforteam', 'to_predicate':'bankchiefexecutiveceo'},
            {'id': '36', 'source':'nell_sports', 'target':'nell_finances', 'predicate':'athleteplaysforteam', 'to_predicate':'companyceo'},
            {'id': '37', 'source':'nell_sports', 'target':'nell_finances', 'predicate':'teamplayssport', 'to_predicate':'companyeconomicsector'},
            {'id': '38', 'source':'nell_finances', 'target':'nell_sports', 'predicate':'companyalsoknownas', 'to_predicate':'teamalsoknownas'},
            {'id': '39', 'source':'nell_finances', 'target':'nell_sports', 'predicate':'companyalsoknownas', 'to_predicate':'teamplaysagainstteam'},
            {'id': '40', 'source':'nell_finances', 'target':'nell_sports', 'predicate':'acquired', 'to_predicate':'teamplaysagainstteam'},
            {'id': '41', 'source':'nell_finances', 'target':'nell_sports', 'predicate':'bankboughtbank', 'to_predicate':'teamplaysagainstteam'},
            {'id': '42', 'source':'nell_finances', 'target':'nell_sports', 'predicate':'companyceo', 'to_predicate':'athleteplayssport'},
            {'id': '43', 'source':'nell_finances', 'target':'nell_sports', 'predicate':'bankchiefexecutiveceo', 'to_predicate':'athleteplayssport'},
            {'id': '44', 'source':'nell_finances', 'target':'nell_sports', 'predicate':'bankchiefexecutiveceo', 'to_predicate':'athleteplaysforteam'},
            {'id': '45', 'source':'nell_finances', 'target':'nell_sports', 'predicate':'companyceo', 'to_predicate':'athleteplaysforteam'},
            {'id': '46', 'source':'nell_finances', 'target':'nell_sports', 'predicate':'companyeconomicsector', 'to_predicate':'teamplayssport'},
]

for metric in ['AUC ROC', 'AUC PR', 'CLL', 'Recall', 'F1', 'Precision', 'Learning and Revision time', 'Inference time']:
    display(Markdown('# Results for ' + metric))
    table = []
    for j in range(len(experiments)):
        dataset = experiments[j]['id'] + '_' + experiments[j]['source'] + '_' + experiments[j]['target']
        if dataset in data['results']: 
            #for metric in ['AUC ROC', 'AUC PR']:
                #display(Markdown('## ' + metric))
            if metric == 'Precision':
                scratch = np.array([item['scratch']['Precision'][0] for sublist in data['results'][str(dataset)] for item in sublist])
                parameter = np.array([item['transfer']['Parameter Learning results']['Precision'][0] for sublist in data['results'][str(dataset)] for item in sublist])
                transfer = np.array([item['transfer']['Precision'][0] for sublist in data['results'][str(dataset)] for item in sublist])
            elif metric == 'Learning and Revision time':
                scratch = np.array([item['scratch']['Learning time'] for sublist in data['results'][str(dataset)] for item in sublist])
                parameter = np.array([item['transfer']['Parameter Learning results']['Learning time'] for sublist in data['results'][str(dataset)] for item in sublist])
                transfer = np.array([item['transfer']['Learning time'] for sublist in data['results'][str(dataset)] for item in sublist])
            elif metric == 'Inference time':
                scratch = np.array([item['scratch']['Inference time'] for sublist in data['results'][str(dataset)] for item in sublist])
                parameter = np.array([item['transfer']['Parameter Learning results']['Learning time'] for sublist in data['results'][str(dataset)] for item in sublist])
                transfer = np.array([item['transfer']['Inference time'] for sublist in data['results'][str(dataset)] for item in sublist])
            else:
                scratch = np.array([item['scratch'][metric] for sublist in data['results'][str(dataset)] for item in sublist])
                parameter = np.array([item['transfer']['Parameter Learning results'][metric] for sublist in data['results'][str(dataset)] for item in sublist])
                transfer = np.array([item['transfer'][metric] for sublist in data['results'][str(dataset)] for item in sublist])
            table.append([dataset, '%.3f +/- %.3f' % (parameter.mean(), 2 * parameter.std()),
            '%.3f +/- %.3f' % (transfer.mean(), 2 * transfer.std()),
            '%.3f +/- %.3f' % (scratch.mean(), 2 * scratch.std())])
    display(pd.DataFrame(table, columns=['Experiment', 'Transfer Learning', 'Transfer Learning with Revision Theory', 'Learning from scratch']))

# Results for AUC ROC

Unnamed: 0,Experiment,Transfer Learning,Transfer Learning with Revision Theory,Learning from scratch
0,1_imdb_uwcse,0.956 +/- 0.007,0.949 +/- 0.024,0.934 +/- 0.072
1,2_uwcse_imdb,0.999 +/- 0.006,1.000 +/- 0.000,0.981 +/- 0.077
2,6_uwcse_imdb,0.907 +/- 0.063,0.907 +/- 0.063,0.827 +/- 0.333
3,35_nell_sports_nell_finances,0.823 +/- 0.167,0.778 +/- 0.084,0.675 +/- 0.199
4,37_nell_sports_nell_finances,0.795 +/- 0.041,0.840 +/- 0.044,0.702 +/- 0.074


# Results for AUC PR

Unnamed: 0,Experiment,Transfer Learning,Transfer Learning with Revision Theory,Learning from scratch
0,1_imdb_uwcse,0.939 +/- 0.015,0.912 +/- 0.044,0.885 +/- 0.119
1,2_uwcse_imdb,0.999 +/- 0.008,1.000 +/- 0.000,0.968 +/- 0.130
2,6_uwcse_imdb,0.845 +/- 0.095,0.845 +/- 0.095,0.779 +/- 0.294
3,35_nell_sports_nell_finances,0.864 +/- 0.119,0.821 +/- 0.049,0.712 +/- 0.239
4,37_nell_sports_nell_finances,0.793 +/- 0.035,0.837 +/- 0.046,0.728 +/- 0.063


# Results for CLL

Unnamed: 0,Experiment,Transfer Learning,Transfer Learning with Revision Theory,Learning from scratch
0,1_imdb_uwcse,-0.229 +/- 0.007,-0.241 +/- 0.046,-0.260 +/- 0.096
1,2_uwcse_imdb,-0.141 +/- 0.135,-0.125 +/- 0.033,-0.174 +/- 0.148
2,6_uwcse_imdb,-0.316 +/- 0.046,-0.307 +/- 0.058,-0.458 +/- 0.598
3,35_nell_sports_nell_finances,-0.535 +/- 0.123,-0.596 +/- 0.130,-0.704 +/- 0.142
4,37_nell_sports_nell_finances,-0.549 +/- 0.039,-0.521 +/- 0.029,-0.621 +/- 0.027


# Results for Recall

Unnamed: 0,Experiment,Transfer Learning,Transfer Learning with Revision Theory,Learning from scratch
0,1_imdb_uwcse,1.000 +/- 0.000,0.992 +/- 0.020,0.982 +/- 0.050
1,2_uwcse_imdb,1.000 +/- 0.000,1.000 +/- 0.000,1.000 +/- 0.000
2,6_uwcse_imdb,1.000 +/- 0.000,1.000 +/- 0.000,0.800 +/- 0.800
3,35_nell_sports_nell_finances,0.655 +/- 0.430,0.710 +/- 0.314,0.603 +/- 0.347
4,37_nell_sports_nell_finances,0.703 +/- 0.150,0.692 +/- 0.167,0.251 +/- 0.096


# Results for F1

Unnamed: 0,Experiment,Transfer Learning,Transfer Learning with Revision Theory,Learning from scratch
0,1_imdb_uwcse,0.942 +/- 0.004,0.941 +/- 0.010,0.929 +/- 0.025
1,2_uwcse_imdb,0.998 +/- 0.010,0.997 +/- 0.018,0.949 +/- 0.084
2,6_uwcse_imdb,0.915 +/- 0.054,0.915 +/- 0.054,nan +/- nan
3,35_nell_sports_nell_finances,0.721 +/- 0.326,0.696 +/- 0.120,0.601 +/- 0.217
4,37_nell_sports_nell_finances,0.729 +/- 0.069,0.749 +/- 0.064,0.392 +/- 0.118


# Results for Precision

Unnamed: 0,Experiment,Transfer Learning,Transfer Learning with Revision Theory,Learning from scratch
0,1_imdb_uwcse,0.889 +/- 0.008,0.894 +/- 0.015,0.882 +/- 0.052
1,2_uwcse_imdb,0.997 +/- 0.020,0.994 +/- 0.035,0.905 +/- 0.155
2,6_uwcse_imdb,0.845 +/- 0.095,0.845 +/- 0.095,nan +/- nan
3,35_nell_sports_nell_finances,0.852 +/- 0.104,0.730 +/- 0.234,0.619 +/- 0.178
4,37_nell_sports_nell_finances,0.766 +/- 0.098,0.830 +/- 0.116,0.918 +/- 0.039


# Results for Learning and Revision time

Unnamed: 0,Experiment,Transfer Learning,Transfer Learning with Revision Theory,Learning from scratch
0,1_imdb_uwcse,6.130 +/- 5.404,11.840 +/- 8.297,7.013 +/- 4.688
1,2_uwcse_imdb,2.802 +/- 2.617,7.169 +/- 10.850,4.290 +/- 5.430
2,6_uwcse_imdb,1.500 +/- 0.993,2.707 +/- 1.463,2.351 +/- 6.096
3,35_nell_sports_nell_finances,2.362 +/- 0.938,5.632 +/- 2.865,3.486 +/- 2.203
4,37_nell_sports_nell_finances,23.341 +/- 27.499,41.116 +/- 40.507,13.779 +/- 10.957


# Results for Inference time

Unnamed: 0,Experiment,Transfer Learning,Transfer Learning with Revision Theory,Learning from scratch
0,1_imdb_uwcse,6.130 +/- 5.404,1.024 +/- 0.685,0.845 +/- 0.314
1,2_uwcse_imdb,2.802 +/- 2.617,1.178 +/- 0.657,0.991 +/- 0.390
2,6_uwcse_imdb,1.500 +/- 0.993,0.704 +/- 0.604,0.614 +/- 0.265
3,35_nell_sports_nell_finances,2.362 +/- 0.938,0.835 +/- 0.336,0.738 +/- 0.160
4,37_nell_sports_nell_finances,23.341 +/- 27.499,2.269 +/- 1.192,1.468 +/- 0.276


In [11]:
for j in range(len(experiments)):
    dataset = experiments[j]['id'] + '_' + experiments[j]['source'] + '_' + experiments[j]['target']
    display(Markdown('# Results for ' + dataset))
    table = []
    for metric in ['AUC ROC', 'AUC PR', 'CLL', 'Recall', 'F1', 'Precision', 'Learning and Revision time', 'Inference time']:
    #for metric in ['AUC ROC', 'AUC PR']:
        if dataset in data['results']: 
            #for metric in ['AUC ROC', 'AUC PR']:
            display(Markdown('## ' + metric))
            if metric == 'Precision':
                scratch = np.array([item['scratch']['Precision'][0] for sublist in data['results'][str(dataset)] for item in sublist])
                parameter = np.array([item['transfer']['Parameter Learning results']['Precision'][0] for sublist in data['results'][str(dataset)] for item in sublist])
                transfer = np.array([item['transfer']['Precision'][0] for sublist in data['results'][str(dataset)] for item in sublist])
            elif metric == 'Learning and Revision time':
                scratch = np.array([item['scratch']['Learning time'] for sublist in data['results'][str(dataset)] for item in sublist])
                parameter = np.array([item['transfer']['Parameter Learning results']['Learning time'] for sublist in data['results'][str(dataset)] for item in sublist])
                transfer = np.array([item['transfer']['Learning time'] for sublist in data['results'][str(dataset)] for item in sublist])
            elif metric == 'Inference time':
                scratch = np.array([item['scratch']['Inference time'] for sublist in data['results'][str(dataset)] for item in sublist])
                parameter = np.array([item['transfer']['Parameter Learning results']['Learning time'] for sublist in data['results'][str(dataset)] for item in sublist])
                transfer = np.array([item['transfer']['Inference time'] for sublist in data['results'][str(dataset)] for item in sublist])
            else:
                scratch = np.array([item['scratch'][metric] for sublist in data['results'][str(dataset)] for item in sublist])
                parameter = np.array([item['transfer']['Parameter Learning results'][metric] for sublist in data['results'][str(dataset)] for item in sublist])
                transfer = np.array([item['transfer'][metric] for sublist in data['results'][str(dataset)] for item in sublist])
                for m in range(len(data['results'][str(dataset)])):
                    print('T-test for experiment %s' % (m+1))
                    pvalue = stats.ttest_rel([item['transfer'][metric] for item in data['results'][str(dataset)][m]],[item['scratch'][metric] for item in data['results'][str(dataset)][m]])
                    print(pvalue)
                    pvalue_table = []
                    pvalue_table.append(['transferRDN-B Ref', '%.3f' % (pvalue[1])])
                    pvalue = stats.ttest_rel([item['transfer']['Parameter Learning results'][metric] for item in data['results'][str(dataset)][m]],[item['scratch'][metric] for item in data['results'][str(dataset)][m]])
                    print(pvalue)
                    pvalue_table.append(['transferRDN-B', '%.3f' % (pvalue[1])])
                    display(pd.DataFrame(pvalue_table, columns=['p-value', 'RDN-B']))
            print('\n')
            print('Scratch: %s' % scratch)
            print('Transfer: %s' % parameter)
            print('Transfer & Revision: %s' % transfer)

# Results for 1_imdb_uwcse

## AUC ROC

T-test for experiment 1
Ttest_relResult(statistic=1.1917929053992558, pvalue=0.29921800189982484)
Ttest_relResult(statistic=1.1614017476693, pvalue=0.31006055071110605)


Unnamed: 0,p-value,RDN-B
0,transferRDN-B Ref,0.299
1,transferRDN-B,0.31


T-test for experiment 2
Ttest_relResult(statistic=1.134631277812482, pvalue=0.3199123877810134)
Ttest_relResult(statistic=1.1553158060926152, pvalue=0.31227528404301436)


Unnamed: 0,p-value,RDN-B
0,transferRDN-B Ref,0.32
1,transferRDN-B,0.312




Scratch: [0.963922 0.963175 0.866355 0.94375  0.930758 0.962278 0.963175 0.866355
 0.946484 0.930758]
Transfer: [0.951677 0.952307 0.959689 0.959375 0.956584 0.951677 0.952307 0.959689
 0.959375 0.956584]
Transfer & Revision: [0.96573  0.959591 0.933617 0.946719 0.94027  0.964826 0.959591 0.933617
 0.945859 0.94027 ]


## AUC PR

T-test for experiment 1
Ttest_relResult(statistic=1.4684922708408426, pvalue=0.21589128550918935)
Ttest_relResult(statistic=1.7349502513037778, pvalue=0.15776662417341303)


Unnamed: 0,p-value,RDN-B
0,transferRDN-B Ref,0.216
1,transferRDN-B,0.158


T-test for experiment 2
Ttest_relResult(statistic=1.2342674649960061, pvalue=0.284659660327558)
Ttest_relResult(statistic=1.6595028948791966, pvalue=0.17235266512054795)


Unnamed: 0,p-value,RDN-B
0,transferRDN-B Ref,0.285
1,transferRDN-B,0.172




Scratch: [0.938046 0.93149  0.774746 0.901867 0.873466 0.932796 0.93149  0.774746
 0.919846 0.873466]
Transfer: [0.929498 0.931984 0.943146 0.95045  0.939    0.929498 0.931984 0.943146
 0.95045  0.939   ]
Transfer & Revision: [0.942244 0.927045 0.880096 0.920731 0.893929 0.938697 0.927045 0.880096
 0.918908 0.893929]


## CLL

T-test for experiment 1
Ttest_relResult(statistic=1.2170089980206813, pvalue=0.29049248798508615)
Ttest_relResult(statistic=1.2307991843955208, pvalue=0.2858228417037599)


Unnamed: 0,p-value,RDN-B
0,transferRDN-B Ref,0.29
1,transferRDN-B,0.286


T-test for experiment 2
Ttest_relResult(statistic=1.131132180844137, pvalue=0.3212212059608435)
Ttest_relResult(statistic=1.2119497029010058, pvalue=0.29222369592431313)


Unnamed: 0,p-value,RDN-B
0,transferRDN-B Ref,0.321
1,transferRDN-B,0.292




Scratch: [-0.210682 -0.247882 -0.351726 -0.239378 -0.250571 -0.211385 -0.247882
 -0.351726 -0.236668 -0.250571]
Transfer: [-0.232353 -0.231667 -0.225631 -0.231815 -0.224265 -0.232353 -0.231667
 -0.225631 -0.231815 -0.224265]
Transfer & Revision: [-0.2089   -0.223627 -0.271719 -0.235797 -0.262004 -0.210545 -0.223627
 -0.271719 -0.237443 -0.262004]


## Recall

T-test for experiment 1
Ttest_relResult(statistic=0.7508391392284557, pvalue=0.4945066522512446)
Ttest_relResult(statistic=1.4187699559636175, pvalue=0.22896287255263786)


Unnamed: 0,p-value,RDN-B
0,transferRDN-B Ref,0.495
1,transferRDN-B,0.229


T-test for experiment 2
Ttest_relResult(statistic=0.7508391392284557, pvalue=0.4945066522512446)
Ttest_relResult(statistic=1.4187699559636175, pvalue=0.22896287255263786)


Unnamed: 0,p-value,RDN-B
0,transferRDN-B Ref,0.495
1,transferRDN-B,0.229




Scratch: [1.       0.935484 1.       0.975    1.       1.       0.935484 1.
 0.975    1.      ]
Transfer: [1. 1. 1. 1. 1. 1. 1. 1. 1. 1.]
Transfer & Revision: [0.987179 1.       1.       0.975    1.       0.987179 1.       1.
 0.975    1.      ]


## F1

T-test for experiment 1
Ttest_relResult(statistic=1.444862319246458, pvalue=0.22200730294727936)
Ttest_relResult(statistic=1.790304165161057, pvalue=0.14789823332561916)


Unnamed: 0,p-value,RDN-B
0,transferRDN-B Ref,0.222
1,transferRDN-B,0.148


T-test for experiment 2
Ttest_relResult(statistic=1.7108868242063406, pvalue=0.16227212856544418)
Ttest_relResult(statistic=1.790304165161057, pvalue=0.14789823332561916)


Unnamed: 0,p-value,RDN-B
0,transferRDN-B Ref,0.162
1,transferRDN-B,0.148




Scratch: [0.939759 0.920635 0.908297 0.934132 0.941748 0.939759 0.920635 0.908297
 0.934132 0.941748]
Transfer: [0.939759 0.939394 0.945455 0.941176 0.941748 0.939759 0.939394 0.945455
 0.941176 0.941748]
Transfer & Revision: [0.944785 0.939394 0.945455 0.928571 0.941748 0.944785 0.939394 0.945455
 0.934132 0.941748]


## Precision



Scratch: [0.886364 0.90625  0.832    0.896552 0.889908 0.886364 0.90625  0.832
 0.896552 0.889908]
Transfer: [0.886364 0.885714 0.896552 0.888889 0.889908 0.886364 0.885714 0.896552
 0.888889 0.889908]
Transfer & Revision: [0.905882 0.885714 0.896552 0.886364 0.889908 0.905882 0.885714 0.896552
 0.896552 0.889908]


## Learning and Revision time



Scratch: [ 8.582  9.099  4.511 11.407  5.165  6.794  6.763  3.763  9.082  4.967]
Transfer: [ 4.442  7.751 11.916  9.409  6.629  3.86   5.409  2.907  5.378  3.597]
Transfer & Revision: [ 9.761 16.505 15.469 19.441 10.068  8.482 10.541  6.683 14.593  6.859]


## Inference time



Scratch: [0.765 1.299 0.796 0.848 0.794 0.759 0.878 0.735 0.815 0.758]
Transfer: [ 4.442  7.751 11.916  9.409  6.629  3.86   5.409  2.907  5.378  3.597]
Transfer & Revision: [0.927 1.922 1.381 0.847 0.818 0.803 0.878 0.804 0.829 1.029]


# Results for 2_uwcse_imdb

## AUC ROC

T-test for experiment 1
Ttest_relResult(statistic=0.9999999999999998, pvalue=0.373900966300059)
Ttest_relResult(statistic=0.9999999999999998, pvalue=0.373900966300059)


Unnamed: 0,p-value,RDN-B
0,transferRDN-B Ref,0.374
1,transferRDN-B,0.374


T-test for experiment 2
Ttest_relResult(statistic=0.9999999999999998, pvalue=0.373900966300059)
Ttest_relResult(statistic=0.8648408992340092, pvalue=0.435909369271908)


Unnamed: 0,p-value,RDN-B
0,transferRDN-B Ref,0.374
1,transferRDN-B,0.436




Scratch: [0.903675 1.       1.       1.       1.       0.903675 1.       1.
 1.       1.      ]
Transfer: [1.       1.       1.       1.       1.       1.       1.       0.989655
 1.       1.      ]
Transfer & Revision: [1. 1. 1. 1. 1. 1. 1. 1. 1. 1.]


## AUC PR

T-test for experiment 1
Ttest_relResult(statistic=0.9999999999999998, pvalue=0.373900966300059)
Ttest_relResult(statistic=0.9999999999999998, pvalue=0.373900966300059)


Unnamed: 0,p-value,RDN-B
0,transferRDN-B Ref,0.374
1,transferRDN-B,0.374


T-test for experiment 2
Ttest_relResult(statistic=0.9999999999999998, pvalue=0.373900966300059)
Ttest_relResult(statistic=0.898501355359513, pvalue=0.4197148545394023)


Unnamed: 0,p-value,RDN-B
0,transferRDN-B Ref,0.374
1,transferRDN-B,0.42




Scratch: [0.837662 1.       1.       1.       1.       0.837662 1.       1.
 1.       1.      ]
Transfer: [1.       1.       1.       1.       1.       1.       1.       0.986901
 1.       1.      ]
Transfer & Revision: [1. 1. 1. 1. 1. 1. 1. 1. 1. 1.]


## CLL

T-test for experiment 1
Ttest_relResult(statistic=1.3856978633473873, pvalue=0.23809220803766912)
Ttest_relResult(statistic=1.5669459424512866, pvalue=0.192193358384968)


Unnamed: 0,p-value,RDN-B
0,transferRDN-B Ref,0.238
1,transferRDN-B,0.192


T-test for experiment 2
Ttest_relResult(statistic=1.5048287213993148, pvalue=0.2068167259881989)
Ttest_relResult(statistic=0.16726753053797272, pvalue=0.8752752532511838)


Unnamed: 0,p-value,RDN-B
0,transferRDN-B Ref,0.207
1,transferRDN-B,0.875




Scratch: [-0.289355 -0.179547 -0.094637 -0.094637 -0.213649 -0.289355 -0.179547
 -0.094637 -0.094637 -0.213649]
Transfer: [-0.125718 -0.126244 -0.098728 -0.12804  -0.116906 -0.121506 -0.121913
 -0.341716 -0.120532 -0.105816]
Transfer & Revision: [-0.140467 -0.142245 -0.097161 -0.134758 -0.126925 -0.134555 -0.134478
 -0.097894 -0.133249 -0.105495]


## Recall

T-test for experiment 1
Ttest_relResult(statistic=nan, pvalue=nan)
Ttest_relResult(statistic=nan, pvalue=nan)


Unnamed: 0,p-value,RDN-B
0,transferRDN-B Ref,
1,transferRDN-B,


T-test for experiment 2
Ttest_relResult(statistic=nan, pvalue=nan)
Ttest_relResult(statistic=nan, pvalue=nan)


Unnamed: 0,p-value,RDN-B
0,transferRDN-B Ref,
1,transferRDN-B,




Scratch: [1. 1. 1. 1. 1. 1. 1. 1. 1. 1.]
Transfer: [1. 1. 1. 1. 1. 1. 1. 1. 1. 1.]
Transfer & Revision: [1. 1. 1. 1. 1. 1. 1. 1. 1. 1.]


## F1

T-test for experiment 1
Ttest_relResult(statistic=2.3332880372203038, pvalue=0.0799636124595334)
Ttest_relResult(statistic=2.4489985172744877, pvalue=0.0705212895221997)


Unnamed: 0,p-value,RDN-B
0,transferRDN-B Ref,0.08
1,transferRDN-B,0.071


T-test for experiment 2
Ttest_relResult(statistic=2.4489985172744877, pvalue=0.0705212895221997)
Ttest_relResult(statistic=2.0696129836028474, pvalue=0.10727717991713963)


Unnamed: 0,p-value,RDN-B
0,transferRDN-B Ref,0.071
1,transferRDN-B,0.107




Scratch: [0.913165 0.913963 1.       1.       0.915761 0.913165 0.913963 1.
 1.       0.915761]
Transfer: [1.       1.       1.       1.       1.       1.       1.       0.983133
 1.       1.      ]
Transfer & Revision: [1.       1.       1.       1.       0.969784 1.       1.       1.
 1.       1.      ]


## Precision



Scratch: [0.840206 0.841558 1.       1.       0.844612 0.840206 0.841558 1.
 1.       0.844612]
Transfer: [1.       1.       1.       1.       1.       1.       1.       0.966825
 1.       1.      ]
Transfer & Revision: [1.       1.       1.       1.       0.941341 1.       1.       1.
 1.       1.      ]


## Learning and Revision time



Scratch: [ 3.41   8.46  10.399  3.811  2.749  2.456  2.989  4.62   1.901  2.109]
Transfer: [2.168 2.513 6.473 2.945 2.529 1.694 2.447 3.304 2.174 1.772]
Transfer & Revision: [ 3.995 21.72  11.46   5.425  5.165  3.37   4.186  8.598  4.107  3.666]


## Inference time



Scratch: [1.002 1.291 0.759 0.823 0.791 0.79  1.117 1.214 0.902 1.224]
Transfer: [2.168 2.513 6.473 2.945 2.529 1.694 2.447 3.304 2.174 1.772]
Transfer & Revision: [1.935 1.116 0.993 0.896 0.996 1.63  1.224 0.842 1.164 0.985]


# Results for 3_imdb_uwcse

# Results for 4_uwcse_imdb

# Results for 5_imdb_uwcse

# Results for 6_uwcse_imdb

## AUC ROC

T-test for experiment 1
Ttest_relResult(statistic=1.0, pvalue=0.373900966300059)
Ttest_relResult(statistic=1.0, pvalue=0.373900966300059)


Unnamed: 0,p-value,RDN-B
0,transferRDN-B Ref,0.374
1,transferRDN-B,0.374


T-test for experiment 2
Ttest_relResult(statistic=1.0, pvalue=0.373900966300059)
Ttest_relResult(statistic=1.0, pvalue=0.373900966300059)


Unnamed: 0,p-value,RDN-B
0,transferRDN-B Ref,0.374
1,transferRDN-B,0.374




Scratch: [0.875    0.885714 0.965517 0.906977 0.5      0.875    0.885714 0.965517
 0.906977 0.5     ]
Transfer: [0.875    0.885714 0.965517 0.906977 0.9      0.875    0.885714 0.965517
 0.906977 0.9     ]
Transfer & Revision: [0.875    0.885714 0.965517 0.906977 0.9      0.875    0.885714 0.965517
 0.906977 0.9     ]


## AUC PR

T-test for experiment 1
Ttest_relResult(statistic=1.0, pvalue=0.373900966300059)
Ttest_relResult(statistic=1.0, pvalue=0.373900966300059)


Unnamed: 0,p-value,RDN-B
0,transferRDN-B Ref,0.374
1,transferRDN-B,0.374


T-test for experiment 2
Ttest_relResult(statistic=1.0, pvalue=0.373900966300059)
Ttest_relResult(statistic=1.0, pvalue=0.373900966300059)


Unnamed: 0,p-value,RDN-B
0,transferRDN-B Ref,0.374
1,transferRDN-B,0.374




Scratch: [0.8      0.813953 0.935484 0.843137 0.5      0.8      0.813953 0.935484
 0.843137 0.5     ]
Transfer: [0.8      0.813953 0.935484 0.843137 0.833333 0.8      0.813953 0.935484
 0.843137 0.833333]
Transfer & Revision: [0.8      0.813953 0.935484 0.843137 0.833333 0.8      0.813953 0.935484
 0.843137 0.833333]


## CLL

T-test for experiment 1
Ttest_relResult(statistic=1.0, pvalue=0.373900966300059)
Ttest_relResult(statistic=0.9370088998261259, pvalue=0.4018030398979859)


Unnamed: 0,p-value,RDN-B
0,transferRDN-B Ref,0.374
1,transferRDN-B,0.402


T-test for experiment 2
Ttest_relResult(statistic=1.0, pvalue=0.373900966300059)
Ttest_relResult(statistic=0.9340127580731116, pvalue=0.40317328068072483)


Unnamed: 0,p-value,RDN-B
0,transferRDN-B Ref,0.374
1,transferRDN-B,0.403




Scratch: [-0.352709 -0.320018 -0.264596 -0.300536 -1.052978 -0.352709 -0.320018
 -0.264596 -0.300536 -1.052978]
Transfer: [-0.351932 -0.326947 -0.282685 -0.314344 -0.304933 -0.352356 -0.327349
 -0.283226 -0.314791 -0.305401]
Transfer & Revision: [-0.352709 -0.320018 -0.264596 -0.300536 -0.299128 -0.352709 -0.320018
 -0.264596 -0.300536 -0.299128]


## Recall

T-test for experiment 1
Ttest_relResult(statistic=1.0, pvalue=0.373900966300059)
Ttest_relResult(statistic=1.0, pvalue=0.373900966300059)


Unnamed: 0,p-value,RDN-B
0,transferRDN-B Ref,0.374
1,transferRDN-B,0.374


T-test for experiment 2
Ttest_relResult(statistic=1.0, pvalue=0.373900966300059)
Ttest_relResult(statistic=1.0, pvalue=0.373900966300059)


Unnamed: 0,p-value,RDN-B
0,transferRDN-B Ref,0.374
1,transferRDN-B,0.374




Scratch: [1. 1. 1. 1. 0. 1. 1. 1. 1. 0.]
Transfer: [1. 1. 1. 1. 1. 1. 1. 1. 1. 1.]
Transfer & Revision: [1. 1. 1. 1. 1. 1. 1. 1. 1. 1.]


## F1

T-test for experiment 1
Ttest_relResult(statistic=nan, pvalue=nan)
Ttest_relResult(statistic=nan, pvalue=nan)


Unnamed: 0,p-value,RDN-B
0,transferRDN-B Ref,
1,transferRDN-B,


T-test for experiment 2
Ttest_relResult(statistic=nan, pvalue=nan)
Ttest_relResult(statistic=nan, pvalue=nan)


Unnamed: 0,p-value,RDN-B
0,transferRDN-B Ref,
1,transferRDN-B,




Scratch: [0.888889 0.897436 0.966667 0.914894      nan 0.888889 0.897436 0.966667
 0.914894      nan]
Transfer: [0.888889 0.897436 0.966667 0.914894 0.909091 0.888889 0.897436 0.966667
 0.914894 0.909091]
Transfer & Revision: [0.888889 0.897436 0.966667 0.914894 0.909091 0.888889 0.897436 0.966667
 0.914894 0.909091]


## Precision



Scratch: [0.8      0.813953 0.935484 0.843137      nan 0.8      0.813953 0.935484
 0.843137      nan]
Transfer: [0.8      0.813953 0.935484 0.843137 0.833333 0.8      0.813953 0.935484
 0.843137 0.833333]
Transfer & Revision: [0.8      0.813953 0.935484 0.843137 0.833333 0.8      0.813953 0.935484
 0.843137 0.833333]


## Learning and Revision time



Scratch: [ 1.283  1.426  1.563 11.468  1.331  1.269  1.379  1.689  1.352  0.75 ]
Transfer: [1.112 2.298 1.294 2.459 1.119 1.143 1.232 1.796 0.972 1.579]
Transfer & Revision: [2.281 3.886 2.861 3.965 1.72  2.21  2.57  3.22  1.945 2.413]


## Inference time



Scratch: [0.664 0.517 0.846 0.45  0.416 0.559 0.585 0.665 0.805 0.634]
Transfer: [1.112 2.298 1.294 2.459 1.119 1.143 1.232 1.796 0.972 1.579]
Transfer & Revision: [1.099 0.581 1.445 0.722 0.423 0.582 0.568 0.549 0.531 0.542]


# Results for 7_imdb_cora

# Results for 8_imdb_cora

# Results for 9_imdb_cora

# Results for 10_imdb_cora

# Results for 11_uwcse_cora

# Results for 12_uwcse_cora

# Results for 13_uwcse_cora

# Results for 14_uwcse_cora

# Results for 15_yeast_twitter

# Results for 16_yeast_twitter

# Results for 17_yeast_twitter

# Results for 18_yeast_twitter

# Results for 19_yeast_twitter

# Results for 20_yeast_twitter

# Results for 21_yeast_twitter

# Results for 22_twitter_yeast

# Results for 23_twitter_yeast

# Results for 24_twitter_yeast

# Results for 25_twitter_yeast

# Results for 26_twitter_yeast

# Results for 27_twitter_yeast

# Results for 28_twitter_yeast

# Results for 29_nell_sports_nell_finances

# Results for 30_nell_sports_nell_finances

# Results for 31_nell_sports_nell_finances

# Results for 32_nell_sports_nell_finances

# Results for 33_nell_sports_nell_finances

# Results for 34_nell_sports_nell_finances

# Results for 35_nell_sports_nell_finances

## AUC ROC

T-test for experiment 1
Ttest_relResult(statistic=1.4419115471820416, pvalue=0.28606944512622406)
Ttest_relResult(statistic=1.874877364354068, pvalue=0.20164949259959403)


Unnamed: 0,p-value,RDN-B
0,transferRDN-B Ref,0.286
1,transferRDN-B,0.202


T-test for experiment 2
Ttest_relResult(statistic=1.3929983513315243, pvalue=0.29825714397447667)
Ttest_relResult(statistic=1.548629751932808, pvalue=0.2615732174579369)


Unnamed: 0,p-value,RDN-B
0,transferRDN-B Ref,0.298
1,transferRDN-B,0.262




Scratch: [0.586735 0.653061 0.802734 0.545918 0.653061 0.808594]
Transfer: [0.887755 0.716837 0.875    0.890306 0.693878 0.875   ]
Transfer & Revision: [0.818878 0.732143 0.794922 0.798469 0.709184 0.814453]


## AUC PR

T-test for experiment 1
Ttest_relResult(statistic=1.18429938913556, pvalue=0.35796561585754183)
Ttest_relResult(statistic=1.4819080411135122, pvalue=0.2765627737974175)


Unnamed: 0,p-value,RDN-B
0,transferRDN-B Ref,0.358
1,transferRDN-B,0.277


T-test for experiment 2
Ttest_relResult(statistic=1.214393021500958, pvalue=0.3485254487108007)
Ttest_relResult(statistic=1.3222028341807381, pvalue=0.317055318097611)


Unnamed: 0,p-value,RDN-B
0,transferRDN-B Ref,0.349
1,transferRDN-B,0.317




Scratch: [0.570559 0.730226 0.84381  0.545399 0.730226 0.853288]
Transfer: [0.928452 0.787069 0.886249 0.922247 0.780312 0.876913]
Transfer & Revision: [0.845443 0.792743 0.820927 0.838769 0.783905 0.842971]


## CLL

T-test for experiment 1
Ttest_relResult(statistic=1.4675471684166286, pvalue=0.27992989122829515)
Ttest_relResult(statistic=3.0810336364333004, pvalue=0.09116694429038479)


Unnamed: 0,p-value,RDN-B
0,transferRDN-B Ref,0.28
1,transferRDN-B,0.091


T-test for experiment 2
Ttest_relResult(statistic=1.4734106847244168, pvalue=0.2785489109198853)
Ttest_relResult(statistic=3.4715891316342073, pvalue=0.07389481809393207)


Unnamed: 0,p-value,RDN-B
0,transferRDN-B Ref,0.279
1,transferRDN-B,0.074




Scratch: [-0.778962 -0.712691 -0.600497 -0.792655 -0.712691 -0.627312]
Transfer: [-0.519091 -0.624733 -0.470274 -0.514962 -0.609799 -0.470019]
Transfer & Revision: [-0.54019  -0.624647 -0.609709 -0.539966 -0.718417 -0.540207]


## Recall

T-test for experiment 1
Ttest_relResult(statistic=1.0, pvalue=0.42264973081037427)
Ttest_relResult(statistic=0.1817286476094054, pvalue=0.8725464305171351)


Unnamed: 0,p-value,RDN-B
0,transferRDN-B Ref,0.423
1,transferRDN-B,0.873


T-test for experiment 2
Ttest_relResult(statistic=0.9999999999999999, pvalue=0.42264973081037427)
Ttest_relResult(statistic=0.4166097685044111, pvalue=0.7174188015008727)


Unnamed: 0,p-value,RDN-B
0,transferRDN-B Ref,0.423
1,transferRDN-B,0.717




Scratch: [0.5      0.5      0.875    0.428571 0.5      0.8125  ]
Transfer: [0.857143 0.357143 0.75     0.857143 0.357143 0.75    ]
Transfer & Revision: [0.857143 0.5      0.875    0.714286 0.5      0.8125  ]


## F1

T-test for experiment 1
Ttest_relResult(statistic=1.0321559009954324, pvalue=0.4104704722314203)
Ttest_relResult(statistic=0.7378475942653685, pvalue=0.5374354519196187)


Unnamed: 0,p-value,RDN-B
0,transferRDN-B Ref,0.41
1,transferRDN-B,0.537


T-test for experiment 2
Ttest_relResult(statistic=2.252579312476151, pvalue=0.15307670656845154)
Ttest_relResult(statistic=0.8699955891710288, pvalue=0.47602912348217286)


Unnamed: 0,p-value,RDN-B
0,transferRDN-B Ref,0.153
1,transferRDN-B,0.476




Scratch: [0.518519 0.583333 0.756757 0.444444 0.583333 0.722222]
Transfer: [0.888889 0.5      0.774194 0.888889 0.5      0.774194]
Transfer & Revision: [0.75     0.636364 0.717949 0.645161 0.636364 0.787879]


## Precision



Scratch: [0.538462 0.7      0.666667 0.461538 0.7      0.65    ]
Transfer: [0.923077 0.833333 0.8      0.923077 0.833333 0.8     ]
Transfer & Revision: [0.666667 0.875    0.608696 0.588235 0.875    0.764706]


## Learning and Revision time



Scratch: [2.58  3.967 1.963 4.177 5.264 2.968]
Transfer: [2.798 2.898 1.993 1.983 2.769 1.732]
Transfer & Revision: [7.375 6.963 4.07  5.528 6.353 3.504]


## Inference time



Scratch: [0.845 0.791 0.597 0.784 0.699 0.714]
Transfer: [2.798 2.898 1.993 1.983 2.769 1.732]
Transfer & Revision: [0.858 0.75  0.922 0.744 0.601 1.136]


# Results for 36_nell_sports_nell_finances

# Results for 37_nell_sports_nell_finances

## AUC ROC

T-test for experiment 1
Ttest_relResult(statistic=4.6362531447146385, pvalue=0.04350905001579996)
Ttest_relResult(statistic=3.752946592381847, pvalue=0.06423425795411473)


Unnamed: 0,p-value,RDN-B
0,transferRDN-B Ref,0.044
1,transferRDN-B,0.064


T-test for experiment 2
Ttest_relResult(statistic=7.856472882746483, pvalue=0.015817734097657143)
Ttest_relResult(statistic=3.9273534185356898, pvalue=0.05914056034799987)


Unnamed: 0,p-value,RDN-B
0,transferRDN-B Ref,0.016
1,transferRDN-B,0.059




Scratch: [0.656561 0.746221 0.650564 0.737191 0.716032 0.704314]
Transfer: [0.813615 0.805888 0.815971 0.770404 0.801619 0.763648]
Transfer & Revision: [0.814689 0.826124 0.828358 0.843827 0.883056 0.84154 ]


## AUC PR

T-test for experiment 1
Ttest_relResult(statistic=4.062383441543728, pvalue=0.05559056447891556)
Ttest_relResult(statistic=4.05941587447771, pvalue=0.05566520821013106)


Unnamed: 0,p-value,RDN-B
0,transferRDN-B Ref,0.056
1,transferRDN-B,0.056


T-test for experiment 2
Ttest_relResult(statistic=6.457874200589222, pvalue=0.0231490675978073)
Ttest_relResult(statistic=2.347637627780465, pvalue=0.14341483921237433)


Unnamed: 0,p-value,RDN-B
0,transferRDN-B Ref,0.023
1,transferRDN-B,0.143




Scratch: [0.687117 0.766821 0.685156 0.757499 0.737309 0.732857]
Transfer: [0.788659 0.813193 0.804357 0.769075 0.811302 0.774232]
Transfer & Revision: [0.822835 0.820615 0.812044 0.840975 0.881888 0.846539]


## CLL

T-test for experiment 1
Ttest_relResult(statistic=6.263897698694941, pvalue=0.02455180668145851)
Ttest_relResult(statistic=4.658063908691707, pvalue=0.04312847091789625)


Unnamed: 0,p-value,RDN-B
0,transferRDN-B Ref,0.025
1,transferRDN-B,0.043


T-test for experiment 2
Ttest_relResult(statistic=22.092695138470805, pvalue=0.0020425392820941943)
Ttest_relResult(statistic=4.130837034837883, pvalue=0.053908459934730805)


Unnamed: 0,p-value,RDN-B
0,transferRDN-B Ref,0.002
1,transferRDN-B,0.054




Scratch: [-0.630559 -0.603246 -0.645568 -0.620291 -0.611903 -0.614619]
Transfer: [-0.543589 -0.547527 -0.524482 -0.568325 -0.531832 -0.580595]
Transfer & Revision: [-0.548248 -0.511502 -0.50975  -0.530988 -0.512988 -0.510207]


## Recall

T-test for experiment 1
Ttest_relResult(statistic=5.554909372246667, pvalue=0.03091269550912386)
Ttest_relResult(statistic=5.508111259648495, pvalue=0.03141560894339859)


Unnamed: 0,p-value,RDN-B
0,transferRDN-B Ref,0.031
1,transferRDN-B,0.031


T-test for experiment 2
Ttest_relResult(statistic=8.333924579246682, pvalue=0.014094283648443525)
Ttest_relResult(statistic=6.8459480763101, pvalue=0.020677484680479204)


Unnamed: 0,p-value,RDN-B
0,transferRDN-B Ref,0.014
1,transferRDN-B,0.021




Scratch: [0.194981 0.312741 0.180769 0.27027  0.291506 0.257692]
Transfer: [0.73166  0.637066 0.809615 0.741313 0.579151 0.717308]
Transfer & Revision: [0.608108 0.698842 0.842308 0.604247 0.65444  0.746154]


## F1

T-test for experiment 1
Ttest_relResult(statistic=5.985977312005603, pvalue=0.026791597286138502)
Ttest_relResult(statistic=5.054863533107251, pvalue=0.036979203774661275)


Unnamed: 0,p-value,RDN-B
0,transferRDN-B Ref,0.027
1,transferRDN-B,0.037


T-test for experiment 2
Ttest_relResult(statistic=20.899442892136637, pvalue=0.0022816144610511356)
Ttest_relResult(statistic=14.701925022987716, pvalue=0.004594628598135102)


Unnamed: 0,p-value,RDN-B
0,transferRDN-B Ref,0.002
1,transferRDN-B,0.005




Scratch: [0.322169 0.464183 0.303716 0.41791  0.438953 0.403008]
Transfer: [0.755733 0.699153 0.787652 0.732126 0.689655 0.707109]
Transfer & Revision: [0.71267  0.741803 0.807373 0.714612 0.764374 0.753398]


## Precision



Scratch: [0.926606 0.9      0.949495 0.921053 0.888235 0.924138]
Transfer: [0.781443 0.774648 0.766849 0.723164 0.852273 0.697196]
Transfer & Revision: [0.860656 0.790393 0.775221 0.874302 0.918699 0.760784]


## Learning and Revision time



Scratch: [24.324 12.578  9.775  9.586  9.131 17.278]
Transfer: [ 8.967  9.232 30.577 18.092 24.389 48.789]
Transfer & Revision: [18.857 21.304 51.588 31.056 46.221 77.671]


## Inference time



Scratch: [1.326 1.371 1.746 1.448 1.398 1.518]
Transfer: [ 8.967  9.232 30.577 18.092 24.389 48.789]
Transfer & Revision: [1.762 2.11  3.403 1.98  1.699 2.66 ]


# Results for 38_nell_finances_nell_sports

# Results for 39_nell_finances_nell_sports

# Results for 40_nell_finances_nell_sports

# Results for 41_nell_finances_nell_sports

# Results for 42_nell_finances_nell_sports

# Results for 43_nell_finances_nell_sports

# Results for 44_nell_finances_nell_sports

# Results for 45_nell_finances_nell_sports

# Results for 46_nell_finances_nell_sports

In [6]:
def paired_ttest_kfold_cv(estimator1, estimator2):
    score_diff = []
    cv = len(estimator1)
    for i in range(len(estimator1)):
        score_diff.append(estimator1[i] - estimator2[i])

    avg_diff = np.mean(score_diff)

    numerator = avg_diff * np.sqrt(cv)
    denominator = np.sqrt(sum([(diff - avg_diff)**2 for diff in score_diff])
                          / (cv - 1))
    t_stat = numerator / denominator

    pvalue = stats.t.sf(np.abs(t_stat), cv - 1)*2.
    return float(t_stat), float(pvalue)

In [7]:
paired_ttest_kfold_cv([0.693686, 0.694682, 0.68722,  0.660296],
[0.636807, 0.636639, 0.634388, 0.611234])

(26.497231209975535, 0.00011793614005630308)