# Interpretation-Net Training

# Experiment 1: I-Net Performance for Different Algebras and Complexities
# Experiment 2: I-Net Performance Comparison for λ-Nets with Different Training Levels
# Experiment 3: I-Net Performance Comparison for Different Training Data Sizes

## Specification of Experiment Settings

In [1]:
#######################################################################################################################################
###################################################### CONFIG FILE ####################################################################
#######################################################################################################################################
# Central experiment configuration. The entries of every section are later exported as
# notebook-level globals via globals().update(...), so the keys double as variable names.
# Entries set to None with a "calculated" note are filled in by the adjustment cells below.
sleep_time = 0 #minutes; handed to sleep_minutes() once the setup is done


config = {
    'data': {
        'd': 5, #degree
        'n': 1, #number of variables
        'sparsity': None, #calculated later as nCr(n+d, d)
        'sample_sparsity': None, #falls back to 'sparsity' later if left at None
        'x_max': 1,
        'x_min': 0,
        'x_distrib': 'uniform', #'normal', 'uniform', 'beta', 'Gamma', 'laplace'
        'a_max': 1,
        'a_min': -1,
        'lambda_nets_total': 10000,
        'noise': 0,
        'noise_distrib': 'normal', #'normal', 'uniform', 'beta', 'Gamma', 'laplace'
        
        'same_training_all_lambda_nets': False,

        'fixed_seed_lambda_training': True,
        'fixed_initialization_lambda_training': False,
        'number_different_lambda_trainings': 1,
    },
    'lambda_net': {
        'epochs_lambda': 1000,
        'early_stopping_lambda': True,  #if early stopping is used, multi_epoch_analysis is deactivated
        'batch_lambda': 64,
        'dropout': 0,
        #a string entry is resolved later to (number of 'sparsity' occurrences) * sparsity,
        #so 5*'sparsity' stands for a layer with 5*sparsity units
        'lambda_network_layers': [5*'sparsity'],
        'optimizer_lambda': 'adam',
        'loss_lambda': 'mae',
        'number_of_lambda_weights': None, #calculated later from the layer sizes
        'lambda_dataset_size': 1000,
    },
    'i_net': {
        'optimizer': 'custom',#adam
        'inet_loss': 'mae',
        'inet_metrics': ['r2'],
        'dropout': 0.25,
        'epochs': 500,
        'early_stopping': True,
        'batch_size': 512,
        'dense_layers': [512, 1024],
        'convolution_layers': None,
        'lstm_layers': None,
        'interpretation_dataset_size': 10000, #number of rows sampled from each loaded weight file
                
        'interpretation_net_output_monomials': 3, #(None, int)
        'interpretation_net_output_shape': None, #calculated automatically later
        
        'evaluate_with_real_function': False,
        'consider_labels_training': False,
                      
        'data_reshape_version': None, #options: (None, 0, 1, 2); None is replaced by 2 later when convolution/LSTM layers or a non-'SEQUENTIAL' NAS type are used
        'nas': True,
        'nas_type': 'CNN', #options:(None, 'CNN', 'LSTM', 'CNN-LSTM', 'CNN-LSTM-parallel')      
        'nas_trials': 100,
    },
    'evaluation': {   
        'inet_holdout_seed_evaluation': False, #True: train/valid/test split is done by lambda-net training seed
        
        #set if multi_epoch_analysis should be performed
        'multi_epoch_analysis': True,
        'each_epochs_save_lambda': 20,
        'epoch_start': 0, #use to skip first epochs in multi_epoch_analysis
        
        #set if samples analysis should be performed
        'samples_list': None,#[100, 500, 750, 1000, 2500, 5000, 7500, 10000, 15000, 20000, 25000, 28125] 
       
        'random_evaluation_dataset_size': 500,
    },
    'computation':{
        'n_jobs': 1,
        'use_gpu': True,
        'gpu_numbers': '0', #written to CUDA_VISIBLE_DEVICES when use_gpu is True
        'RANDOM_SEED': 42,   
    }
}

## Imports

In [2]:
#######################################################################################################################################
########################################### IMPORT GLOBAL VARIABLES FROM CONFIG #######################################################
#######################################################################################################################################
# Publish every entry of each config section as a notebook-level global variable.
# The sections are applied in this fixed order, so on a key clash the later section wins.
for config_section in ('data', 'lambda_net', 'i_net', 'evaluation', 'computation'):
    globals().update(config[config_section])

In [3]:
#######################################################################################################################################
##################################################### IMPORT LIBRARIES ################################################################
#######################################################################################################################################
from itertools import product       
from tqdm import tqdm_notebook as tqdm
import pickle
import numpy as np
import pandas as pd
import scipy as sp
import timeit
import psutil

from functools import reduce
from more_itertools import random_product 
from sklearn.preprocessing import Normalizer

import sys
import os
import shutil

import logging

from prettytable import PrettyTable
import colored
import math

import time
from datetime import datetime
from collections.abc import Iterable


from joblib import Parallel, delayed

from scipy.integrate import quad

from sklearn.model_selection import cross_val_score, train_test_split, StratifiedKFold, KFold
from sklearn.metrics import accuracy_score, log_loss, roc_auc_score, f1_score, mean_absolute_error, r2_score
from similaritymeasures import frechet_dist, area_between_two_curves, dtw
import keras
from keras.models import Sequential
from keras.layers.core import Dense, Dropout
from keras.utils import plot_model
from IPython.display import Image

import keras.backend as K
from livelossplot import PlotLossesKerasTF
from keras_tqdm import TQDMNotebookCallback
from keras.callbacks import EarlyStopping, ModelCheckpoint, ReduceLROnPlateau

from matplotlib import pyplot as plt
import seaborn as sns


import tensorflow as tf
import random 


import warnings


from IPython.display import display, Math, Latex



In [None]:
sys.path.append('..')

from utilities.InterpretationNet import *
from utilities.LambdaNet import *
from utilities.metrics import *
from utilities.utility_functions import *

In [4]:
#######################################################################################################################################
################################################### VARIABLE ADJUSTMENTS ##############################################################
#######################################################################################################################################
# Derive run-time settings from the raw config values that were exported as globals.

# One lowercase letter per polynomial variable ('a', 'b', ...).
variables = 'abcdefghijklmnopqrstuvwxyz'[:n]

# Cap the number of parallel jobs at the number of work items that exist.
# NOTE(review): this is evaluated BEFORE multi_epoch_analysis is switched off for early
# stopping below, so with early stopping the cap still uses the multi-epoch count.
# The order is kept as-is to preserve the existing behaviour - confirm whether intended.
if multi_epoch_analysis:
    n_jobs = min(epochs_lambda//each_epochs_save_lambda+1, n_jobs)
elif samples_list is not None:
    n_jobs = min(len(samples_list), n_jobs)
else:
    n_jobs = 1

# Deactivate multi_epoch_analysis if early stopping is used.
if early_stopping_lambda:
    multi_epoch_analysis = False

# Without multi-epoch analysis only the final epoch is of interest.
if not multi_epoch_analysis:
    each_epochs_save_lambda = epochs_lambda

# Range of save steps for which lambda-net weights are loaded later on.
if each_epochs_save_lambda == 1:
    epochs_save_range_lambda = range(epoch_start//each_epochs_save_lambda, epochs_lambda//each_epochs_save_lambda)
elif multi_epoch_analysis:
    epochs_save_range_lambda = range(epoch_start//each_epochs_save_lambda, epochs_lambda//each_epochs_save_lambda+1)
else:
    epochs_save_range_lambda = range(1, 2)

# Default to reshape version 2 whenever convolution/LSTM layers or a non-sequential NAS are used.
if data_reshape_version is None and (
    convolution_layers is not None
    or lstm_layers is not None
    or (nas and nas_type != 'SEQUENTIAL')
):
    data_reshape_version = 2
#######################################################################################################################################
###################################################### SET VARIABLES + DESIGN #########################################################
#######################################################################################################################################

#os.environ['TF_CPP_MIN_LOG_LEVEL'] = '2' 
# An empty string hides all CUDA devices, i.e. forces CPU execution.
os.environ['CUDA_VISIBLE_DEVICES'] = gpu_numbers if use_gpu else ''

logging.getLogger('tensorflow').disabled = True

sns.set_style("darkgrid")
#np.set_printoptions(suppress=True)

# Seed every random number generator in use.
random.seed(RANDOM_SEED)
np.random.seed(RANDOM_SEED)
# Parse the complete major version (not just its first character) to pick the seeding API.
if int(tf.__version__.split('.')[0]) >= 2:
    tf.random.set_seed(RANDOM_SEED)
else:
    tf.set_random_seed(RANDOM_SEED)


pd.set_option('display.float_format', lambda x: '%.3f' % x)
pd.set_option('display.max_columns', 500)

warnings.filterwarnings('ignore')

In [5]:
#######################################################################################################################################
####################################################### CONFIG ADJUSTMENTS ############################################################
#######################################################################################################################################
# Write the derived settings back into the config so that the utility modules, which are
# initialised from `config` below, see the same values as this notebook.
config['evaluation']['multi_epoch_analysis'] = multi_epoch_analysis

config['evaluation']['each_epochs_save_lambda'] = each_epochs_save_lambda

config['i_net']['data_reshape_version'] = data_reshape_version

config['data']['sparsity'] = nCr(config['data']['n']+config['data']['d'], config['data']['d'])
if config['data']['sample_sparsity'] is None:
    config['data']['sample_sparsity'] = config['data']['sparsity']

# Output size of the interpretation net: `sparsity` values when no monomial limit is set,
# otherwise two values per output monomial.
if config['i_net']['interpretation_net_output_monomials'] is None:
    config['i_net']['interpretation_net_output_shape'] = config['data']['sparsity']
else:
    config['i_net']['interpretation_net_output_shape'] = 2*config['i_net']['interpretation_net_output_monomials']


# Resolve symbolic layer sizes: a string entry stands for
# (number of 'sparsity' occurrences in the string) * sparsity units; numbers are kept as they are.
transformed_layers = [
    layer.count('sparsity')*config['data']['sparsity'] if isinstance(layer, str) else layer
    for layer in config['lambda_net']['lambda_network_layers']
]
config['lambda_net']['lambda_network_layers'] = transformed_layers

# Count the lambda-net parameters: each layer transition contributes (inputs + 1) * outputs.
layers_with_input_output = list(flatten([[config['data']['n']], config['lambda_net']['lambda_network_layers'], [1]]))
number_of_lambda_weights = sum(
    (layer_inputs+1)*layer_outputs
    for layer_inputs, layer_outputs in zip(layers_with_input_output[:-1], layers_with_input_output[1:])
)
config['lambda_net']['number_of_lambda_weights'] = number_of_lambda_weights

#######################################################################################################################################
################################################## UPDATE VARIABLES ###################################################################
#######################################################################################################################################
# Re-export all config sections so that the globals reflect the adjusted values.
for config_section in ('data', 'lambda_net', 'i_net', 'evaluation', 'computation'):
    globals().update(config[config_section])



# Hand the adjusted config to the project utility modules.
initialize_LambdaNet_config_from_curent_notebook(config)
initialize_metrics_config_from_curent_notebook(config)
initialize_utility_functions_config_from_curent_notebook(config)
initialize_InterpretationNet_config_from_curent_notebook(config)


#######################################################################################################################################
###################################################### PATH + FOLDER CREATION #########################################################
#######################################################################################################################################
# generate_paths() returns a mapping whose entries become globals
# (e.g. the path_identifier_* names used further down in the notebook).
globals().update(generate_paths(path_type='interpretation_net'))
create_folders_inet()

#######################################################################################################################################
############################################################ SLEEP TIMER ##############################################################
#######################################################################################################################################
sleep_minutes(sleep_time)

In [6]:
# Print the path identifiers generated for the interpretation-net and the lambda-net data, one per line.
print(path_identifier_interpretation_net_data, path_identifier_lambda_net_data, sep='\n')


inet_dense[512, 1024]convNonelstmNoneoutput_6_drop0.25e500b512_customlnets_10000_30-1000eES64b_adam_mae_train_1000_var_1_d_5_sparsity_6_amin_-1_amax_1_xmin_0_xmax_1_xdist_uniform_noise_normal_0_diffX_1-FixSeed_42
lnets_10000_30-1000eES64b_adam_mae_train_1000_var_1_d_5_sparsity_6_amin_-1_amax_1_xmin_0_xmax_1_xdist_uniform_noise_normal_0_diffX_1-FixSeed_42


In [7]:
# Report how many physical devices of each GPU type TensorFlow lists.
for device_label, device_type in (("Num GPUs Available: ", 'GPU'), ("Num XLA-GPUs Available: ", 'XLA_GPU')):
    print(device_label, len(tf.config.experimental.list_physical_devices(device_type)))

Num GPUs Available:  1
Num XLA-GPUs Available:  1


## Utility functions

### Generate List of Monomial Identifiers

In [8]:
# Candidate identifiers: one string per number in [0, (d+1)**n), produced by dec_to_base
# with base d+1 and left-padded with zeros to n characters.
# NOTE(review): presumably each character is the exponent of one variable - confirm against dec_to_base.
list_of_monomial_identifiers_extended = [
    dec_to_base(number, base = (d+1)).zfill(n)
    for number in tqdm(range((d+1)**n))
]

print('List length: ', len(list_of_monomial_identifiers_extended), sep='')
print('Number of monomials in a polynomial with ', n, ' variables and degree ', d, ': ', nCr(n+d, d), sep='')
print('Sparsity: ', sparsity, sep='')
print(list_of_monomial_identifiers_extended)

# Keep only the identifiers whose digits sum to at most d.
list_of_monomial_identifiers = [
    identifier
    for identifier in tqdm(list_of_monomial_identifiers_extended)
    if sum(int(digit) for digit in identifier) <= d
]

print('List length: ', len(list_of_monomial_identifiers), sep='')
print('Number of monomials in a polynomial with ', n, ' variables and degree ', d, ': ', nCr(n+d, d), sep='')
print('Sparsity: ', sparsity, sep='')
print(list_of_monomial_identifiers)


# Parameter count of a lambda-net: every layer transition contributes (inputs + 1) * outputs.
layers_with_input_output = list(flatten([[n], lambda_network_layers, [1]]))
number_of_lambda_weights = sum(
    (layer_inputs+1)*layer_outputs
    for layer_inputs, layer_outputs in zip(layers_with_input_output[:-1], layers_with_input_output[1:])
)

  0%|          | 0/6 [00:00<?, ?it/s]

List length: 6
Number of monomials in a polynomial with 1 variables and degree 5: 6
Sparsity: 6
['0', '1', '2', '3', '4', '5']


  0%|          | 0/6 [00:00<?, ?it/s]

List length: 6
Number of monomials in a polynomial with 1 variables and degree 5: 6
Sparsity: 6
['0', '1', '2', '3', '4', '5']


## Load Data and Generate Datasets

In [9]:
def load_lambda_nets(index):
    """Read the lambda-net weight file of one epoch and wrap its rows in a LambdaNetDataset.

    Args:
        index: Epoch number; it is zero-padded to three digits to build the file name.

    Returns:
        A ``LambdaNetDataset`` holding one ``LambdaNet`` per sampled row
        (``interpretation_dataset_size`` rows are drawn from the file).

    Raises:
        SystemExit: If more than 80% of the virtual memory is already in use.
    """
    # Abort early instead of letting the machine run out of memory while loading.
    ram_usage_percent = psutil.virtual_memory().percent
    if ram_usage_percent > 80:
        raise SystemExit("Out of RAM!")

    epoch_suffix = '_epoch_' + str(index).zfill(3) + '.txt'
    path = './data/weights/' + 'weights_' + path_identifier_lambda_net_data + '/weights_' + path_identifier_lambda_net_data + epoch_suffix

    raw_weights = pd.read_csv(path, sep=",", header=None)

    # Sorting by column 0 before sampling with a fixed seed makes the draw independent of
    # the row order in the file.
    # NOTE(review): the first sort + shuffle looks redundant because the frame is sorted
    # again right after it - kept unchanged to preserve the exact sampling result.
    shuffled_weights = raw_weights.sort_values(by=0).sample(frac=1, random_state=RANDOM_SEED)
    sampled_weights = shuffled_weights.sort_values(by=0).sample(n=interpretation_dataset_size, random_state=RANDOM_SEED)

    return LambdaNetDataset([LambdaNet(row.values) for _, row in sampled_weights.iterrows()])
    

In [10]:
#LOAD DATA

def _lambda_epoch_for_step(step):
    """Map a save step from epochs_save_range_lambda to the epoch number used in the file name."""
    if each_epochs_save_lambda == 1:
        return (step+1)*each_epochs_save_lambda
    if step > 1:
        return step*each_epochs_save_lambda
    if step == 1:
        return each_epochs_save_lambda
    return 1


# Load one dataset per save step; the list follows the order of epochs_save_range_lambda.
parallel = Parallel(n_jobs=n_jobs, verbose=3, backend='multiprocessing')
lambda_net_dataset_list = parallel(
    delayed(load_lambda_nets)(_lambda_epoch_for_step(step)) for step in epochs_save_range_lambda
)
del parallel

# The dataset of the last loaded save step is used for the inspection cells.
lambda_net_dataset = lambda_net_dataset_list[-1]


[Parallel(n_jobs=1)]: Using backend SequentialBackend with 1 concurrent workers.
[Parallel(n_jobs=1)]: Done   1 out of   1 | elapsed:    4.9s remaining:    0.0s
[Parallel(n_jobs=1)]: Done   1 out of   1 | elapsed:    4.9s finished


## Data Inspection

In [11]:
# Preview the first rows of the last entry of lambda_net_dataset_list in tabular form.
lambda_net_dataset.as_pandas().head()

Unnamed: 0,seed,0-target,1-target,2-target,3-target,4-target,5-target,0-lstsq_lambda,1-lstsq_lambda,2-lstsq_lambda,3-lstsq_lambda,4-lstsq_lambda,5-lstsq_lambda,0-lstsq_target,1-lstsq_target,2-lstsq_target,3-lstsq_target,4-lstsq_target,5-lstsq_target,wb_0,wb_1,wb_2,wb_3,wb_4,wb_5,wb_6,wb_7,wb_8,wb_9,wb_10,wb_11,wb_12,wb_13,wb_14,wb_15,wb_16,wb_17,wb_18,wb_19,wb_20,wb_21,wb_22,wb_23,wb_24,wb_25,wb_26,wb_27,wb_28,wb_29,wb_30,wb_31,wb_32,wb_33,wb_34,wb_35,wb_36,wb_37,wb_38,wb_39,wb_40,wb_41,wb_42,wb_43,wb_44,wb_45,wb_46,wb_47,wb_48,wb_49,wb_50,wb_51,wb_52,wb_53,wb_54,wb_55,wb_56,wb_57,wb_58,wb_59,wb_60,wb_61,wb_62,wb_63,wb_64,wb_65,wb_66,wb_67,wb_68,wb_69,wb_70,wb_71,wb_72,wb_73,wb_74,wb_75,wb_76,wb_77,wb_78,wb_79,wb_80,wb_81,wb_82,wb_83,wb_84,wb_85,wb_86,wb_87,wb_88,wb_89,wb_90
6252,1373158606,0.924,0.492,-0.142,-0.402,-0.741,0.255,0.932,0.453,-0.415,1.317,-3.572,1.7,0.932,0.453,-0.415,1.317,-3.572,1.7,-0.009,-0.227,0.442,0.385,0.197,0.132,0.469,-0.297,0.369,0.089,0.602,-0.088,-0.019,0.486,0.119,0.538,-0.013,0.231,0.292,0.257,-0.023,0.042,0.008,-0.042,-0.404,-0.09,0.363,-0.291,-0.209,-0.233,0.0,0.0,-0.224,-0.252,0.23,0.23,-0.334,0.0,-0.287,0.292,-0.172,0.0,0.0,-0.283,0.239,-0.222,0.228,0.25,0.223,0.239,0.283,-0.047,-0.023,0.0,0.0,0.0,-0.298,0.0,0.0,0.0,-0.254,-0.359,-0.62,-0.768,0.348,0.404,-0.558,-0.408,-0.881,0.124,-0.408,-0.352,-0.364,-0.506,0.345,-0.494,0.682,0.222,0.358,0.252,0.332,-0.31,-0.044,-0.261,-0.383,-0.059,-1.071,0.144,-0.258,-0.315,0.199
4684,1373158606,-0.794,0.241,-0.127,-0.188,-0.535,-0.939,-0.516,-0.878,0.013,-0.029,0.029,-0.011,-0.516,-0.878,0.013,-0.029,0.029,-0.011,-0.009,-0.227,0.356,0.25,0.176,0.08,0.313,-0.297,0.217,0.381,0.48,-0.088,-0.019,0.359,0.078,0.465,0.008,0.23,0.269,0.248,0.033,0.164,0.106,-0.042,-0.404,-0.09,0.176,-0.291,-0.209,-0.233,0.0,0.0,0.115,0.115,-0.0,-0.082,0.121,0.0,0.115,0.141,0.119,0.0,0.0,0.12,-0.08,0.116,-0.023,-0.01,-0.001,-0.001,-0.04,0.114,0.132,0.0,0.0,0.0,0.114,0.0,0.0,0.0,-0.254,-0.359,-0.385,-0.385,0.136,0.187,-0.227,-0.408,-0.411,-0.115,-0.248,-0.352,-0.364,-0.243,0.121,-0.325,0.394,0.02,0.193,0.072,0.049,-0.455,-0.188,-0.261,-0.383,-0.059,-0.481,0.144,-0.258,-0.315,-0.108
1731,1373158606,-0.739,0.951,0.737,0.786,0.773,0.083,-0.732,0.641,3.214,-6.635,10.057,-4.01,-0.732,0.641,3.214,-6.635,10.057,-4.01,-0.009,-0.227,-0.113,0.087,0.748,0.719,0.12,-0.297,0.069,0.915,0.313,-0.088,-0.019,0.379,0.731,0.032,0.582,0.849,0.849,0.854,0.724,0.04,0.007,-0.042,-0.404,-0.09,0.047,-0.291,-0.209,-0.233,0.0,0.0,0.424,-0.096,-0.319,-0.453,-0.12,0.0,-0.081,-0.49,0.08,0.0,0.0,0.0,-0.522,0.423,-0.495,-0.244,0.0,-0.07,-0.573,-0.055,-0.025,0.0,0.0,0.0,-0.06,0.0,0.0,0.0,-0.254,-0.359,-0.433,-0.219,0.883,1.113,-0.006,-0.408,-0.254,0.726,0.047,-0.352,-0.364,0.221,1.094,-0.267,1.565,0.684,0.773,0.655,1.154,-0.307,-0.043,-0.261,-0.383,-0.059,-0.332,0.144,-0.258,-0.315,-0.44
4742,1373158606,0.173,-0.607,-0.085,0.746,-0.828,-0.939,0.167,-0.416,-1.639,5.49,-6.843,1.735,0.167,-0.416,-1.639,5.49,-6.843,1.735,-0.009,-0.227,0.418,0.533,0.125,0.058,0.582,-0.297,0.52,0.657,0.558,-0.088,-0.019,0.437,0.06,0.538,0.007,0.194,0.21,0.202,0.03,0.486,0.561,-0.042,-0.404,-0.09,0.494,-0.291,-0.209,-0.233,0.0,0.0,-0.001,-0.36,0.095,0.099,-0.343,0.0,-0.385,-0.303,-0.001,0.0,0.0,-0.001,0.094,-0.001,-0.026,0.023,0.098,0.078,-0.047,-0.429,-0.478,0.0,0.0,0.0,-0.395,0.0,0.0,0.0,-0.254,-0.359,-0.421,-1.069,0.133,0.18,-0.792,-0.408,-1.191,-0.539,-0.299,-0.352,-0.364,-0.292,0.113,-0.376,0.392,0.002,0.161,0.042,0.043,-1.392,-1.335,-0.261,-0.383,-0.059,-1.363,0.144,-0.258,-0.315,0.111
4521,1373158606,0.131,0.208,0.871,0.323,0.573,0.164,0.118,0.296,1.074,-1.688,4.175,-1.75,0.118,0.296,1.074,-1.688,4.175,-1.75,-0.009,-0.227,0.127,0.082,0.629,0.546,0.108,-0.297,0.067,1.027,0.457,-0.088,-0.019,0.125,0.587,0.271,0.286,0.74,0.589,0.714,0.661,0.041,0.008,-0.042,-0.404,-0.09,0.047,-0.291,-0.209,-0.233,0.0,0.0,-0.128,-0.084,-0.151,-0.2,-0.108,0.0,-0.069,-0.792,-0.249,0.0,0.0,-0.125,-0.4,-0.148,0.052,-0.449,0.041,-0.339,-0.558,-0.047,-0.022,0.0,0.0,0.0,-0.052,0.0,0.0,0.0,-0.254,-0.359,-0.193,-0.225,0.651,0.722,-0.036,-0.408,-0.258,0.888,0.336,-0.352,-0.364,-0.01,0.847,0.173,0.714,0.721,0.505,0.67,1.044,-0.31,-0.044,-0.261,-0.383,-0.059,-0.335,0.144,-0.258,-0.315,0.053


In [12]:
# Summary statistics (count, mean, std, min, quartiles, max) for every column of the same dataset.
lambda_net_dataset.as_pandas().describe()

Unnamed: 0,seed,0-target,1-target,2-target,3-target,4-target,5-target,0-lstsq_lambda,1-lstsq_lambda,2-lstsq_lambda,3-lstsq_lambda,4-lstsq_lambda,5-lstsq_lambda,0-lstsq_target,1-lstsq_target,2-lstsq_target,3-lstsq_target,4-lstsq_target,5-lstsq_target,wb_0,wb_1,wb_2,wb_3,wb_4,wb_5,wb_6,wb_7,wb_8,wb_9,wb_10,wb_11,wb_12,wb_13,wb_14,wb_15,wb_16,wb_17,wb_18,wb_19,wb_20,wb_21,wb_22,wb_23,wb_24,wb_25,wb_26,wb_27,wb_28,wb_29,wb_30,wb_31,wb_32,wb_33,wb_34,wb_35,wb_36,wb_37,wb_38,wb_39,wb_40,wb_41,wb_42,wb_43,wb_44,wb_45,wb_46,wb_47,wb_48,wb_49,wb_50,wb_51,wb_52,wb_53,wb_54,wb_55,wb_56,wb_57,wb_58,wb_59,wb_60,wb_61,wb_62,wb_63,wb_64,wb_65,wb_66,wb_67,wb_68,wb_69,wb_70,wb_71,wb_72,wb_73,wb_74,wb_75,wb_76,wb_77,wb_78,wb_79,wb_80,wb_81,wb_82,wb_83,wb_84,wb_85,wb_86,wb_87,wb_88,wb_89,wb_90
count,10000.0,10000.0,10000.0,10000.0,10000.0,10000.0,10000.0,10000.0,10000.0,10000.0,10000.0,10000.0,10000.0,10000.0,10000.0,10000.0,10000.0,10000.0,10000.0,10000.0,10000.0,10000.0,10000.0,10000.0,10000.0,10000.0,10000.0,10000.0,10000.0,10000.0,10000.0,10000.0,10000.0,10000.0,10000.0,10000.0,10000.0,10000.0,10000.0,10000.0,10000.0,10000.0,10000.0,10000.0,10000.0,10000.0,10000.0,10000.0,10000.0,10000.0,10000.0,10000.0,10000.0,10000.0,10000.0,10000.0,10000.0,10000.0,10000.0,10000.0,10000.0,10000.0,10000.0,10000.0,10000.0,10000.0,10000.0,10000.0,10000.0,10000.0,10000.0,10000.0,10000.0,10000.0,10000.0,10000.0,10000.0,10000.0,10000.0,10000.0,10000.0,10000.0,10000.0,10000.0,10000.0,10000.0,10000.0,10000.0,10000.0,10000.0,10000.0,10000.0,10000.0,10000.0,10000.0,10000.0,10000.0,10000.0,10000.0,10000.0,10000.0,10000.0,10000.0,10000.0,10000.0,10000.0,10000.0,10000.0,10000.0,10000.0
mean,1373158606.0,0.001,-0.005,-0.0,0.004,-0.003,-0.003,0.005,-0.03,0.125,-0.478,0.727,-0.348,0.005,-0.03,0.125,-0.478,0.727,-0.348,-0.009,-0.227,0.293,0.203,0.291,0.233,0.286,-0.297,0.173,0.469,0.479,-0.088,-0.019,0.329,0.236,0.408,0.086,0.418,0.373,0.399,0.164,0.121,0.067,-0.042,-0.404,-0.09,0.133,-0.291,-0.209,-0.233,0.0,0.0,-0.013,-0.029,-0.008,-0.018,-0.051,0.0,-0.031,-0.085,-0.03,0.0,0.0,-0.041,-0.029,0.003,0.006,-0.062,0.025,-0.018,-0.027,-0.025,-0.004,0.0,0.0,0.0,-0.025,0.0,0.0,0.0,-0.254,-0.359,-0.381,-0.437,0.366,0.431,-0.236,-0.408,-0.48,0.035,-0.124,-0.352,-0.364,-0.215,0.379,-0.271,0.633,0.15,0.358,0.197,0.339,-0.531,-0.26,-0.261,-0.383,-0.059,-0.556,0.144,-0.258,-0.315,0.003
std,0.0,0.574,0.577,0.577,0.577,0.575,0.58,0.543,0.628,2.002,6.499,9.062,3.879,0.543,0.628,2.002,6.499,9.062,3.879,0.0,0.0,0.137,0.148,0.158,0.162,0.174,0.0,0.15,0.286,0.204,0.0,0.0,0.169,0.172,0.141,0.158,0.242,0.153,0.192,0.218,0.15,0.194,0.0,0.0,0.0,0.149,0.0,0.0,0.0,0.0,0.0,0.147,0.162,0.173,0.185,0.195,0.0,0.167,0.311,0.211,0.0,0.0,0.186,0.205,0.139,0.169,0.257,0.129,0.202,0.232,0.166,0.192,0.0,0.0,0.0,0.163,0.0,0.0,0.0,0.0,0.0,0.18,0.249,0.224,0.262,0.318,0.0,0.276,0.433,0.398,0.0,0.0,0.313,0.282,0.211,0.323,0.456,0.166,0.385,0.36,0.307,0.342,0.0,0.0,0.0,0.298,0.0,0.0,0.0,0.139
min,1373158606.0,-1.0,-1.0,-1.0,-1.0,-1.0,-1.0,-1.035,-2.379,-17.459,-55.031,-87.127,-32.496,-1.035,-2.379,-17.459,-55.031,-87.127,-32.496,-0.009,-0.227,-0.163,-0.28,-0.204,-0.236,-0.174,-0.297,-0.321,-0.101,0.118,-0.088,-0.019,-0.111,-0.248,0.004,-0.296,-0.15,-0.084,-0.121,-0.339,-0.338,-0.4,-0.042,-0.404,-0.09,-0.325,-0.291,-0.209,-0.233,0.0,0.0,-0.513,-0.573,-0.632,-0.63,-1.03,0.0,-0.518,-1.209,-1.225,0.0,0.0,-1.04,-0.641,-1.053,-0.654,-1.207,-0.635,-1.101,-0.908,-0.555,-0.822,0.0,0.0,0.0,-0.529,0.0,0.0,0.0,-0.254,-0.359,-1.379,-1.924,-0.696,0.087,-1.23,-0.408,-1.917,-2.144,-1.359,-0.352,-0.364,-1.13,0.012,-1.456,0.324,-2.709,-1.016,-2.501,-0.408,-2.168,-2.306,-0.261,-0.383,-0.059,-2.119,0.144,-0.258,-0.315,-0.577
25%,1373158606.0,-0.491,-0.505,-0.506,-0.494,-0.497,-0.505,-0.445,-0.509,-0.889,-2.379,-3.065,-1.104,-0.445,-0.509,-0.889,-2.379,-3.065,-1.104,-0.009,-0.227,0.191,0.083,0.181,0.103,0.161,-0.297,0.067,0.284,0.358,-0.088,-0.019,0.219,0.099,0.321,0.008,0.261,0.274,0.27,0.033,0.041,0.008,-0.042,-0.404,-0.09,0.047,-0.291,-0.209,-0.233,0.0,0.0,-0.13,-0.092,-0.108,-0.082,-0.161,0.0,-0.077,-0.33,-0.07,0.0,0.0,-0.144,-0.087,-0.062,-0.023,-0.223,-0.023,-0.105,-0.042,-0.049,-0.023,0.0,0.0,0.0,-0.055,0.0,0.0,0.0,-0.254,-0.359,-0.42,-0.445,0.231,0.271,-0.28,-0.408,-0.486,-0.114,-0.263,-0.352,-0.364,-0.283,0.206,-0.344,0.394,0.101,0.26,0.142,0.055,-0.54,-0.296,-0.261,-0.383,-0.059,-0.563,0.144,-0.258,-0.315,-0.124
50%,1373158606.0,0.005,-0.005,0.002,0.003,-0.005,0.001,0.003,-0.022,0.011,-0.019,0.032,-0.017,0.003,-0.022,0.011,-0.019,0.032,-0.017,-0.009,-0.227,0.295,0.19,0.273,0.212,0.262,-0.297,0.149,0.381,0.437,-0.088,-0.019,0.309,0.21,0.403,0.013,0.356,0.358,0.359,0.089,0.06,0.008,-0.042,-0.404,-0.09,0.085,-0.291,-0.209,-0.233,0.0,0.0,-0.002,-0.003,-0.001,-0.001,-0.003,0.0,-0.003,0.023,-0.001,0.0,0.0,-0.003,-0.001,-0.001,-0.002,-0.002,-0.0,-0.001,-0.002,-0.046,-0.022,0.0,0.0,0.0,-0.051,0.0,0.0,0.0,-0.254,-0.359,-0.341,-0.362,0.314,0.359,-0.194,-0.408,-0.391,-0.025,-0.191,-0.352,-0.364,-0.2,0.296,-0.271,0.552,0.188,0.335,0.223,0.23,-0.433,-0.131,-0.261,-0.383,-0.059,-0.46,0.144,-0.258,-0.315,0.003
75%,1373158606.0,0.5,0.49,0.496,0.507,0.495,0.502,0.461,0.426,0.915,2.314,3.12,1.033,0.461,0.426,0.915,2.314,3.12,1.033,-0.009,-0.227,0.372,0.283,0.381,0.323,0.368,-0.297,0.253,0.588,0.533,-0.088,-0.019,0.403,0.329,0.478,0.151,0.505,0.459,0.484,0.266,0.184,0.088,-0.042,-0.404,-0.09,0.201,-0.291,-0.209,-0.233,0.0,0.0,0.116,0.112,0.136,0.137,0.11,0.0,0.112,0.154,0.111,0.0,0.0,0.112,0.138,0.117,0.139,0.134,0.136,0.135,0.155,0.111,0.129,0.0,0.0,0.0,0.111,0.0,0.0,0.0,-0.254,-0.359,-0.264,-0.265,0.394,0.439,-0.103,-0.408,-0.267,0.115,-0.105,-0.352,-0.364,-0.115,0.381,-0.192,0.664,0.27,0.413,0.303,0.352,-0.31,-0.044,-0.261,-0.383,-0.059,-0.335,0.144,-0.258,-0.315,0.136
max,1373158606.0,1.0,1.0,1.0,1.0,0.999,1.0,1.01,2.284,16.02,62.515,74.277,38.554,1.01,2.284,16.02,62.515,74.277,38.554,-0.009,-0.227,0.761,0.759,0.855,0.818,1.596,-0.297,0.665,1.889,2.038,-0.088,-0.019,1.741,0.855,1.363,0.951,1.863,1.014,1.416,1.142,0.776,1.109,-0.042,-0.404,-0.09,0.771,-0.291,-0.209,-0.233,0.0,0.0,0.424,0.366,0.367,0.262,0.322,0.0,0.32,0.314,0.297,0.0,0.0,0.325,0.265,0.506,0.295,0.265,0.458,0.327,0.339,0.337,0.401,0.0,0.0,0.0,0.324,0.0,0.0,0.0,-0.254,-0.359,-0.057,-0.149,1.752,1.522,2.888,-0.408,-0.197,2.185,2.635,-0.352,-0.364,2.555,1.957,2.762,2.664,1.424,1.648,1.408,2.834,-0.263,0.001,-0.261,-0.383,-0.059,-0.285,0.144,-0.258,-0.315,0.453


## Generate Datasets for Interpretation-Net training

In [13]:
# Build the train / validation / test splits used for Interpretation-Net training:
# one entry per dataset in lambda_net_dataset_list is appended to each of the lists.
lambda_net_train_dataset_list = []
lambda_net_valid_dataset_list = []
lambda_net_test_dataset_list = []

for lambda_net_dataset in lambda_net_dataset_list:

    if not inet_holdout_seed_evaluation:
        # Plain split: separate the test part first (test_split=0.1), then split
        # the remainder again (test_split=0.1) into train and validation parts.
        lambda_net_train_with_valid_dataset, lambda_net_test_dataset = split_LambdaNetDataset(
            lambda_net_dataset,
            test_split=0.1,
        )
        lambda_net_train_dataset, lambda_net_valid_dataset = split_LambdaNetDataset(
            lambda_net_train_with_valid_dataset,
            test_split=0.1,
        )

        # The intermediate train+valid dataset is not needed any further.
        del lambda_net_train_with_valid_dataset
    else:
        # Seed hold-out: every distinct seed ends up in exactly one split.
        complete_seed_list = list(set(lambda_net_dataset.train_settings_list['seed']))

        # Test seeds are sampled first; the RNG is re-seeded before each draw.
        random.seed(RANDOM_SEED)
        test_seeds = random.sample(
            complete_seed_list,
            int(len(complete_seed_list) - len(complete_seed_list) / (1 / 0.9)),
        )
        lambda_net_test_dataset = lambda_net_dataset.get_lambda_nets_by_seed(test_seeds)
        complete_seed_list = list(set(complete_seed_list) - set(test_seeds))

        # Validation seeds are sampled from the seeds that are left.
        random.seed(RANDOM_SEED)
        valid_seeds = random.sample(
            complete_seed_list,
            int(len(complete_seed_list) - len(complete_seed_list) / (1 / 0.9)),
        )
        lambda_net_valid_dataset = lambda_net_dataset.get_lambda_nets_by_seed(valid_seeds)
        complete_seed_list = list(set(complete_seed_list) - set(valid_seeds))

        # Whatever was not sampled above is used for training.
        train_seeds = complete_seed_list
        lambda_net_train_dataset = lambda_net_dataset.get_lambda_nets_by_seed(train_seeds)

    lambda_net_train_dataset_list.append(lambda_net_train_dataset)
    lambda_net_valid_dataset_list.append(lambda_net_valid_dataset)
    lambda_net_test_dataset_list.append(lambda_net_test_dataset)

    # Drop the reference to the unsplit dataset before the next iteration.
    del lambda_net_dataset


# The list of unsplit datasets is not used after this cell.
del lambda_net_dataset_list

In [14]:
# Display the shape of the last training split as returned by as_pandas().
lambda_net_train_dataset_list[-1].as_pandas().shape

(8100, 110)

In [15]:
# Display the shape of the last validation split as returned by as_pandas().
lambda_net_valid_dataset_list[-1].as_pandas().shape

(900, 110)

In [16]:
# Display the shape of the last test split as returned by as_pandas().
lambda_net_test_dataset_list[-1].as_pandas().shape

(1000, 110)

In [17]:
# Preview the first rows of the last training split (seed, target / lstsq
# coefficients and wb_* columns, see the output below).
lambda_net_train_dataset_list[-1].as_pandas().head()

Unnamed: 0,seed,0-target,1-target,2-target,3-target,4-target,5-target,0-lstsq_lambda,1-lstsq_lambda,2-lstsq_lambda,3-lstsq_lambda,4-lstsq_lambda,5-lstsq_lambda,0-lstsq_target,1-lstsq_target,2-lstsq_target,3-lstsq_target,4-lstsq_target,5-lstsq_target,wb_0,wb_1,wb_2,wb_3,wb_4,wb_5,wb_6,wb_7,wb_8,wb_9,wb_10,wb_11,wb_12,wb_13,wb_14,wb_15,wb_16,wb_17,wb_18,wb_19,wb_20,wb_21,wb_22,wb_23,wb_24,wb_25,wb_26,wb_27,wb_28,wb_29,wb_30,wb_31,wb_32,wb_33,wb_34,wb_35,wb_36,wb_37,wb_38,wb_39,wb_40,wb_41,wb_42,wb_43,wb_44,wb_45,wb_46,wb_47,wb_48,wb_49,wb_50,wb_51,wb_52,wb_53,wb_54,wb_55,wb_56,wb_57,wb_58,wb_59,wb_60,wb_61,wb_62,wb_63,wb_64,wb_65,wb_66,wb_67,wb_68,wb_69,wb_70,wb_71,wb_72,wb_73,wb_74,wb_75,wb_76,wb_77,wb_78,wb_79,wb_80,wb_81,wb_82,wb_83,wb_84,wb_85,wb_86,wb_87,wb_88,wb_89,wb_90
3003,1373158606,-0.34,-0.876,-0.048,-0.46,0.43,0.914,-0.33,-1.242,2.828,-9.076,11.258,-3.884,-0.33,-1.242,2.828,-9.076,11.258,-3.884,-0.009,-0.227,0.355,0.249,0.431,0.417,0.313,-0.297,0.217,0.382,0.48,-0.088,-0.019,0.359,0.457,0.464,0.008,0.526,0.466,0.485,0.588,0.164,0.108,-0.042,-0.404,-0.09,0.176,-0.291,-0.209,-0.233,0.0,0.0,0.079,0.079,-0.283,-0.314,0.082,0.0,0.079,0.092,0.081,0.0,0.0,0.081,-0.367,0.08,-0.023,-0.374,-0.229,-0.288,-0.494,0.079,0.087,0.0,0.0,0.0,0.079,0.0,0.0,0.0,-0.254,-0.359,-0.371,-0.366,0.756,0.96,-0.211,-0.408,-0.39,-0.099,-0.236,-0.352,-0.364,-0.229,0.951,-0.313,0.394,0.632,0.617,0.587,1.399,-0.431,-0.156,-0.261,-0.383,-0.059,-0.458,0.144,-0.258,-0.315,-0.077
5985,1373158606,-0.496,-0.607,0.252,0.645,-0.276,-0.135,-0.513,-0.351,-0.981,3.278,-2.844,0.798,-0.513,-0.351,-0.981,3.278,-2.844,0.798,-0.009,-0.227,0.249,0.14,0.286,0.23,0.2,-0.297,0.107,0.25,0.373,-0.088,-0.019,0.249,0.228,0.359,0.008,0.352,0.382,0.364,0.22,0.053,-0.056,-0.042,-0.404,-0.09,0.066,-0.291,-0.209,-0.233,0.0,0.0,0.128,0.129,-0.129,-0.123,0.134,0.0,0.13,0.154,0.13,0.0,0.0,0.132,-0.134,0.128,-0.023,-0.141,-0.104,-0.123,-0.147,0.131,0.168,0.0,0.0,0.0,0.13,0.0,0.0,0.0,-0.254,-0.359,-0.314,-0.33,0.325,0.378,-0.163,-0.408,-0.365,-0.049,-0.168,-0.352,-0.364,-0.173,0.316,-0.245,0.393,0.199,0.348,0.234,0.328,-0.43,-0.23,-0.261,-0.383,-0.059,-0.45,0.144,-0.258,-0.315,-0.123
6925,1373158606,-0.316,0.287,0.323,-0.293,-0.713,0.105,-0.194,-0.21,0.593,-1.318,1.309,-0.478,-0.194,-0.21,0.593,-1.318,1.309,-0.478,-0.009,-0.227,0.268,0.162,0.256,0.194,0.223,-0.297,0.129,0.287,0.391,-0.088,-0.019,0.27,0.191,0.377,0.013,0.305,0.342,0.321,0.1,0.077,0.011,-0.042,-0.404,-0.09,0.089,-0.291,-0.209,-0.233,0.0,0.0,0.055,0.055,-0.009,-0.006,0.055,0.0,0.055,0.05,0.055,0.0,0.0,0.055,-0.006,0.055,-0.018,-0.011,-0.013,-0.012,-0.003,0.056,0.062,0.0,0.0,0.0,0.056,0.0,0.0,0.0,-0.254,-0.359,-0.287,-0.285,0.239,0.268,-0.128,-0.408,-0.31,-0.015,-0.152,-0.352,-0.364,-0.145,0.202,-0.229,0.395,0.121,0.279,0.161,0.105,-0.355,-0.104,-0.261,-0.383,-0.059,-0.381,0.144,-0.258,-0.315,-0.055
9619,1373158606,0.123,-0.67,0.322,-0.94,0.676,0.843,-0.003,-0.192,0.005,-0.011,0.011,-0.004,-0.003,-0.192,0.005,-0.011,0.011,-0.004,-0.009,-0.227,0.284,0.178,0.237,0.174,0.239,-0.297,0.145,0.301,0.407,-0.088,-0.019,0.286,0.171,0.392,0.033,0.285,0.323,0.301,0.077,0.093,0.032,-0.042,-0.404,-0.09,0.105,-0.291,-0.209,-0.233,0.0,0.0,0.001,0.001,-0.0,-0.0,0.001,0.0,0.001,0.0,0.0,0.0,0.0,0.001,-0.0,0.0,-0.0,-0.0,-0.0,-0.0,-0.0,0.001,0.003,0.0,0.0,0.0,0.001,0.0,0.0,0.0,-0.254,-0.359,-0.294,-0.286,0.219,0.248,-0.132,-0.408,-0.308,-0.022,-0.161,-0.352,-0.364,-0.152,0.182,-0.238,0.412,0.102,0.26,0.142,0.081,-0.345,-0.062,-0.261,-0.383,-0.059,-0.373,0.144,-0.258,-0.315,-0.0
6916,1373158606,-0.533,-0.333,0.694,-0.708,0.255,-0.974,-0.443,-0.531,0.059,-0.133,0.134,-0.049,-0.443,-0.531,0.059,-0.133,0.134,-0.049,-0.009,-0.227,0.315,0.209,0.218,0.151,0.27,-0.297,0.176,0.329,0.438,-0.088,-0.019,0.317,0.145,0.424,0.008,0.261,0.301,0.279,0.033,0.124,0.055,-0.042,-0.404,-0.09,0.136,-0.291,-0.209,-0.233,0.0,0.0,0.106,0.107,-0.003,-0.002,0.111,0.0,0.107,0.129,0.109,0.0,0.0,0.11,-0.002,0.107,-0.023,-0.004,-0.005,-0.004,-0.039,0.107,0.125,0.0,0.0,0.0,0.106,0.0,0.0,0.0,-0.254,-0.359,-0.351,-0.353,0.195,0.213,-0.194,-0.408,-0.38,-0.082,-0.213,-0.352,-0.364,-0.21,0.144,-0.29,0.393,0.075,0.234,0.115,0.049,-0.427,-0.17,-0.261,-0.383,-0.059,-0.452,0.144,-0.258,-0.315,-0.101


In [18]:
# Preview the first rows of the last validation split.
lambda_net_valid_dataset_list[-1].as_pandas().head()

Unnamed: 0,seed,0-target,1-target,2-target,3-target,4-target,5-target,0-lstsq_lambda,1-lstsq_lambda,2-lstsq_lambda,3-lstsq_lambda,4-lstsq_lambda,5-lstsq_lambda,0-lstsq_target,1-lstsq_target,2-lstsq_target,3-lstsq_target,4-lstsq_target,5-lstsq_target,wb_0,wb_1,wb_2,wb_3,wb_4,wb_5,wb_6,wb_7,wb_8,wb_9,wb_10,wb_11,wb_12,wb_13,wb_14,wb_15,wb_16,wb_17,wb_18,wb_19,wb_20,wb_21,wb_22,wb_23,wb_24,wb_25,wb_26,wb_27,wb_28,wb_29,wb_30,wb_31,wb_32,wb_33,wb_34,wb_35,wb_36,wb_37,wb_38,wb_39,wb_40,wb_41,wb_42,wb_43,wb_44,wb_45,wb_46,wb_47,wb_48,wb_49,wb_50,wb_51,wb_52,wb_53,wb_54,wb_55,wb_56,wb_57,wb_58,wb_59,wb_60,wb_61,wb_62,wb_63,wb_64,wb_65,wb_66,wb_67,wb_68,wb_69,wb_70,wb_71,wb_72,wb_73,wb_74,wb_75,wb_76,wb_77,wb_78,wb_79,wb_80,wb_81,wb_82,wb_83,wb_84,wb_85,wb_86,wb_87,wb_88,wb_89,wb_90
8323,1373158606,0.31,0.452,0.977,-0.064,-0.261,0.704,0.292,0.485,2.454,-7.149,10.453,-4.491,0.292,0.485,2.454,-7.149,10.453,-4.491,-0.009,-0.227,0.131,0.082,0.367,0.303,0.11,-0.297,0.067,1.287,0.898,-0.088,-0.019,0.129,0.305,0.168,0.155,0.433,0.45,0.441,0.231,0.041,0.008,-0.042,-0.404,-0.09,0.047,-0.291,-0.209,-0.233,0.0,0.0,-0.131,-0.084,0.076,0.077,-0.11,0.0,-0.069,-0.898,-0.34,0.0,0.0,-0.129,0.075,-0.168,0.08,0.071,0.077,0.073,0.071,-0.047,-0.022,0.0,0.0,0.0,-0.052,0.0,0.0,0.0,-0.254,-0.359,-0.2,-0.225,0.338,0.368,-0.042,-0.408,-0.258,1.198,0.797,-0.352,-0.364,-0.037,0.301,-0.06,0.539,0.219,0.377,0.258,0.203,-0.31,-0.044,-0.261,-0.383,-0.059,-0.335,0.144,-0.258,-0.315,0.083
5392,1373158606,0.502,-0.666,-0.803,0.182,0.483,-0.702,0.498,-0.523,-1.903,3.412,-3.519,1.056,0.498,-0.523,-1.903,3.412,-3.519,1.056,-0.009,-0.227,0.471,0.354,0.07,-0.001,0.443,-0.297,0.343,0.516,0.615,-0.088,-0.019,0.493,-0.006,0.594,-0.155,0.152,0.161,0.152,-0.137,0.325,0.336,-0.042,-0.404,-0.09,0.326,-0.291,-0.209,-0.233,0.0,0.0,-0.051,-0.19,0.162,0.169,-0.115,0.0,-0.226,-0.203,-0.004,0.0,0.0,-0.002,0.17,-0.004,0.182,0.126,0.158,0.145,0.203,-0.244,-0.286,0.0,0.0,0.0,-0.268,0.0,0.0,0.0,-0.254,-0.359,-0.484,-0.605,0.196,0.28,-0.37,-0.408,-0.718,-0.293,-0.352,-0.352,-0.364,-0.346,0.216,-0.429,0.647,0.032,0.194,0.076,0.251,-0.843,-0.701,-0.261,-0.383,-0.059,-0.865,0.144,-0.258,-0.315,0.169
4718,1373158606,0.39,0.568,-0.964,0.19,0.177,-0.243,0.405,0.344,0.037,-1.662,1.652,-0.653,0.405,0.344,0.037,-1.662,1.652,-0.653,-0.009,-0.227,0.354,0.259,0.21,0.147,0.324,-0.297,0.237,0.288,0.499,-0.088,-0.019,0.357,0.14,0.463,0.001,0.254,0.3,0.274,0.019,0.21,0.008,-0.042,-0.404,-0.09,0.212,-0.291,-0.209,-0.233,0.0,0.0,-0.14,-0.167,0.13,0.131,-0.184,0.0,-0.172,0.04,-0.103,0.0,0.0,-0.175,0.134,-0.132,0.132,0.137,0.128,0.133,0.154,-0.179,-0.023,0.0,0.0,0.0,-0.171,0.0,0.0,0.0,-0.254,-0.359,-0.447,-0.526,0.258,0.303,-0.335,-0.408,-0.592,-0.028,-0.28,-0.352,-0.364,-0.323,0.239,-0.36,0.56,0.135,0.284,0.171,0.199,-0.743,-0.044,-0.261,-0.383,-0.059,-0.733,0.144,-0.258,-0.315,0.122
990,1373158606,-0.178,-0.531,-0.961,0.759,0.931,-0.317,-0.161,-0.907,1.37,-5.254,7.776,-3.152,-0.161,-0.907,1.37,-5.254,7.776,-3.152,-0.009,-0.227,0.337,0.231,0.396,0.36,0.293,-0.297,0.198,0.357,0.461,-0.088,-0.019,0.34,0.377,0.445,0.009,0.467,0.457,0.457,0.445,0.146,0.085,-0.042,-0.404,-0.09,0.158,-0.291,-0.209,-0.233,0.0,0.0,0.042,0.042,-0.247,-0.265,0.042,0.0,0.042,0.042,0.042,0.0,0.0,0.042,-0.298,0.042,-0.023,-0.319,-0.209,-0.253,-0.373,0.042,0.042,0.0,0.0,0.0,0.042,0.0,0.0,0.0,-0.254,-0.359,-0.345,-0.337,0.62,0.752,-0.184,-0.408,-0.359,-0.073,-0.213,-0.352,-0.364,-0.203,0.716,-0.289,0.394,0.495,0.558,0.483,0.99,-0.396,-0.113,-0.261,-0.383,-0.059,-0.424,0.144,-0.258,-0.315,-0.042
6498,1373158606,0.861,-0.387,-0.55,0.46,0.491,-0.056,0.803,-0.263,-0.084,0.189,-0.19,0.07,0.803,-0.263,-0.084,0.189,-0.19,0.07,-0.009,-0.227,0.338,0.248,0.216,0.152,0.318,-0.297,0.223,0.195,0.464,-0.088,-0.019,0.354,0.145,0.443,0.007,0.26,0.306,0.28,0.025,0.041,0.008,-0.042,-0.404,-0.09,0.047,-0.291,-0.209,-0.233,0.0,0.0,-0.003,-0.001,0.21,0.211,-0.002,0.0,-0.001,0.211,-0.006,0.0,0.0,-0.003,0.218,-0.006,0.214,0.223,0.204,0.214,0.262,-0.047,-0.023,0.0,0.0,0.0,-0.052,0.0,0.0,0.0,-0.254,-0.359,-0.365,-0.395,0.324,0.377,-0.217,-0.408,-0.434,0.062,-0.215,-0.352,-0.364,-0.223,0.315,-0.293,0.654,0.198,0.34,0.231,0.295,-0.31,-0.045,-0.261,-0.383,-0.059,-0.335,0.144,-0.258,-0.315,0.189


In [19]:
# Preview the first rows of the last test split.
lambda_net_test_dataset_list[-1].as_pandas().head()

Unnamed: 0,seed,0-target,1-target,2-target,3-target,4-target,5-target,0-lstsq_lambda,1-lstsq_lambda,2-lstsq_lambda,3-lstsq_lambda,4-lstsq_lambda,5-lstsq_lambda,0-lstsq_target,1-lstsq_target,2-lstsq_target,3-lstsq_target,4-lstsq_target,5-lstsq_target,wb_0,wb_1,wb_2,wb_3,wb_4,wb_5,wb_6,wb_7,wb_8,wb_9,wb_10,wb_11,wb_12,wb_13,wb_14,wb_15,wb_16,wb_17,wb_18,wb_19,wb_20,wb_21,wb_22,wb_23,wb_24,wb_25,wb_26,wb_27,wb_28,wb_29,wb_30,wb_31,wb_32,wb_33,wb_34,wb_35,wb_36,wb_37,wb_38,wb_39,wb_40,wb_41,wb_42,wb_43,wb_44,wb_45,wb_46,wb_47,wb_48,wb_49,wb_50,wb_51,wb_52,wb_53,wb_54,wb_55,wb_56,wb_57,wb_58,wb_59,wb_60,wb_61,wb_62,wb_63,wb_64,wb_65,wb_66,wb_67,wb_68,wb_69,wb_70,wb_71,wb_72,wb_73,wb_74,wb_75,wb_76,wb_77,wb_78,wb_79,wb_80,wb_81,wb_82,wb_83,wb_84,wb_85,wb_86,wb_87,wb_88,wb_89,wb_90
7217,1373158606,0.715,0.432,0.981,-0.843,-0.74,-0.831,0.7,0.81,-1.561,6.082,-8.884,2.604,0.7,0.81,-1.561,6.082,-8.884,2.604,-0.009,-0.227,0.556,0.526,0.278,0.215,0.636,-0.297,0.52,0.241,0.682,-0.088,-0.019,0.632,0.208,0.648,0.074,0.321,0.366,0.341,0.102,0.52,0.009,-0.042,-0.404,-0.09,0.511,-0.291,-0.209,-0.233,0.0,0.0,-0.338,-0.381,0.18,0.179,-0.49,0.0,-0.422,0.199,-0.367,0.0,0.0,-0.423,0.185,-0.275,0.175,0.194,0.175,0.187,0.21,-0.462,-0.022,0.0,0.0,0.0,-0.438,0.0,0.0,0.0,-0.254,-0.359,-0.966,-1.24,0.355,0.399,-1.043,-0.408,-1.415,0.1,-0.708,-0.352,-0.364,-0.904,0.336,-0.707,0.623,0.232,0.379,0.267,0.277,-1.67,-0.045,-0.261,-0.383,-0.059,-1.635,0.144,-0.258,-0.315,0.158
8291,1373158606,-0.213,0.402,-0.761,-0.041,-0.451,-0.243,-0.205,0.455,-2.097,5.431,-8.404,3.565,-0.205,0.455,-2.097,5.431,-8.404,3.565,-0.009,-0.227,0.242,0.135,0.295,0.232,0.652,-0.297,0.102,0.962,0.37,-0.088,-0.019,0.583,0.231,0.352,0.008,0.353,0.38,0.364,0.032,0.048,0.777,-0.042,-0.404,-0.09,0.06,-0.291,-0.209,-0.233,0.0,0.0,0.065,0.065,-0.001,-0.001,-0.269,0.0,0.066,-0.583,0.06,0.0,0.0,-0.144,-0.001,0.064,-0.023,-0.001,-0.001,-0.001,-0.036,0.067,-0.602,0.0,0.0,0.0,0.067,0.0,0.0,0.0,-0.254,-0.359,-0.27,-0.273,0.272,0.3,-0.782,-0.408,-0.301,-0.964,-0.13,-0.352,-0.364,-0.568,0.234,-0.208,0.394,0.154,0.311,0.194,0.047,-0.351,-1.6,-0.261,-0.383,-0.059,-0.376,0.144,-0.258,-0.315,-0.07
4607,1373158606,0.514,-0.41,-0.766,-0.485,-0.225,-0.896,0.505,-0.089,-3.232,6.786,-9.263,3.078,0.505,-0.089,-3.232,6.786,-9.263,3.078,-0.009,-0.227,0.649,0.577,-0.077,-0.158,0.657,-0.297,0.553,0.765,0.76,-0.088,-0.019,0.674,-0.161,0.709,-0.229,0.319,0.043,0.172,-0.252,0.517,0.57,-0.042,-0.404,-0.09,0.524,-0.291,-0.209,-0.233,0.0,0.0,-0.265,-0.408,0.139,0.157,-0.425,0.0,-0.419,-0.447,-0.079,0.0,0.0,-0.344,0.16,-0.194,0.228,0.129,0.138,0.138,0.251,-0.451,-0.482,0.0,0.0,0.0,-0.422,0.0,0.0,0.0,-0.254,-0.359,-0.821,-1.081,0.15,0.308,-0.862,-0.408,-1.166,-0.694,-0.494,-0.352,-0.364,-0.75,0.25,-0.602,0.743,-0.121,0.097,-0.041,0.355,-1.313,-1.189,-0.261,-0.383,-0.059,-1.304,0.144,-0.258,-0.315,0.151
5114,1373158606,-0.373,0.948,0.872,0.284,-0.963,0.497,-0.347,0.491,3.377,-5.506,4.992,-1.751,-0.347,0.491,3.377,-5.506,4.992,-1.751,-0.009,-0.227,0.137,0.088,0.516,0.439,0.118,-0.297,0.071,0.651,0.313,-0.088,-0.019,0.149,0.436,0.244,0.244,0.6,0.595,0.6,0.376,0.042,0.009,-0.042,-0.404,-0.09,0.049,-0.291,-0.209,-0.233,0.0,0.0,-0.138,-0.09,-0.019,-0.051,-0.118,0.0,-0.075,-0.233,-0.011,0.0,0.0,-0.127,-0.098,-0.042,-0.182,-0.024,-0.024,-0.024,-0.195,-0.051,-0.024,0.0,0.0,0.0,-0.056,0.0,0.0,0.0,-0.254,-0.359,-0.19,-0.225,0.487,0.516,-0.033,-0.408,-0.258,0.29,0.044,-0.352,-0.364,0.02,0.454,-0.045,0.773,0.368,0.517,0.405,0.437,-0.31,-0.044,-0.261,-0.383,-0.059,-0.335,0.144,-0.258,-0.315,-0.332
1859,1373158606,0.664,-0.38,0.886,-0.641,0.325,0.344,0.522,0.349,-0.005,0.011,-0.012,0.004,0.522,0.349,-0.005,0.011,-0.012,0.004,-0.009,-0.227,0.259,0.083,0.284,0.221,0.214,-0.297,0.067,0.284,0.375,-0.088,-0.019,0.26,0.217,0.362,0.08,0.333,0.371,0.349,0.121,0.041,0.008,-0.042,-0.404,-0.09,0.048,-0.291,-0.209,-0.233,0.0,0.0,-0.001,-0.083,0.149,0.149,-0.0,0.0,-0.069,0.13,-0.002,0.0,0.0,-0.001,0.152,-0.002,0.146,0.158,0.147,0.154,0.167,-0.047,-0.022,0.0,0.0,0.0,-0.052,0.0,0.0,0.0,-0.254,-0.359,-0.264,-0.226,0.315,0.353,-0.101,-0.408,-0.258,0.056,-0.126,-0.352,-0.364,-0.12,0.288,-0.204,0.559,0.194,0.347,0.232,0.214,-0.31,-0.044,-0.261,-0.383,-0.059,-0.335,0.144,-0.258,-0.315,0.136


## Interpretation Network Training

In [None]:
# Run calculate_interpretation_net_results on the train / valid / test split lists
# and unpack its ten return values. The evaluation cells below read the last
# element ([-1]) of these result lists.
(history_list, 
scores_list, 

function_values_complete_list, 
function_values_valid_list, 
function_values_test_list, 

inet_preds_list, 
inet_preds_valid_list, 
inet_preds_test_list, 

distrib_dict_list,
model_list) = calculate_interpretation_net_results(lambda_net_train_dataset_list, 
                                                   lambda_net_valid_dataset_list, 
                                                   lambda_net_test_dataset_list)

Trial 89 Complete [00h 02m 18s]
val_loss: 0.13189025223255157

Best val_loss So Far: 0.07661603391170502
Total elapsed time: 07h 13m 34s

Search: Running Trial #90

Hyperparameter    |Value             |Best Value So Far 
conv_block_1/ke...|3                 |3                 
conv_block_1/se...|False             |False             
conv_block_1/ma...|False             |True              
conv_block_1/dr...|0                 |0                 
conv_block_1/nu...|2                 |2                 
conv_block_1/nu...|2                 |2                 
conv_block_1/fi...|32                |32                
conv_block_1/fi...|512               |512               
conv_block_1/fi...|32                |32                
conv_block_1/fi...|32                |32                
dense_block_1/u...|False             |False             
dense_block_1/n...|3                 |3                 
dense_block_1/u...|32                |32                
dense_block_1/d...|0                 

## Evaluate Interpretation Net

In [None]:
# When `nas` is set, the last history entry is iterated as a collection of
# trials and the summary of each trial is printed.
# NOTE(review): presumably `nas` means neural architecture search - confirm.
if nas:
    for trial in history_list[-1]: 
        print(trial.summary())

In [None]:
# Print summary and configuration of the most recent model, if any model exists.
if len(model_list) >= 1:
    print(model_list[-1].summary())
    print(model_list[-1].get_config())

In [None]:
# Display the most recent entry of scores_list.
scores_list[-1]

In [None]:
# Display the 'MAE' entry of the most recent distribution dictionary.
distrib_dict_list[-1]['MAE']

In [None]:
# Display the 'R2' entry of the most recent distribution dictionary.
distrib_dict_list[-1]['R2']

In [None]:
# Worst case: position of the smallest value in the
# 'predLambda_VS_lstsqTarget_test' entry of the latest R2 distributions.
r2_distrib_latest = distrib_dict_list[-1]['R2']
index_min = int(np.argmin(r2_distrib_latest.loc['predLambda_VS_lstsqTarget_test']))

# R2 of the I-Net polynomial vs. the target polynomial at that position.
print(r2_distrib_latest.loc['inetPoly_VS_targetPoly_test'][index_min])

# Print the I-Net prediction for that position.
polynomial_inet = inet_preds_test_list[-1][index_min]
print_polynomial_from_coefficients(polynomial_inet)

In [None]:
# Worst case: position of the smallest value in the
# 'predLambda_VS_lstsqTarget_test' entry of the latest R2 distributions.
index_min = int(np.argmin(distrib_dict_list[-1]['R2'].loc['predLambda_VS_lstsqTarget_test']))

# R2 of the least-squares lambda polynomial vs. the target polynomial at that position.
print(distrib_dict_list[-1]['R2'].loc['lstsqLambda_VS_targetPoly_test'][index_min])

# Read from lambda_net_test_dataset_list[-1] so the polynomial comes from the
# same dataset as the [-1] results above, instead of depending on the loop
# variable left over from the dataset-splitting cell.
polynomial_lambda = lambda_net_test_dataset_list[-1].lstsq_lambda_pred_polynomial_list[index_min]
print_polynomial_from_coefficients(polynomial_lambda, force_complete_poly_representation=True)

In [None]:
# Worst case: position of the smallest value in the
# 'predLambda_VS_lstsqTarget_test' entry of the latest R2 distributions.
index_min = int(np.argmin(distrib_dict_list[-1]['R2'].loc['predLambda_VS_lstsqTarget_test']))

# Read from lambda_net_test_dataset_list[-1] so the polynomial comes from the
# same dataset as the [-1] results above, instead of depending on the loop
# variable left over from the dataset-splitting cell.
polynomial_target = lambda_net_test_dataset_list[-1].target_polynomial_list[index_min]
print_polynomial_from_coefficients(polynomial_target, force_complete_poly_representation=True)

In [None]:
# Best case: position of the largest value in the
# 'predLambda_VS_lstsqTarget_test' entry of the latest R2 distributions.
r2_distrib_latest = distrib_dict_list[-1]['R2']
index_max = int(np.argmax(r2_distrib_latest.loc['predLambda_VS_lstsqTarget_test']))

# R2 of the I-Net polynomial vs. the target polynomial at that position.
print(r2_distrib_latest.loc['inetPoly_VS_targetPoly_test'][index_max])

# Print the I-Net prediction for that position.
polynomial_inet = inet_preds_test_list[-1][index_max]
print_polynomial_from_coefficients(polynomial_inet)

In [None]:
# Best case: position of the largest value in the
# 'predLambda_VS_lstsqTarget_test' entry of the latest R2 distributions.
index_max = int(np.argmax(distrib_dict_list[-1]['R2'].loc['predLambda_VS_lstsqTarget_test']))

# R2 of the least-squares lambda polynomial vs. the target polynomial at that position.
print(distrib_dict_list[-1]['R2'].loc['lstsqLambda_VS_targetPoly_test'][index_max])

# Read from lambda_net_test_dataset_list[-1] so the polynomial comes from the
# same dataset as the [-1] results above, instead of depending on the loop
# variable left over from the dataset-splitting cell.
polynomial_lambda = lambda_net_test_dataset_list[-1].lstsq_lambda_pred_polynomial_list[index_max]
print_polynomial_from_coefficients(polynomial_lambda, force_complete_poly_representation=True)

In [None]:
# Best case: position of the largest value in the
# 'predLambda_VS_lstsqTarget_test' entry of the latest R2 distributions.
index_max = int(np.argmax(distrib_dict_list[-1]['R2'].loc['predLambda_VS_lstsqTarget_test']))

# Read from lambda_net_test_dataset_list[-1] so the polynomial comes from the
# same dataset as the [-1] results above, instead of depending on the loop
# variable left over from the dataset-splitting cell.
polynomial_target = lambda_net_test_dataset_list[-1].target_polynomial_list[index_max]
print_polynomial_from_coefficients(polynomial_target, force_complete_poly_representation=True)

In [None]:
# R2 values of the I-Net polynomials vs. the target polynomials (test split).
r2_values_inet = distrib_dict_list[-1]['R2'].loc['inetPoly_VS_targetPoly_test']
r2_mean_inet = np.mean(r2_values_inet)
r2_count_inet = r2_values_inet.shape[0]
print('Mean: ' + str(r2_mean_inet) + ' (' + str(r2_count_inet) + ' Samples)')

# Same statistic, restricted to the strictly positive R2 values.
r2_values_positive_inet = r2_values_inet[r2_values_inet>0]
r2_mean_positive_inet = np.mean(r2_values_positive_inet)
r2_count_positive_inet = r2_values_positive_inet.shape[0]
print('Mean (only positive): ' + str(r2_mean_positive_inet) + ' (' + str(r2_count_positive_inet) + ' Samples)')



In [None]:
# R2 values of the least-squares lambda polynomials vs. the target polynomials (test split).
r2_values_lstsq_lambda = distrib_dict_list[-1]['R2'].loc['lstsqLambda_VS_targetPoly_test']
# The sample count is taken from r2_values_lstsq_lambda itself, so this cell
# reports its own size and does not depend on the I-Net statistics cell.
print('Mean: ' + str(np.mean(r2_values_lstsq_lambda)) + ' (' + str(r2_values_lstsq_lambda.shape[0]) + ' Samples)')

# Same statistic, restricted to the strictly positive R2 values.
r2_values_positive_lstsq_lambda = r2_values_lstsq_lambda[r2_values_lstsq_lambda>0]
print('Mean (only positive): ' + str(np.mean(r2_values_positive_lstsq_lambda)) + ' (' + str(r2_values_positive_lstsq_lambda.shape[0]) + ' Samples)')



In [None]:
# Histogram of the 'inetPoly_VS_targetPoly_test' MAE values, restricted to the
# entries whose R2 for the same comparison is greater than -50.
sns.histplot(distrib_dict_list[-1]['MAE'].loc['inetPoly_VS_targetPoly_test'][distrib_dict_list[-1]['R2'].loc['inetPoly_VS_targetPoly_test'] > -50])


In [None]:
# Histogram of the 'lstsqLambda_VS_targetPoly_test' MAE values, restricted to
# the entries whose R2 for the same comparison is greater than -50.
sns.histplot(distrib_dict_list[-1]['MAE'].loc['lstsqLambda_VS_targetPoly_test'][distrib_dict_list[-1]['R2'].loc['lstsqLambda_VS_targetPoly_test'] > -50])


In [None]:
# Histogram of the I-Net R2 values (entries > -50 only), bins of width 0.2,
# x-axis limited to [-30, 1].
r2_inet_test_values = distrib_dict_list[-1]['R2'].loc['inetPoly_VS_targetPoly_test']
p = sns.histplot(r2_inet_test_values[r2_inet_test_values > -50], binwidth=0.2)
p.set(xlim=(-30, 1))

In [None]:
# Histogram of the I-Net R2 values (entries > -50 only), bins of width 0.1,
# x-axis limited to [0, 1].
r2_inet_test_values = distrib_dict_list[-1]['R2'].loc['inetPoly_VS_targetPoly_test']
p = sns.histplot(r2_inet_test_values[r2_inet_test_values > -50], binwidth=0.1)
p.set(xlim=(0, 1))

In [None]:
# Histogram of the least-squares lambda R2 values (entries > -50 only),
# bins of width 0.2, x-axis limited to [-10, 1].
r2_lstsq_lambda_test_values = distrib_dict_list[-1]['R2'].loc['lstsqLambda_VS_targetPoly_test']
p = sns.histplot(r2_lstsq_lambda_test_values[r2_lstsq_lambda_test_values > -50], binwidth=0.2)
p.set(xlim=(-10, 1))

In [None]:
# Histogram of the least-squares lambda R2 values (entries > -50 only),
# bins of width 0.1, x-axis limited to [0, 1].
r2_lstsq_lambda_test_values = distrib_dict_list[-1]['R2'].loc['lstsqLambda_VS_targetPoly_test']
p = sns.histplot(r2_lstsq_lambda_test_values[r2_lstsq_lambda_test_values > -50], binwidth=0.1)
p.set(xlim=(0, 1))

In [None]:
# Plot and save the metric curves of the latest training history (skipped when `nas` is set).
if not nas:
    history = history_list[-1]
    history_keys = list(history.keys())

    # The second key is plotted as the training curve.
    train_metric_key = history_keys[1]
    plt.plot(history[train_metric_key])

    # The key at position len//2 + 1 is plotted as the validation curve
    # (assumes the second half of the keys mirrors the first - TODO confirm).
    if consider_labels_training or evaluate_with_real_function:
        valid_metric_key = history_keys[len(history_keys) // 2 + 1]
        plt.plot(history[valid_metric_key])

    plt.title('model ' + train_metric_key)
    plt.ylabel('metric')
    plt.xlabel('epoch')
    plt.legend(['train', 'valid'], loc='upper left')

    metric_plot_path = (
        './data/results/'
        + path_identifier_interpretation_net_data
        + '/metric_'
        + path_identifier_interpretation_net_data
        + '_epoch_'
        + str(epochs_lambda).zfill(3)
        + '.png'
    )
    plt.savefig(metric_plot_path)


In [None]:
# Plot and save the loss curves of the latest training history (skipped when `nas` is set).
if not nas:
    history = history_list[-1]

    train_loss_curve = history['loss']
    plt.plot(train_loss_curve)

    # The validation loss is only drawn when one of the two flags is set.
    if consider_labels_training or evaluate_with_real_function:
        valid_loss_curve = history['val_loss']
        plt.plot(valid_loss_curve)

    plt.title('model loss')
    plt.ylabel('loss')
    plt.xlabel('epoch')
    plt.legend(['train', 'valid'], loc='upper left')

    loss_plot_path = (
        './data/results/'
        + path_identifier_interpretation_net_data
        + '/loss_'
        + path_identifier_interpretation_net_data
        + '_epoch_'
        + str(epochs_lambda).zfill(3)
        + '.png'
    )
    plt.savefig(loss_plot_path)


### Multi Epoch/Samples Analysis

### Generate Comparison Plots

In [None]:
# A comparison plot over all listed function-value metrics is only generated
# when scores_list holds more than one entry.
if len(scores_list) > 1:
    plot_metric_list = ['MAE FV', 'RMSE FV', 'MAPE FV', 'R2 FV', 'RAAE FV', 'RMAE FV']

    generate_inet_comparison_plot(scores_list, plot_metric_list)

In [None]:
# Comparison plot for 'MAE FV' only; requires more than one entry in scores_list.
if len(scores_list) > 1:
    plot_metric_list = ['MAE FV']

    generate_inet_comparison_plot(scores_list, plot_metric_list)

In [None]:
# Comparison plot for 'R2 FV' only, with ylim=(-5, 1) passed to the plot
# helper; requires more than one entry in scores_list.
if len(scores_list) > 1:
    plot_metric_list = ['R2 FV']

    generate_inet_comparison_plot(scores_list, plot_metric_list, ylim=(-5, 1))

#### Generate and Analyze Predictions for Random Function

In [None]:
# Print all polynomial representations of one fixed test function side by side.
# `index` is also read by the plotting cells that follow.
index = 5

# All polynomials are read from lambda_net_test_dataset_list[-1], the same
# dataset the I-Net predictions in inet_preds_test_list[-1] belong to, instead
# of depending on the loop variable left over from the dataset-splitting cell.
polynomial_target = lambda_net_test_dataset_list[-1].target_polynomial_list[index]
polynomial_lstsq_target = lambda_net_test_dataset_list[-1].lstsq_target_polynomial_list[index]
polynomial_lstsq_lambda = lambda_net_test_dataset_list[-1].lstsq_lambda_pred_polynomial_list[index]
polynomial_inet = inet_preds_test_list[-1][index]

print('Target Poly:')
print_polynomial_from_coefficients(polynomial_target, force_complete_poly_representation=True, round_digits=4)
print('LSTSQ Target Poly:')
print_polynomial_from_coefficients(polynomial_lstsq_target, force_complete_poly_representation=True, round_digits=4)
print('LSTSQ Lambda Poly:')
print_polynomial_from_coefficients(polynomial_lstsq_lambda, force_complete_poly_representation=True, round_digits=4)
print('I-Net Poly:')
print_polynomial_from_coefficients(polynomial_inet, round_digits=4)


In [None]:
# Plot (plot_type=1) the prediction evaluation for the function selected by `index`.
plot_and_save_single_polynomial_prediction_evaluation(lambda_net_test_dataset_list, 
                                                      function_values_test_list, 
                                                      inet_preds_test_list,
                                                      rand_index=index, 
                                                      plot_type=1)

In [None]:
# Plot (plot_type=2) the prediction evaluation for the function selected by `index`.
plot_and_save_single_polynomial_prediction_evaluation(lambda_net_test_dataset_list, 
                                                      function_values_test_list, 
                                                      inet_preds_test_list,
                                                      rand_index=index, 
                                                      plot_type=2)

In [None]:
# Plot (plot_type=3) the prediction evaluation for the function selected by `index`.
plot_and_save_single_polynomial_prediction_evaluation(lambda_net_test_dataset_list, 
                                                      function_values_test_list, 
                                                      inet_preds_test_list,
                                                      rand_index=index, 
                                                      plot_type=3)

# BENCHMARK (RANDOM GUESS) EVALUATION

In [None]:
# Random-guess baseline: one row of `sparsity` coefficients per entry of the
# last test dataset, drawn uniformly from [-10, 10).
# NOTE(review): the config at the top of this notebook sets a_min=-1 / a_max=1
# for the target coefficients - confirm that the wider range here is intended.
list_of_random_polynomials = np.random.uniform(low=-10, high=10, size=(len(lambda_net_test_dataset_list[-1]), sparsity))

In [None]:
# Function values of the target polynomials and of the random polynomials,
# both computed with the test_data_list of the last test dataset.
true_fv_test = parallel_fv_calculation_from_polynomial(lambda_net_test_dataset_list[-1].target_polynomial_list, lambda_net_test_dataset_list[-1].test_data_list, force_complete_poly_representation=True)
random_fv_test = parallel_fv_calculation_from_polynomial(list_of_random_polynomials, lambda_net_test_dataset_list[-1].test_data_list, force_complete_poly_representation=True)

In [None]:
# Mean absolute error between target coefficients and random coefficients, rounded to 4 decimals.
print('Random Guess Error Coefficients: ' + str(np.round(mean_absolute_error(lambda_net_test_dataset_list[-1].target_polynomial_list, list_of_random_polynomials), 4)))

In [None]:
# Error between true and random-guess function values, rounded to 4 decimals.
print('Random Guess Error FVs: ' + str(np.round(mean_absolute_error_function_values(true_fv_test, random_fv_test), 4)))

# BENCHMARK (EDUCATED GUESS/MEAN PREDICTION) EVALUATION

In [None]:
# Educated-guess baseline: predict one constant, the mean function value, for
# every test function.
# The mean is estimated on the TRAINING split so that the baseline does not use
# information from the test functions it is evaluated on afterwards.
true_fv_train = parallel_fv_calculation_from_polynomial(lambda_net_train_dataset_list[-1].target_polynomial_list, lambda_net_train_dataset_list[-1].test_data_list, force_complete_poly_representation=True)

mean_fv = np.mean(true_fv_train)
# One copy of the constant per test function (true_fv_test comes from the random-guess cells above).
mean_fv_pred_test = [mean_fv for _ in range(true_fv_test.shape[0])]

In [None]:
# Error between the true test function values and the constant mean prediction, rounded to 4 decimals.
print('Educated Guess/Mean Prediction Error FVs: ' + str(np.round(mean_absolute_error_function_values(true_fv_test, mean_fv_pred_test), 4)))

In [None]:
%%script false --no-raise-error

# Sanity check of the function-value loss wrapper on the last training set.
# The loss is evaluated twice: once with X_train as loaded, and once with
# seed_in_inet_training = False and one more leading column removed from X_train.
# NOTE: this cell is disabled by the `%%script false --no-raise-error` magic at its top.
base_model = generate_base_model()
# Uniform evaluation points in [x_min, x_max) with n columns.
random_evaluation_dataset = np.random.uniform(low=x_min, high=x_max, size=(random_evaluation_dataset_size, n))
#random_evaluation_dataset = lambda_train_input_train_split[0]#lambda_train_input[0] #JUST [0] HERE BECAUSE EVALUATION ALWAYS ON THE SAME DATASET FOR ALL!!
# Monomial identifiers converted to a float array.
list_of_monomial_identifiers_numbers = np.array([list(monomial_identifiers) for monomial_identifiers in list_of_monomial_identifiers]).astype(float)


loss_function = mean_absolute_error_tf_fv_lambda_extended_wrapper(random_evaluation_dataset, list_of_monomial_identifiers_numbers, base_model)      

# Drop the first column of X and the first two columns of y.
X_train = X_train_list[-1].values[:,1:]
y_train = y_train_list[-1].values[:,2:]

#X_train = X_train[:,1:]
# First argument of the loss: y columns followed by the X columns.
y_train_model = np.hstack((y_train, X_train))

# First run: uses the current value of seed_in_inet_training.
print('seed_in_inet_training = ' + str(seed_in_inet_training), loss_function(y_train_model, y_train))


# Second run: flag switched off and the loss wrapper rebuilt.
seed_in_inet_training = False

loss_function = mean_absolute_error_tf_fv_lambda_extended_wrapper(random_evaluation_dataset, list_of_monomial_identifiers_numbers, base_model)      

X_train = X_train_list[-1].values[:,1:]
y_train = y_train_list[-1].values[:,2:]

# One more leading column is removed here
# (presumably the seed column - TODO confirm against the dataset layout).
X_train = X_train[:,1:]
y_train_model = np.hstack((y_train, X_train))

print('seed_in_inet_training = ' + str(seed_in_inet_training), loss_function(y_train_model, y_train))

# Set the flag to True again after the check.
seed_in_inet_training = True



In [None]:
# When use_gpu is set, reset the current CUDA device via numba at the end of the notebook.
# numba is imported locally, so it is only required when use_gpu is set.
if use_gpu:
    from numba import cuda 
    device = cuda.get_current_device()
    device.reset()