In [5]:
#@title **Main**
from urllib.request import urlopen
import json
import numpy as np
import pandas as pd
import os
import copy
import math
import statistics
import sklearn.metrics as metrics
 
# Evitar truncar data mostrada al usar jupyter notebook
pd.set_option('display.max_rows', None)
pd.set_option('display.max_columns', None)
 
# Constante que aloja el diccionario JSON con toda la data
DATA = None

# Obtener data JSON
if os.path.exists('./out/dataout.json'):
    DATA = json.load(open('./out/dataout.json', 'r'))
else:
    data_url = urlopen('http://nutriexcel.cl/UMDU/dataout_v2.json')
    DATA = json.loads(data_url.read())
 
# Labels base de las columnas
LABELS_BASE = {
    # Parámetros del alumno (Target)
    'p1':                            ['p1'],
    'p2':                            ['p2'],
    'np':                            ['np'],
    'p1p2':                          ['p1p2'], # Promedio p1p2 y p2p2
    'p2p2':                          ['p2p2'],
    
    # Parámetros del laboratorio (Features)
    'grade':                         ['g_lab#'],
    'attempts':                      ['a_lab#'],
    'usedtime':                      ['ut_lab#'],
    'activetime':                    ['act_lab#'],
    'disconnections':                ['dis_lab#'],      # log
    'compilationtime':               ['ct_lab#'],
    'runtimedebuggingtime':          ['rt_lab#'],
    'compilationtimeratio':          ['ctr_lab#'],
    'runtimedebuggingtimeratio':     ['rtr_lab#'],
    'errorsreductionratio':          ['err_lab#'],
    'compilationerrorsratio':        ['cer_lab#'],
    'activequartiles':               ['actq1_lab#','actq2_lab#','actq3_lab#'],
    'questionsdifficulty':           ['qd$_lab#'],
    'questionsgrades':               ['qg$_lab#'],      # Promedio
    'questionsattempts':             ['qat$_lab#'],     # Sumar - Max   # log
    'questionsactivetime':           ['qact$_lab#'],    # Promedio
    'questionsavgtime':              ['qavt$_lab#'],    # Promedio
    'questionsmaxerrors':            ['qme$_lab#'],     # Max
    'questionsmaxconsecutiveerrors': ['qmce$_lab#'],    # Max
    'questionsmaxsimilarityratio':   ['qmsr$_lab#'],    # Promedio
    'questionscorrectness':          ['qc$_lab#']       # Promedio
}
 
 
# Cantidad de preguntas por lab
LABS_LENGTHS = {
    '1': 7,
    '2': 6,
    '3': 6,
    '4': 5,
    '5': 3
}
 
def get_labels(labs:list, obj_param:list, params:list):
    '''Retorna una lista con los nombres de las columnas correspondientes.'''
    labels = []
    
    if not obj_param == None:
        for obj_p in obj_param:
            labels.extend(LABELS_BASE[obj_p])
 
    for lab in labs:
        for param in params:
            label_base = LABELS_BASE[param]
            for lb in label_base:
                aux_label = lb.replace('#', str(lab))
                if '$' in aux_label:
                    for i in range(LABS_LENGTHS[str(lab)]):
                        labels.extend([aux_label.replace('$', str(i + 1))])
                else:
                    labels.extend([aux_label])
    return labels
                    
 
def load_data(filepath = './out/dataout.json'):
    '''Retorna un diccionario importado desde un archivo JSON.'''
    return readJSON(filepath)
 
 
def convert_to_dataframe(arr:list, labels:list=None, ids_idx:list=None):
    '''Retorna un Pandas Dataframe.'''
    return pd.DataFrame(np.array(arr), columns=labels, index=ids_idx)
 
 
def get_custom_dataframe(data:dict, labs:list, obj_param:list, params:list, labels:bool=False, index:str=None):
    '''Retorna un DataFrame de Pandas con etiquetas.'''
    if params == 'all':
        params = list(LABELS_BASE.keys())[5:]
        
    data, ids_idx = get_custom_data(labs, obj_param, params, data, index)
    if labels:
        return convert_to_dataframe(data, labels=get_labels(labs, obj_param, params), ids_idx=ids_idx)
    else:
        return convert_to_dataframe(data, labels=None, ids_idx=ids_idx)
 
    
 
 
def get_custom_data(labs:list, obj_param:list, params:list, data:dict, index:str):
    dataout = []
    idxs = []
    for v1 in data['courses'].values():
        for k2,v2 in v1['students'].items():
            if index == 'id':
                idxs.append(k2)
            elif not index == None:
                idxs.append(v2[index])
            
            studentdata = []
 
            if not obj_param == None:
                for obj_p in obj_param:
                    studentdata.extend([v2[obj_p]])
            
            for labnumber in labs:
                labkey = str(list(v2['labs'].keys())[int(labnumber) - 1])
                
                for param in params:
                    val = v2['labs'][labkey][param]
                    if isinstance(val, list):
                        studentdata.extend(val)
                    else:
                        studentdata.extend([val])
            
            dataout.append(studentdata)
 
    if len(idxs) == 0:
        idxs = None
 
    return dataout, idxs
 
 
def readJSON(filename:str):
    print('Leyendo archivo: \'' + filename + '\'')
    return json.load(open(filename, 'r'))
 
# --------------------------------------------------------------------------
 
def norm_log(df):
    min_value = min(df)
    for i in range(len(df)):
        df[i] = math.log(df[i] - min_value + 1)
 
    return df
 
# --------------------------------------------------------------------------
 
def apply(df:pd.core.frame.DataFrame, columns, func, c=None, replace:bool=True):
    '''
    Aplica una función dada a una serie de parámetros dados.
    df: Dataframe.
    func: Función a aplicar (Ej.: 'sum', 'max', 'math.log', etc.).
    params: Parámetro o lista de parámetros al cual/a los cuales aplicar la función. Si el parámetro param tiene un signo '?' al final, 
            se considerarán todos aquellos que empiecen con param. Si es una lista de parámetros, cada parámetro debe ser el nombre exacto,
            es decir, no deben llevar '?'.
    c: constante o parámetro a utilizar en el cálculo (Ej: sumar constante c; log base c). Se debe omitir si no aplica.
    replace: Si es True, reemplaza la columna o columnas a las cuales se la aplica la función. Si es False, se agregan nuevas columnas.
    '''
 
    def one_param(df_new:pd.core.frame.DataFrame):
        if not columns[-1] == '?':
            try:
                aux_column = function_handler(func, df_new[columns], c)
            except KeyError:
                raise Exception('Columna ' + columns + ' no existe.')
 
            aux_column = pd.DataFrame(aux_column)
            insert_columns(df_new, aux_column, [columns], replace, func.__name__, c)
            
            return df_new
        else:
            labels = list(df_new.columns) + ['???']
            target_cols = []
            target_cols_names = []
            fg_newarr = True
            fg_endarr = False
            i = 0
 
            while i < len(labels):
                if labels[i][0] == columns[0] and columns[:-1] in labels[i]:
                    target_cols.append(i)
                    target_cols_names.append(labels[i])
                    fg_newarr = False
                elif not fg_newarr:
                    fg_endarr = True
                
                if not fg_newarr and fg_endarr:
                    fg_newarr = True
                    fg_endarr = False
                    aux_columns = []
                    
                    for row in df_new.values:
                        aux_row = [row[col] for col in target_cols]
                        aux_columns.append(function_handler(func, aux_row, c))
 
                    aux_columns = pd.DataFrame(aux_columns)
                    insert_columns(df_new, aux_columns, target_cols_names, replace, func.__name__, c)
 
                    if replace:
                        i -= len(target_cols)
                        labels = list(df_new.columns) + ['???']
 
                    target_cols = []
                    target_cols_names = []
                i += 1
            
            return df_new
 
 
    def multi_param(df_new:pd.core.frame.DataFrame):
        aux_columns = []
        target_cols = [df_new.columns.get_loc(col) for col in columns]
 
        for row in df_new.values:
            try:
                aux_row = [row[col] for col in range(len(target_cols))]
            except KeyError:
                raise Exception('Columna ' + columns + ' no existe.')
            
            aux_columns.append(function_handler(func, aux_row, c))
 
        aux_columns = pd.DataFrame(aux_columns)
        insert_columns(df_new, aux_columns, columns, replace, func.__name__, c)
 
        return df_new
 
    
    def function_handler(func, col, c=None):
        arr = copy.deepcopy(col)
        try:
            if c == None:
                return func(arr)
            else:
                return func(arr, c)
        except TypeError:
            try:
                return [function_handler(func, datum, c) for datum in arr]
            except TypeError:
                raise Exception('Operación sin sentido: x = ' + func.__name__ + '(x).')
    
 
    def insert_columns(df_new, sub_df, labels, replace, func_name, c):
        const_name = ''
 
        if not c == None:
                const_name = ',' + str(c)
 
        if len(sub_df.columns) == 1:
            merg_name = labels[0]
            
            if len(labels) > 1:
                merg_name = get_merged_name(labels[0])
 
            new_name = func_name + '(' + merg_name + const_name + ')'
 
            if replace:
                df_new[labels[0]] = sub_df
                df_new.rename(columns={labels[0]: new_name}, inplace=True)
 
                if len(labels) > 1:
                    for i in range(1, len(labels)):
                        df_new.pop(labels[i])
            else:
                df_new[new_name] = sub_df
        else:
            new_names = [func_name + '(' + cur_name + const_name + ')' for cur_name in labels]
 
            if replace:
                for i in range(len(labels)):
                    df_new[labels[i]] = sub_df[i]
                    df_new.rename(columns={labels[i]: new_names[i]}, inplace=True)
            else:
                for i in range(len(labels)):
                    df_new[new_names[i]] = sub_df[i]
 
 
    def get_merged_name(basename:str):
        merged_name = ''
        flag = True
        for i in range(len(basename)):
            if flag and basename[i].isnumeric():
                merged_name += '$'
                flag = False
            else:
                merged_name += basename[i]
 
        return merged_name
 
 
    def are_valid_column_names(columns):
        if type(columns) == list:
            for col in columns:
                if '?' in col:
                    raise Exception('Nombres de columna en lista no deben contener \'?\'.')
        
        return True
 
 
    df_new = copy.deepcopy(df)
    are_valid_column_names(columns)
    if type(columns) == list:
        return multi_param(df_new)
    else:
        return one_param(df_new)
 
 
def remove_col(df, column:str):
    if column[-1] == '?':
        for x in df.columns:
            if x[0] == column[0] and column[:-1] in x:
                df.pop(x)
    else:
        df.pop(column)
 
 
def normalise_row(df):
    df_aux = copy.deepcopy(df)
 
    for i in range(len(df_aux)):
        min_value = min(df_aux.iloc[i])
        max_value = max(df_aux.iloc[i])
 
        df_aux.iloc[i] = (df_aux.iloc[i] - min_value) / (max_value - min_value)
 
    return df_aux
 
 
def normalise_col(df, norm_params=None):
    norm_params_aux = {}
    df_aux = copy.deepcopy(df)
 
    if norm_params == None:
        for col in df_aux.columns:
            min_value = min(df_aux[col])
            max_value = max(df_aux[col])
            
            norm_params_aux[col] = {
                'min_value': min_value,
                'max_value': max_value
            }
 
            for i in range(len(df_aux[col])):
                if not max_value - min_value == 0:
                    df_aux[col].iloc[i] = (df_aux[col].iloc[i] - min_value) / (max_value - min_value)
                else:
                    df_aux[col].iloc[i] = 0
 
        return df_aux, norm_params_aux
    else:
        for col in df_aux.columns:
            for i in range(len(df_aux[col])):
                if not norm_params[col]['max_value'] - norm_params[col]['min_value'] == 0:
                    df_aux[col].iloc[i] = (df_aux[col].iloc[i] - norm_params[col]['min_value']) / (norm_params[col]['max_value'] - norm_params[col]['min_value'])
                else:
                    df_aux[col].iloc[i] = 0
        return df_aux
 
 
def normalise_log(df):
    df_aux = copy.deepcopy(df)
 
    for i in range(len(df_aux)):
        for j in range(len(df_aux.iloc[i])):
            df_aux.iloc[i][j] = math.log(df_aux.iloc[i][j]) if df_aux.iloc[i][j] > 0 else 0
 
    return df_aux

In [None]:
print(len(datalab1_all.columns))
print(len(datalab2_all.columns))
print(len(datalab3_all.columns))
print(len(datalab4_all.columns))

In [None]:
print(len(datalab1.columns))
print(len(datalab2.columns))
print(len(datalab3.columns))
print(len(datalab4.columns))

In [None]:
datalab1.head()

In [6]:
#@title **Data preparation**

# Get dataframe
datalab1_all = get_custom_dataframe(DATA, [1], ['p1p2','p2p2'], 'all', labels=True, index=None)

datalab1 = copy.deepcopy(datalab1_all)
 
# Remove questionsdifficulty
remove_col(datalab1, 'qd?')
# Group columns
datalab1_all = apply(datalab1_all, ['p1p2','p2p2'], statistics.mean)
datalab1 = apply(datalab1, ['p1p2','p2p2'], statistics.mean)
datalab1 = apply(datalab1, 'dis_lab1', norm_log)
datalab1 = apply(datalab1, 'qg?', statistics.mean)
datalab1 = apply(datalab1, 'qat?', sum, replace=False)
datalab1 = apply(datalab1, 'sum(qat$_lab1)', norm_log, replace=False)
datalab1 = apply(datalab1, 'qat?', max)
datalab1 = apply(datalab1, 'qact?', statistics.mean)
datalab1 = apply(datalab1, 'qavt?', statistics.mean)
datalab1 = apply(datalab1, 'qme?', max)
datalab1 = apply(datalab1, 'qmce?', max)
datalab1 = apply(datalab1, 'qmsr?', statistics.mean)
datalab1 = apply(datalab1, 'qc?', statistics.mean)
aux = datalab1['act_lab1'] / datalab1['sum(qat$_lab1)']
for i in range(len(aux)):
    if not aux[i] > 0:
        aux[i] = 0
datalab1['avgtime_lab1'] = aux
datalab1 = datalab1.round(4)
 
 
# Get dataframe
datalab2_all = get_custom_dataframe(DATA, [2], ['p1p2','p2p2'], 'all', labels=True, index=None)
 
datalab2 = copy.deepcopy(datalab2_all)
 
# Remove questionsdifficulty
remove_col(datalab2, 'qd?')
# Group columns
datalab2_all = apply(datalab2_all, ['p1p2','p2p2'], statistics.mean)
datalab2 = apply(datalab2, ['p1p2','p2p2'], statistics.mean)
datalab2 = apply(datalab2, 'dis_lab2', norm_log)
datalab2 = apply(datalab2, 'qg?', statistics.mean)
datalab2 = apply(datalab2, 'qat?', sum, replace=False)
datalab2 = apply(datalab2, 'sum(qat$_lab2)', norm_log, replace=False)
datalab2 = apply(datalab2, 'qat?', max)
datalab2 = apply(datalab2, 'qact?', statistics.mean)
datalab2 = apply(datalab2, 'qavt?', statistics.mean)
datalab2 = apply(datalab2, 'qme?', max)
datalab2 = apply(datalab2, 'qmce?', max)
datalab2 = apply(datalab2, 'qmsr?', statistics.mean)
datalab2 = apply(datalab2, 'qc?', statistics.mean)
aux = datalab2['act_lab2'] / datalab2['sum(qat$_lab2)']
for i in range(len(aux)):
    if not aux[i] > 0:
        aux[i] = 0
datalab2['avgtime_lab2'] = aux
datalab2 = datalab2.round(4)
 
 
# Get dataframe
datalab3_all = get_custom_dataframe(DATA, [3], ['p1p2','p2p2'], 'all', labels=True, index=None)
 
datalab3 = copy.deepcopy(datalab3_all)
 
# Remove questionsdifficulty
remove_col(datalab3, 'qd?')
# Group columns
datalab3_all = apply(datalab3_all, ['p1p2','p2p2'], statistics.mean)
datalab3 = apply(datalab3, ['p1p2','p2p2'], statistics.mean)
datalab3 = apply(datalab3, 'dis_lab3', norm_log)
datalab3 = apply(datalab3, 'qg?', statistics.mean)
datalab3 = apply(datalab3, 'qat?', sum, replace=False)
datalab3 = apply(datalab3, 'sum(qat$_lab3)', norm_log, replace=False)
datalab3 = apply(datalab3, 'qat?', max)
datalab3 = apply(datalab3, 'qact?', statistics.mean)
datalab3 = apply(datalab3, 'qavt?', statistics.mean)
datalab3 = apply(datalab3, 'qme?', max)
datalab3 = apply(datalab3, 'qmce?', max)
datalab3 = apply(datalab3, 'qmsr?', statistics.mean)
datalab3 = apply(datalab3, 'qc?', statistics.mean)
aux = datalab3['act_lab3'] / datalab3['sum(qat$_lab3)']
for i in range(len(aux)):
    if not aux[i] > 0:
        aux[i] = 0
datalab3['avgtime_lab3'] = aux
datalab3 = datalab3.round(4)
 
 
# Get dataframe
datalab4_all = get_custom_dataframe(DATA, [4], ['p1p2','p2p2'], 'all', labels=True, index=None)
 
datalab4 = copy.deepcopy(datalab4_all)
 
# Remove questionsdifficulty
remove_col(datalab4, 'qd?')
# Group columns
datalab4_all = apply(datalab4_all, ['p1p2','p2p2'], statistics.mean)
datalab4 = apply(datalab4, ['p1p2','p2p2'], statistics.mean)
datalab4 = apply(datalab4, 'dis_lab4', norm_log)
datalab4 = apply(datalab4, 'qg?', statistics.mean)
datalab4 = apply(datalab4, 'qat?', sum, replace=False)
datalab4 = apply(datalab4, 'sum(qat$_lab4)', norm_log, replace=False)
datalab4 = apply(datalab4, 'qat?', max)
datalab4 = apply(datalab4, 'qact?', statistics.mean)
datalab4 = apply(datalab4, 'qavt?', statistics.mean)
datalab4 = apply(datalab4, 'qme?', max)
datalab4 = apply(datalab4, 'qmce?', max)
datalab4 = apply(datalab4, 'qmsr?', statistics.mean)
datalab4 = apply(datalab4, 'qc?', statistics.mean)
aux = datalab4['act_lab4'] / datalab4['sum(qat$_lab4)']
for i in range(len(aux)):
    if not aux[i] > 0:
        aux[i] = 0
datalab4['avgtime_lab4'] = aux
datalab4 = datalab4.round(4)

In [7]:
#@title **Parameters**

# Objective vector
TARGET = 'mean(p$p2)'
NORM_TYPE = 'col'
N_FEATURES = 5
 
 
# Import needed libraries ----------------------------------------
from sklearn.model_selection import GridSearchCV, train_test_split
from sklearn.pipeline import Pipeline
from sklearn.feature_selection import RFE, SelectFromModel
from sklearn.ensemble import GradientBoostingRegressor
import sklearn.metrics as metrics
from sklearn.model_selection import KFold
 
random_state = None # Random state for train_test_split

In [8]:
datalab1.head()

Unnamed: 0,mean(p$p2),g_lab1,a_lab1,ut_lab1,act_lab1,norm_log(dis_lab1),ct_lab1,rt_lab1,ctr_lab1,rtr_lab1,err_lab1,cer_lab1,actq1_lab1,actq2_lab1,actq3_lab1,mean(qg$_lab1),max(qat$_lab1),mean(qact$_lab1),mean(qavt$_lab1),max(qme$_lab1),max(qmce$_lab1),mean(qmsr$_lab1),mean(qc$_lab1),sum(qat$_lab1),norm_log(sum(qat$_lab1)),avgtime_lab1
0,2.0,7.0,1.0,52870.0,2144.0,1.0986,673.0,292.0,0.3139,0.1362,0.4118,0.5667,0.2096,0.2113,0.2129,1.0,11.0,137.8571,32.9762,9.0,9.0,0.8978,0.8764,30.0,3.434,71.4667
1,2.25,7.0,1.0,12418.0,3343.0,0.6931,291.0,752.0,0.087,0.2249,0.6471,0.4571,0.0081,0.0335,0.0357,1.0,13.0,226.0,70.2262,4.0,4.0,0.6594,0.8201,35.0,3.5835,95.5143
2,1.25,7.0,1.0,217028.0,7613.0,2.4849,261.0,1664.0,0.0343,0.2186,0.7727,0.4364,0.5266,0.6602,0.666,1.0,22.0,463.2857,71.4592,25.0,4.0,0.7856,0.6715,55.0,4.0254,138.4182
3,3.0,7.0,1.0,1925.0,1925.0,0.0,337.0,1595.0,0.1751,0.8286,0.5,0.4,0.0342,0.0352,0.0366,1.0,6.0,288.1429,88.6286,5.0,3.0,0.927,0.8275,25.0,3.2581,77.0
4,2.0,7.0,1.0,4792.0,2771.0,1.3863,881.0,651.0,0.3179,0.2349,0.5294,0.5312,0.6627,0.665,0.6678,1.0,13.0,222.0,46.158,9.0,9.0,0.9148,0.8259,32.0,3.4965,86.5938


In [None]:
datalab1.head()

In [None]:
#@title **Scale features**
 
# Scale features -------------------------------------------------
from sklearn.preprocessing import StandardScaler

scaler1 = StandardScaler()
scaler2 = StandardScaler()
scaler3 = StandardScaler()
scaler4 = StandardScaler()
scaler_all = StandardScaler()

datalab1 = datalab1[[TARGET]].join(pd.DataFrame(scaler1.fit_transform(datalab1), columns=datalab1.columns)[datalab1.columns[1:]])
datalab2 = datalab2[[TARGET]].join(pd.DataFrame(scaler2.fit_transform(datalab2), columns=datalab2.columns)[datalab2.columns[1:]])
datalab3 = datalab3[[TARGET]].join(pd.DataFrame(scaler3.fit_transform(datalab3), columns=datalab3.columns)[datalab3.columns[1:]])
datalab4 = datalab4[[TARGET]].join(pd.DataFrame(scaler4.fit_transform(datalab4), columns=datalab4.columns)[datalab4.columns[1:]])

In [None]:
#@title **Grid/Random-SearchCV process**
 
def run_process(dataset, grid_cv, target=TARGET):
    X, y = dataset.drop(target, axis=1), np.array(dataset[target])
   
    grid_cv.fit(X,y)
 
    try:
        print('R2-test-fit:', max(grid_cv.cv_results_['mean_test_score']))
    except:
        pass

    try:
        X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.33)
        grid_cv.best_estimator_.fit(X_train, y_train)
        print('R2-test', grid_cv.best_estimator_.score(X_test, y_test))
        print('MSE-test', metrics.mean_squared_error(y_test,grid_cv.best_estimator_.predict(X_test)))

        print('Best params:', grid_cv.best_params_)

        selected_features = X.columns[grid_cv.best_estimator_.steps[0][-1].get_support()]
        print('Selected features:', list(selected_features))

        return list(selected_features)
    except:
        return list(dataset.columns[1:])



---



In [None]:
#@title **SVR - Recursive Features Elimination**

from sklearn.svm import SVR

sel_estimator = SVR(kernel='linear')
selector = RFE(sel_estimator)
estimator = SVR()

pipe = Pipeline([
    ('sel', selector),
    ('est', estimator)
])

params = {
    'sel__n_features_to_select' : [5],
    'sel__step'                 : [1,2],
    'est__C'                    : [0.01,0.1,1],
    'est__gamma'                : ['scale','auto'],
    'est__kernel'               : ['linear','poly','rbf']
}

grid_svr = GridSearchCV(estimator=pipe,
                        param_grid=params,
                        scoring='r2',
                        verbose=1,
                        n_jobs=-1,
                        return_train_score=True,
                        cv=KFold(n_splits=5, shuffle=True))

datalab1

In [None]:
selected_features_svr_1 = run_process(datalab1,grid_svr)

In [None]:
selected_features_svr_1 = run_process(datalab1,grid_svr)

In [None]:
selected_features_svr_1 = run_process(datalab1,grid_svr)

In [None]:
selected_features_svr_1 = run_process(datalab1,grid_svr)

In [None]:
selected_features_svr_1 = run_process(datalab1,grid_svr)

In [None]:
selected_features_svr_1 = run_process(datalab1,grid_svr)

In [None]:
selected_features_svr_1 = run_process(datalab1,grid_svr)

In [None]:
selected_features_svr_1 = run_process(datalab1,grid_svr)

In [None]:
selected_features_svr_1 = run_process(datalab1,grid_svr)

In [None]:
selected_features_svr_1 = run_process(datalab1,grid_svr)



---



datalab2

In [None]:
selected_features_svr_2 = run_process(datalab2,grid_svr)

In [None]:
selected_features_svr_2 = run_process(datalab2,grid_svr)

In [None]:
selected_features_svr_2 = run_process(datalab2,grid_svr)

In [None]:
selected_features_svr_2 = run_process(datalab2,grid_svr)

In [None]:
selected_features_svr_2 = run_process(datalab2,grid_svr)

In [None]:
selected_features_svr_2 = run_process(datalab2,grid_svr)

In [None]:
selected_features_svr_2 = run_process(datalab2,grid_svr)

In [None]:
selected_features_svr_2 = run_process(datalab2,grid_svr)

In [None]:
selected_features_svr_2 = run_process(datalab2,grid_svr)

In [None]:
selected_features_svr_2 = run_process(datalab2,grid_svr)



---



datalab3

In [None]:
selected_features_svr_3 = run_process(datalab3,grid_svr)

In [None]:
selected_features_svr_3 = run_process(datalab3,grid_svr)

In [None]:
selected_features_svr_3 = run_process(datalab3,grid_svr)

In [None]:
selected_features_svr_3 = run_process(datalab3,grid_svr)

In [None]:
selected_features_svr_3 = run_process(datalab3,grid_svr)

In [None]:
selected_features_svr_3 = run_process(datalab3,grid_svr)

In [None]:
selected_features_svr_3 = run_process(datalab3,grid_svr)

In [None]:
selected_features_svr_3 = run_process(datalab3,grid_svr)

In [None]:
selected_features_svr_3 = run_process(datalab3,grid_svr)

In [None]:
selected_features_svr_3 = run_process(datalab3,grid_svr)



---



datalab4

In [None]:
selected_features_svr_4 = run_process(datalab4,grid_svr)

In [None]:
selected_features_svr_4 = run_process(datalab4,grid_svr)

In [None]:
selected_features_svr_4 = run_process(datalab4,grid_svr)

In [None]:
selected_features_svr_4 = run_process(datalab4,grid_svr)

In [None]:
selected_features_svr_4 = run_process(datalab4,grid_svr)

In [None]:
selected_features_svr_4 = run_process(datalab4,grid_svr)

In [None]:
selected_features_svr_4 = run_process(datalab4,grid_svr)

In [None]:
selected_features_svr_4 = run_process(datalab4,grid_svr)

In [None]:
selected_features_svr_4 = run_process(datalab4,grid_svr)

In [None]:
selected_features_svr_4 = run_process(datalab4,grid_svr)



---



In [None]:
estimator = SVR()

params = {
    'C'         : [0.01,0.1,1],
    'gamma'     : ['scale','auto'],
    'kernel'    : ['linear','poly','rbf']
}

grid_svr = GridSearchCV(estimator=estimator,
                        param_grid=params,
                        scoring='r2',
                        verbose=1,
                        n_jobs=-1,
                        return_train_score=True,
                        cv=KFold(n_splits=5, shuffle=True))

In [3]:
selected_features_svr_1 = ['mean(qmsr$_lab1)','actq2_lab1','actq3_lab1','mean(qg$_lab1)','actq1_lab1']
selected_features_svr_2 = ['max(qat$_lab2)','mean(qact$_lab2)','mean(qmsr$_lab2)','g_lab2','actq1_lab2']
selected_features_svr_3 = ['g_lab3','mean(qmsr$_lab3)','act_lab3','mean(qact$_lab3)','avgtime_lab3']
selected_features_svr_4 = ['max(qat$_lab4)','err_lab4','mean(qact$_lab4)','cer_lab4','rt_lab4']

datalab1_2

In [4]:
dataset = datalab1[[TARGET] + selected_features_svr_1].join(datalab2[selected_features_svr_2])
run_process(dataset,grid_svr)

NameError: name 'datalab1' is not defined

In [5]:
dataset = datalab1[[TARGET] + selected_features_svr_1].join(datalab2[selected_features_svr_2])
run_process(dataset,grid_svr)

NameError: name 'datalab1' is not defined

In [6]:
dataset = datalab1[[TARGET] + selected_features_svr_1].join(datalab2[selected_features_svr_2])
run_process(dataset,grid_svr)

NameError: name 'datalab1' is not defined

In [7]:
dataset = datalab1[[TARGET] + selected_features_svr_1].join(datalab2[selected_features_svr_2])
run_process(dataset,grid_svr)

NameError: name 'datalab1' is not defined

In [8]:
dataset = datalab1[[TARGET] + selected_features_svr_1].join(datalab2[selected_features_svr_2])
run_process(dataset,grid_svr)

NameError: name 'datalab1' is not defined

In [9]:
dataset = datalab1[[TARGET] + selected_features_svr_1].join(datalab2[selected_features_svr_2])
run_process(dataset,grid_svr)

NameError: name 'datalab1' is not defined

In [10]:
dataset = datalab1[[TARGET] + selected_features_svr_1].join(datalab2[selected_features_svr_2])
run_process(dataset,grid_svr)

NameError: name 'datalab1' is not defined

In [11]:
dataset = datalab1[[TARGET] + selected_features_svr_1].join(datalab2[selected_features_svr_2])
run_process(dataset,grid_svr)

NameError: name 'datalab1' is not defined

In [12]:
dataset = datalab1[[TARGET] + selected_features_svr_1].join(datalab2[selected_features_svr_2])
run_process(dataset,grid_svr)

NameError: name 'datalab1' is not defined

In [13]:
dataset = datalab1[[TARGET] + selected_features_svr_1].join(datalab2[selected_features_svr_2])
run_process(dataset,grid_svr)

NameError: name 'datalab1' is not defined



---



datalab1_2_3

In [14]:
dataset = datalab1[[TARGET] + selected_features_svr_1].join(datalab2[selected_features_svr_2]).join(datalab3[selected_features_svr_3])
run_process(dataset,grid_svr)

NameError: name 'datalab1' is not defined

In [15]:
dataset = datalab1[[TARGET] + selected_features_svr_1].join(datalab2[selected_features_svr_2]).join(datalab3[selected_features_svr_3])
run_process(dataset,grid_svr)

NameError: name 'datalab1' is not defined

In [16]:
dataset = datalab1[[TARGET] + selected_features_svr_1].join(datalab2[selected_features_svr_2]).join(datalab3[selected_features_svr_3])
run_process(dataset,grid_svr)

NameError: name 'datalab1' is not defined

In [17]:
dataset = datalab1[[TARGET] + selected_features_svr_1].join(datalab2[selected_features_svr_2]).join(datalab3[selected_features_svr_3])
run_process(dataset,grid_svr)

NameError: name 'datalab1' is not defined

In [18]:
dataset = datalab1[[TARGET] + selected_features_svr_1].join(datalab2[selected_features_svr_2]).join(datalab3[selected_features_svr_3])
run_process(dataset,grid_svr)

NameError: name 'datalab1' is not defined

In [19]:
dataset = datalab1[[TARGET] + selected_features_svr_1].join(datalab2[selected_features_svr_2]).join(datalab3[selected_features_svr_3])
run_process(dataset,grid_svr)

NameError: name 'datalab1' is not defined

In [20]:
dataset = datalab1[[TARGET] + selected_features_svr_1].join(datalab2[selected_features_svr_2]).join(datalab3[selected_features_svr_3])
run_process(dataset,grid_svr)

NameError: name 'datalab1' is not defined

In [21]:
dataset = datalab1[[TARGET] + selected_features_svr_1].join(datalab2[selected_features_svr_2]).join(datalab3[selected_features_svr_3])
run_process(dataset,grid_svr)

NameError: name 'datalab1' is not defined

In [22]:
dataset = datalab1[[TARGET] + selected_features_svr_1].join(datalab2[selected_features_svr_2]).join(datalab3[selected_features_svr_3])
run_process(dataset,grid_svr)

NameError: name 'datalab1' is not defined

In [23]:
dataset = datalab1[[TARGET] + selected_features_svr_1].join(datalab2[selected_features_svr_2]).join(datalab3[selected_features_svr_3])
run_process(dataset,grid_svr)

NameError: name 'datalab1' is not defined

datalab1_2_3_4

In [24]:
dataset = datalab1[[TARGET] + selected_features_svr_1].join(datalab2[selected_features_svr_2]).join(datalab3[selected_features_svr_3]).join(datalab4[selected_features_svr_4])
run_process(dataset,grid_svr)

NameError: name 'datalab1' is not defined

In [25]:
dataset = datalab1[[TARGET] + selected_features_svr_1].join(datalab2[selected_features_svr_2]).join(datalab3[selected_features_svr_3]).join(datalab4[selected_features_svr_4])
run_process(dataset,grid_svr)

NameError: name 'datalab1' is not defined

In [26]:
dataset = datalab1[[TARGET] + selected_features_svr_1].join(datalab2[selected_features_svr_2]).join(datalab3[selected_features_svr_3]).join(datalab4[selected_features_svr_4])
run_process(dataset,grid_svr)

NameError: name 'datalab1' is not defined

In [27]:
dataset = datalab1[[TARGET] + selected_features_svr_1].join(datalab2[selected_features_svr_2]).join(datalab3[selected_features_svr_3]).join(datalab4[selected_features_svr_4])
run_process(dataset,grid_svr)

NameError: name 'datalab1' is not defined

In [28]:
dataset = datalab1[[TARGET] + selected_features_svr_1].join(datalab2[selected_features_svr_2]).join(datalab3[selected_features_svr_3]).join(datalab4[selected_features_svr_4])
run_process(dataset,grid_svr)

NameError: name 'datalab1' is not defined

In [29]:
dataset = datalab1[[TARGET] + selected_features_svr_1].join(datalab2[selected_features_svr_2]).join(datalab3[selected_features_svr_3]).join(datalab4[selected_features_svr_4])
run_process(dataset,grid_svr)

NameError: name 'datalab1' is not defined

In [30]:
dataset = datalab1[[TARGET] + selected_features_svr_1].join(datalab2[selected_features_svr_2]).join(datalab3[selected_features_svr_3]).join(datalab4[selected_features_svr_4])
run_process(dataset,grid_svr)

NameError: name 'datalab1' is not defined

In [31]:
dataset = datalab1[[TARGET] + selected_features_svr_1].join(datalab2[selected_features_svr_2]).join(datalab3[selected_features_svr_3]).join(datalab4[selected_features_svr_4])
run_process(dataset,grid_svr)

NameError: name 'datalab1' is not defined

In [32]:
dataset = datalab1[[TARGET] + selected_features_svr_1].join(datalab2[selected_features_svr_2]).join(datalab3[selected_features_svr_3]).join(datalab4[selected_features_svr_4])
run_process(dataset,grid_svr)

NameError: name 'datalab1' is not defined

In [33]:
dataset = datalab1[[TARGET] + selected_features_svr_1].join(datalab2[selected_features_svr_2]).join(datalab3[selected_features_svr_3]).join(datalab4[selected_features_svr_4])
run_process(dataset,grid_svr)

NameError: name 'datalab1' is not defined



---



In [34]:
dataset = datalab1[[TARGET] + selected_features_svr_1].join(datalab2[selected_features_svr_2]).join(datalab3[selected_features_svr_3]).join(datalab4[selected_features_svr_4])
run_process(dataset,grid_svr)

NameError: name 'datalab1' is not defined

Plots

In [35]:
dataset = datalab1[[TARGET] + selected_features_svr_1].join(datalab2[selected_features_svr_2]).join(datalab3[selected_features_svr_3]).join(datalab4[selected_features_svr_4])
X, y = dataset.drop(TARGET, axis=1), np.array(dataset[TARGET])
X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.33)
 
y_pred = grid_svr.best_estimator_.predict(X_test)

print('R2', grid_svr.score(X_test,y_test))

import matplotlib.pyplot as plt

z = [0,7]

plt.plot(y_test, y_pred, 'ro', z, z)
plt.xlabel('y_true')
plt.ylabel('y_pred')
plt.show()

NameError: name 'datalab1' is not defined



---



In [36]:
#@title **Random Forest Regressor**
 
from sklearn.ensemble import  RandomForestRegressor
 
# GradientBoostingRegressor / RandomForestRegressor / SVR(kernel='linear')
sel_estimator = GradientBoostingRegressor(random_state=random_state)
 
# RFE / SelectFromModel
selector = RFE(sel_estimator)
estimator = RandomForestRegressor(random_state=random_state, n_jobs=-1)
 
pipe = Pipeline([
    ('sel', selector),
    ('est', estimator)
])
 
params = {
    'sel__estimator__learning_rate': [0.05,0.1,0.2],
    'sel__n_features_to_select'    : [5],
    'est__n_estimators'            : [50,100,200,400],
    'est__criterion'               : ['mse','mae'],
    'est__max_features'            : ['auto','sqrt','log2']
}
 
grid_rfr = GridSearchCV(estimator=pipe,
                        param_grid=params,
                        scoring='r2',
                        verbose=1,
                        n_jobs=-1,
                        return_train_score=True,
                        cv=KFold(n_splits=5, shuffle=True))

NameError: name 'GradientBoostingRegressor' is not defined

datalab1

In [37]:
selected_features_rfr_1 = run_process(datalab1,grid_rfr)

NameError: name 'run_process' is not defined

In [38]:
selected_features_rfr_1 = run_process(datalab1,grid_rfr)

NameError: name 'run_process' is not defined

In [39]:
selected_features_rfr_1 = run_process(datalab1,grid_rfr)

NameError: name 'run_process' is not defined

In [40]:
selected_features_rfr_1 = run_process(datalab1,grid_rfr)

NameError: name 'run_process' is not defined

In [41]:
selected_features_rfr_1 = run_process(datalab1,grid_rfr)

NameError: name 'run_process' is not defined

In [42]:
selected_features_rfr_1 = run_process(datalab1,grid_rfr)

NameError: name 'run_process' is not defined

In [43]:
selected_features_rfr_1 = run_process(datalab1,grid_rfr)

NameError: name 'run_process' is not defined

In [44]:
selected_features_rfr_1 = run_process(datalab1,grid_rfr)

NameError: name 'run_process' is not defined

In [45]:
selected_features_rfr_1 = run_process(datalab1,grid_rfr)

NameError: name 'run_process' is not defined



---



datalab2

In [46]:
selected_features_rfr_2 = run_process(datalab2,grid_rfr)

NameError: name 'run_process' is not defined

In [47]:
selected_features_rfr_2 = run_process(datalab2,grid_rfr)

NameError: name 'run_process' is not defined

In [48]:
selected_features_rfr_2 = run_process(datalab2,grid_rfr)

NameError: name 'run_process' is not defined

In [49]:
selected_features_rfr_2 = run_process(datalab2,grid_rfr)

NameError: name 'run_process' is not defined

In [50]:
selected_features_rfr_2 = run_process(datalab2,grid_rfr)

NameError: name 'run_process' is not defined

In [51]:
selected_features_rfr_2 = run_process(datalab2,grid_rfr)

NameError: name 'run_process' is not defined

In [52]:
selected_features_rfr_2 = run_process(datalab2,grid_rfr)

NameError: name 'run_process' is not defined

In [53]:
selected_features_rfr_2 = run_process(datalab2,grid_rfr)

NameError: name 'run_process' is not defined

In [54]:
selected_features_rfr_2 = run_process(datalab2,grid_rfr)

NameError: name 'run_process' is not defined



---



datalab3

In [55]:
selected_features_rfr_3 = run_process(datalab3,grid_rfr)

NameError: name 'run_process' is not defined

In [56]:
selected_features_rfr_3 = run_process(datalab3,grid_rfr)

NameError: name 'run_process' is not defined

In [57]:
selected_features_rfr_3 = run_process(datalab3,grid_rfr)

NameError: name 'run_process' is not defined

In [58]:
selected_features_rfr_3 = run_process(datalab3,grid_rfr)

NameError: name 'run_process' is not defined

In [59]:
selected_features_rfr_3 = run_process(datalab3,grid_rfr)

NameError: name 'run_process' is not defined

In [60]:
selected_features_rfr_3 = run_process(datalab3,grid_rfr)

NameError: name 'run_process' is not defined

In [61]:
selected_features_rfr_3 = run_process(datalab3,grid_rfr)

NameError: name 'run_process' is not defined

In [62]:
selected_features_rfr_3 = run_process(datalab3,grid_rfr)

NameError: name 'run_process' is not defined

In [63]:
selected_features_rfr_3 = run_process(datalab3,grid_rfr)

NameError: name 'run_process' is not defined



---



datalab4

In [64]:
selected_features_rfr_4 = run_process(datalab4,grid_rfr)

NameError: name 'run_process' is not defined

In [65]:
selected_features_rfr_4 = run_process(datalab4,grid_rfr)

NameError: name 'run_process' is not defined

In [66]:
selected_features_rfr_4 = run_process(datalab4,grid_rfr)

NameError: name 'run_process' is not defined

In [67]:
selected_features_rfr_4 = run_process(datalab4,grid_rfr)

NameError: name 'run_process' is not defined

In [68]:
selected_features_rfr_4 = run_process(datalab4,grid_rfr)

NameError: name 'run_process' is not defined

In [69]:
selected_features_rfr_4 = run_process(datalab4,grid_rfr)

NameError: name 'run_process' is not defined

In [70]:
selected_features_rfr_4 = run_process(datalab4,grid_rfr)

NameError: name 'run_process' is not defined

In [None]:
selected_features_rfr_4 = run_process(datalab4,grid_rfr)

Fitting 5 folds for each of 72 candidates, totalling 360 fits
R2-test-fit: 0.22962021285811343
R2-test 0.12255895240539283
MSE-test 2.3181107077752965
Best params: {'est__criterion': 'mae', 'est__max_features': 'log2', 'est__n_estimators': 400, 'sel__estimator__learning_rate': 0.2, 'sel__n_features_to_select': 5}
Selected features: ['g_lab4', 'rt_lab4', 'cer_lab4', 'actq1_lab4', 'mean(qavt$_lab4)']


In [None]:
selected_features_rfr_4 = run_process(datalab4,grid_rfr)

Fitting 5 folds for each of 72 candidates, totalling 360 fits
R2-test-fit: 0.2328573698162033
R2-test 0.07285905085094702
MSE-test 2.344858178063425
Best params: {'est__criterion': 'mse', 'est__max_features': 'sqrt', 'est__n_estimators': 200, 'sel__estimator__learning_rate': 0.2, 'sel__n_features_to_select': 5}
Selected features: ['rt_lab4', 'rtr_lab4', 'cer_lab4', 'actq2_lab4', 'mean(qavt$_lab4)']




---



In [None]:
estimator = RandomForestRegressor(random_state=random_state, n_jobs=-1)
 
params = {
    'n_estimators'  : [50,100,200,400],
    'criterion'     : ['mse','mae'],
    'max_features'  : ['auto','sqrt','log2']
}
 
grid_rfr = GridSearchCV(estimator=estimator,
                        param_grid=params,
                        scoring='r2',
                        verbose=1,
                        n_jobs=-1,
                        return_train_score=True,
                        cv=KFold(n_splits=5, shuffle=True))

datalab1_2

In [None]:
dataset = datalab1[[TARGET] + selected_features_rfr_1].join(datalab2[selected_features_rfr_2])
run_process(dataset,grid_rfr)

Fitting 5 folds for each of 24 candidates, totalling 120 fits
R2-test-fit: 0.06604780071295309
R2-test 0.026004780335071254
MSE-test 2.524526314360119
Best params: {'criterion': 'mse', 'max_features': 'sqrt', 'n_estimators': 400}


['rtr_lab1',
 'actq1_lab1',
 'actq3_lab1',
 'mean(qmsr$_lab1)',
 'mean(qc$_lab1)',
 'ut_lab2',
 'act_lab2',
 'actq1_lab2',
 'mean(qavt$_lab2)',
 'avgtime_lab2']

In [None]:
dataset = datalab1[[TARGET] + selected_features_rfr_1].join(datalab2[selected_features_rfr_2])
run_process(dataset,grid_rfr)

Fitting 5 folds for each of 24 candidates, totalling 120 fits
R2-test-fit: 0.08627640515217602
R2-test 0.02703867022351436
MSE-test 2.5726994944196426
Best params: {'criterion': 'mse', 'max_features': 'log2', 'n_estimators': 400}


['rtr_lab1',
 'actq1_lab1',
 'actq3_lab1',
 'mean(qmsr$_lab1)',
 'mean(qc$_lab1)',
 'ut_lab2',
 'act_lab2',
 'actq1_lab2',
 'mean(qavt$_lab2)',
 'avgtime_lab2']

In [None]:
dataset = datalab1[[TARGET] + selected_features_rfr_1].join(datalab2[selected_features_rfr_2])
run_process(dataset,grid_rfr)

Fitting 5 folds for each of 24 candidates, totalling 120 fits
R2-test-fit: 0.044900703937422626
R2-test 0.02379749008497123
MSE-test 2.814884295386905
Best params: {'criterion': 'mse', 'max_features': 'sqrt', 'n_estimators': 200}


['rtr_lab1',
 'actq1_lab1',
 'actq3_lab1',
 'mean(qmsr$_lab1)',
 'mean(qc$_lab1)',
 'ut_lab2',
 'act_lab2',
 'actq1_lab2',
 'mean(qavt$_lab2)',
 'avgtime_lab2']

In [None]:
dataset = datalab1[[TARGET] + selected_features_rfr_1].join(datalab2[selected_features_rfr_2])
run_process(dataset,grid_rfr)

Fitting 5 folds for each of 24 candidates, totalling 120 fits
R2-test-fit: 0.012245398443196432
R2-test 0.10801475843065234
MSE-test 2.0654830985863093
Best params: {'criterion': 'mae', 'max_features': 'sqrt', 'n_estimators': 400}


['rtr_lab1',
 'actq1_lab1',
 'actq3_lab1',
 'mean(qmsr$_lab1)',
 'mean(qc$_lab1)',
 'ut_lab2',
 'act_lab2',
 'actq1_lab2',
 'mean(qavt$_lab2)',
 'avgtime_lab2']

In [None]:
dataset = datalab1[[TARGET] + selected_features_rfr_1].join(datalab2[selected_features_rfr_2])
run_process(dataset,grid_rfr)

Fitting 5 folds for each of 24 candidates, totalling 120 fits
R2-test-fit: 0.07378431602592536
R2-test 0.13140791245439876
MSE-test 2.3593600357142863
Best params: {'criterion': 'mse', 'max_features': 'log2', 'n_estimators': 200}


['rtr_lab1',
 'actq1_lab1',
 'actq3_lab1',
 'mean(qmsr$_lab1)',
 'mean(qc$_lab1)',
 'ut_lab2',
 'act_lab2',
 'actq1_lab2',
 'mean(qavt$_lab2)',
 'avgtime_lab2']

In [None]:
dataset = datalab1[[TARGET] + selected_features_rfr_1].join(datalab2[selected_features_rfr_2])
run_process(dataset,grid_rfr)

Fitting 5 folds for each of 24 candidates, totalling 120 fits
R2-test-fit: 0.09630032960042967
R2-test 0.041967912360950654
MSE-test 2.568257824939599
Best params: {'criterion': 'mse', 'max_features': 'log2', 'n_estimators': 200}


['rtr_lab1',
 'actq1_lab1',
 'actq3_lab1',
 'mean(qmsr$_lab1)',
 'mean(qc$_lab1)',
 'ut_lab2',
 'act_lab2',
 'actq1_lab2',
 'mean(qavt$_lab2)',
 'avgtime_lab2']

In [None]:
dataset = datalab1[[TARGET] + selected_features_rfr_1].join(datalab2[selected_features_rfr_2])
run_process(dataset,grid_rfr)

Fitting 5 folds for each of 24 candidates, totalling 120 fits
R2-test-fit: 0.1015374122153107
R2-test 0.04347043552124441
MSE-test 2.1189285298226435
Best params: {'criterion': 'mse', 'max_features': 'log2', 'n_estimators': 100}


['rtr_lab1',
 'actq1_lab1',
 'actq3_lab1',
 'mean(qmsr$_lab1)',
 'mean(qc$_lab1)',
 'ut_lab2',
 'act_lab2',
 'actq1_lab2',
 'mean(qavt$_lab2)',
 'avgtime_lab2']

In [None]:
dataset = datalab1[[TARGET] + selected_features_rfr_1].join(datalab2[selected_features_rfr_2])
run_process(dataset,grid_rfr)

Fitting 5 folds for each of 24 candidates, totalling 120 fits
R2-test-fit: 0.12087841494931492
R2-test 0.17936315562725613
MSE-test 2.1027432218915343
Best params: {'criterion': 'mse', 'max_features': 'log2', 'n_estimators': 100}


['rtr_lab1',
 'actq1_lab1',
 'actq3_lab1',
 'mean(qmsr$_lab1)',
 'mean(qc$_lab1)',
 'ut_lab2',
 'act_lab2',
 'actq1_lab2',
 'mean(qavt$_lab2)',
 'avgtime_lab2']

In [None]:
dataset = datalab1[[TARGET] + selected_features_rfr_1].join(datalab2[selected_features_rfr_2])
run_process(dataset,grid_rfr)

Fitting 5 folds for each of 24 candidates, totalling 120 fits
R2-test-fit: 0.07467040985905342
R2-test 0.12036205639661901
MSE-test 2.622708284412203
Best params: {'criterion': 'mse', 'max_features': 'sqrt', 'n_estimators': 400}


['rtr_lab1',
 'actq1_lab1',
 'actq3_lab1',
 'mean(qmsr$_lab1)',
 'mean(qc$_lab1)',
 'ut_lab2',
 'act_lab2',
 'actq1_lab2',
 'mean(qavt$_lab2)',
 'avgtime_lab2']

datalab1_2_3

In [None]:
dataset = datalab1[[TARGET] + selected_features_rfr_1].join(datalab2[selected_features_rfr_2]).join(datalab3[selected_features_rfr_3])
run_process(dataset,grid_rfr)

Fitting 5 folds for each of 24 candidates, totalling 120 fits
R2-test-fit: 0.147755680573684
R2-test 0.11101195775792494
MSE-test 2.1909734583333336
Best params: {'criterion': 'mse', 'max_features': 'log2', 'n_estimators': 200}


['rtr_lab1',
 'actq1_lab1',
 'actq3_lab1',
 'mean(qmsr$_lab1)',
 'mean(qc$_lab1)',
 'ut_lab2',
 'act_lab2',
 'actq1_lab2',
 'mean(qavt$_lab2)',
 'avgtime_lab2',
 'act_lab3',
 'rt_lab3',
 'rtr_lab3',
 'cer_lab3',
 'actq2_lab3']

In [None]:
dataset = datalab1[[TARGET] + selected_features_rfr_1].join(datalab2[selected_features_rfr_2]).join(datalab3[selected_features_rfr_3])
run_process(dataset,grid_rfr)

Fitting 5 folds for each of 24 candidates, totalling 120 fits
R2-test-fit: 0.23312196068662475
R2-test 0.16639343504648263
MSE-test 1.9574121199776782
Best params: {'criterion': 'mse', 'max_features': 'log2', 'n_estimators': 400}


['rtr_lab1',
 'actq1_lab1',
 'actq3_lab1',
 'mean(qmsr$_lab1)',
 'mean(qc$_lab1)',
 'ut_lab2',
 'act_lab2',
 'actq1_lab2',
 'mean(qavt$_lab2)',
 'avgtime_lab2',
 'act_lab3',
 'rt_lab3',
 'rtr_lab3',
 'cer_lab3',
 'actq2_lab3']

In [None]:
dataset = datalab1[[TARGET] + selected_features_rfr_1].join(datalab2[selected_features_rfr_2]).join(datalab3[selected_features_rfr_3])
run_process(dataset,grid_rfr)

Fitting 5 folds for each of 24 candidates, totalling 120 fits
R2-test-fit: 0.18954187908887468
R2-test 0.21518411061840093
MSE-test 1.856312866071429
Best params: {'criterion': 'mae', 'max_features': 'log2', 'n_estimators': 200}


['rtr_lab1',
 'actq1_lab1',
 'actq3_lab1',
 'mean(qmsr$_lab1)',
 'mean(qc$_lab1)',
 'ut_lab2',
 'act_lab2',
 'actq1_lab2',
 'mean(qavt$_lab2)',
 'avgtime_lab2',
 'act_lab3',
 'rt_lab3',
 'rtr_lab3',
 'cer_lab3',
 'actq2_lab3']

In [None]:
dataset = datalab1[[TARGET] + selected_features_rfr_1].join(datalab2[selected_features_rfr_2]).join(datalab3[selected_features_rfr_3])
run_process(dataset,grid_rfr)

Fitting 5 folds for each of 24 candidates, totalling 120 fits
R2-test-fit: 0.17872261930104313
R2-test 0.19659789986313458
MSE-test 2.0733521309523812
Best params: {'criterion': 'mae', 'max_features': 'log2', 'n_estimators': 50}


['rtr_lab1',
 'actq1_lab1',
 'actq3_lab1',
 'mean(qmsr$_lab1)',
 'mean(qc$_lab1)',
 'ut_lab2',
 'act_lab2',
 'actq1_lab2',
 'mean(qavt$_lab2)',
 'avgtime_lab2',
 'act_lab3',
 'rt_lab3',
 'rtr_lab3',
 'cer_lab3',
 'actq2_lab3']

In [None]:
dataset = datalab1[[TARGET] + selected_features_rfr_1].join(datalab2[selected_features_rfr_2]).join(datalab3[selected_features_rfr_3])
run_process(dataset,grid_rfr)

Fitting 5 folds for each of 24 candidates, totalling 120 fits
R2-test-fit: 0.16326078507732564
R2-test 0.1070529117568152
MSE-test 2.3454449285714283
Best params: {'criterion': 'mae', 'max_features': 'log2', 'n_estimators': 200}


['rtr_lab1',
 'actq1_lab1',
 'actq3_lab1',
 'mean(qmsr$_lab1)',
 'mean(qc$_lab1)',
 'ut_lab2',
 'act_lab2',
 'actq1_lab2',
 'mean(qavt$_lab2)',
 'avgtime_lab2',
 'act_lab3',
 'rt_lab3',
 'rtr_lab3',
 'cer_lab3',
 'actq2_lab3']

In [None]:
dataset = datalab1[[TARGET] + selected_features_rfr_1].join(datalab2[selected_features_rfr_2]).join(datalab3[selected_features_rfr_3])
run_process(dataset,grid_rfr)

Fitting 5 folds for each of 24 candidates, totalling 120 fits
R2-test-fit: 0.22979258141937947
R2-test 0.05450215164382566
MSE-test 2.1140117857142857
Best params: {'criterion': 'mae', 'max_features': 'auto', 'n_estimators': 50}


['rtr_lab1',
 'actq1_lab1',
 'actq3_lab1',
 'mean(qmsr$_lab1)',
 'mean(qc$_lab1)',
 'ut_lab2',
 'act_lab2',
 'actq1_lab2',
 'mean(qavt$_lab2)',
 'avgtime_lab2',
 'act_lab3',
 'rt_lab3',
 'rtr_lab3',
 'cer_lab3',
 'actq2_lab3']

In [None]:
dataset = datalab1[[TARGET] + selected_features_rfr_1].join(datalab2[selected_features_rfr_2]).join(datalab3[selected_features_rfr_3])
run_process(dataset,grid_rfr)

Fitting 5 folds for each of 24 candidates, totalling 120 fits
R2-test-fit: 0.2266959597065262
R2-test 0.17635329040331338
MSE-test 2.440279833333333
Best params: {'criterion': 'mae', 'max_features': 'log2', 'n_estimators': 50}


['rtr_lab1',
 'actq1_lab1',
 'actq3_lab1',
 'mean(qmsr$_lab1)',
 'mean(qc$_lab1)',
 'ut_lab2',
 'act_lab2',
 'actq1_lab2',
 'mean(qavt$_lab2)',
 'avgtime_lab2',
 'act_lab3',
 'rt_lab3',
 'rtr_lab3',
 'cer_lab3',
 'actq2_lab3']

In [None]:
dataset = datalab1[[TARGET] + selected_features_rfr_1].join(datalab2[selected_features_rfr_2]).join(datalab3[selected_features_rfr_3])
run_process(dataset,grid_rfr)

Fitting 5 folds for each of 24 candidates, totalling 120 fits
R2-test-fit: 0.1929070812033978
R2-test 0.07222849524853003
MSE-test 2.462800424525669
Best params: {'criterion': 'mae', 'max_features': 'auto', 'n_estimators': 400}


['rtr_lab1',
 'actq1_lab1',
 'actq3_lab1',
 'mean(qmsr$_lab1)',
 'mean(qc$_lab1)',
 'ut_lab2',
 'act_lab2',
 'actq1_lab2',
 'mean(qavt$_lab2)',
 'avgtime_lab2',
 'act_lab3',
 'rt_lab3',
 'rtr_lab3',
 'cer_lab3',
 'actq2_lab3']

In [None]:
dataset = datalab1[[TARGET] + selected_features_rfr_1].join(datalab2[selected_features_rfr_2]).join(datalab3[selected_features_rfr_3])
run_process(dataset,grid_rfr)

Fitting 5 folds for each of 24 candidates, totalling 120 fits
R2-test-fit: 0.22221137930537044
R2-test 0.185845476731321
MSE-test 2.4747632120535714
Best params: {'criterion': 'mse', 'max_features': 'sqrt', 'n_estimators': 200}


['rtr_lab1',
 'actq1_lab1',
 'actq3_lab1',
 'mean(qmsr$_lab1)',
 'mean(qc$_lab1)',
 'ut_lab2',
 'act_lab2',
 'actq1_lab2',
 'mean(qavt$_lab2)',
 'avgtime_lab2',
 'act_lab3',
 'rt_lab3',
 'rtr_lab3',
 'cer_lab3',
 'actq2_lab3']

datalab1_2_3_4

In [None]:
dataset = datalab1[[TARGET] + selected_features_rfr_1].join(datalab2[selected_features_rfr_2]).join(datalab3[selected_features_rfr_3]).join(datalab4[selected_features_rfr_4])
run_process(dataset,grid_rfr)

Fitting 5 folds for each of 24 candidates, totalling 120 fits
R2-test-fit: 0.24157051987558145
R2-test 0.28403941560651547
MSE-test 2.0385483519345238
Best params: {'criterion': 'mse', 'max_features': 'sqrt', 'n_estimators': 200}


['rtr_lab1',
 'actq1_lab1',
 'actq3_lab1',
 'mean(qmsr$_lab1)',
 'mean(qc$_lab1)',
 'ut_lab2',
 'act_lab2',
 'actq1_lab2',
 'mean(qavt$_lab2)',
 'avgtime_lab2',
 'act_lab3',
 'rt_lab3',
 'rtr_lab3',
 'cer_lab3',
 'actq2_lab3',
 'rt_lab4',
 'rtr_lab4',
 'cer_lab4',
 'actq2_lab4',
 'mean(qavt$_lab4)']

In [None]:
dataset = datalab1[[TARGET] + selected_features_rfr_1].join(datalab2[selected_features_rfr_2]).join(datalab3[selected_features_rfr_3]).join(datalab4[selected_features_rfr_4])
run_process(dataset,grid_rfr)

Fitting 5 folds for each of 24 candidates, totalling 120 fits
R2-test-fit: 0.2385795855179619
R2-test 0.21906480046303567
MSE-test 1.8615210788690475
Best params: {'criterion': 'mse', 'max_features': 'log2', 'n_estimators': 200}


['rtr_lab1',
 'actq1_lab1',
 'actq3_lab1',
 'mean(qmsr$_lab1)',
 'mean(qc$_lab1)',
 'ut_lab2',
 'act_lab2',
 'actq1_lab2',
 'mean(qavt$_lab2)',
 'avgtime_lab2',
 'act_lab3',
 'rt_lab3',
 'rtr_lab3',
 'cer_lab3',
 'actq2_lab3',
 'rt_lab4',
 'rtr_lab4',
 'cer_lab4',
 'actq2_lab4',
 'mean(qavt$_lab4)']

In [None]:
dataset = datalab1[[TARGET] + selected_features_rfr_1].join(datalab2[selected_features_rfr_2]).join(datalab3[selected_features_rfr_3]).join(datalab4[selected_features_rfr_4])
run_process(dataset,grid_rfr)

Fitting 5 folds for each of 24 candidates, totalling 120 fits
R2-test-fit: 0.26342413041983814
R2-test 0.23640285688539042
MSE-test 2.224716901041667
Best params: {'criterion': 'mse', 'max_features': 'sqrt', 'n_estimators': 200}


['rtr_lab1',
 'actq1_lab1',
 'actq3_lab1',
 'mean(qmsr$_lab1)',
 'mean(qc$_lab1)',
 'ut_lab2',
 'act_lab2',
 'actq1_lab2',
 'mean(qavt$_lab2)',
 'avgtime_lab2',
 'act_lab3',
 'rt_lab3',
 'rtr_lab3',
 'cer_lab3',
 'actq2_lab3',
 'rt_lab4',
 'rtr_lab4',
 'cer_lab4',
 'actq2_lab4',
 'mean(qavt$_lab4)']

In [None]:
dataset = datalab1[[TARGET] + selected_features_rfr_1].join(datalab2[selected_features_rfr_2]).join(datalab3[selected_features_rfr_3]).join(datalab4[selected_features_rfr_4])
run_process(dataset,grid_rfr)

Fitting 5 folds for each of 24 candidates, totalling 120 fits
R2-test-fit: 0.24383929926131126
R2-test 0.3592372346008387
MSE-test 1.6555896383928579
Best params: {'criterion': 'mse', 'max_features': 'sqrt', 'n_estimators': 400}


['rtr_lab1',
 'actq1_lab1',
 'actq3_lab1',
 'mean(qmsr$_lab1)',
 'mean(qc$_lab1)',
 'ut_lab2',
 'act_lab2',
 'actq1_lab2',
 'mean(qavt$_lab2)',
 'avgtime_lab2',
 'act_lab3',
 'rt_lab3',
 'rtr_lab3',
 'cer_lab3',
 'actq2_lab3',
 'rt_lab4',
 'rtr_lab4',
 'cer_lab4',
 'actq2_lab4',
 'mean(qavt$_lab4)']

In [None]:
dataset = datalab1[[TARGET] + selected_features_rfr_1].join(datalab2[selected_features_rfr_2]).join(datalab3[selected_features_rfr_3]).join(datalab4[selected_features_rfr_4])
run_process(dataset,grid_rfr)

Fitting 5 folds for each of 24 candidates, totalling 120 fits
R2-test-fit: 0.27462749202242304
R2-test 0.2864586534738772
MSE-test 1.9060561703869052
Best params: {'criterion': 'mse', 'max_features': 'sqrt', 'n_estimators': 400}


['rtr_lab1',
 'actq1_lab1',
 'actq3_lab1',
 'mean(qmsr$_lab1)',
 'mean(qc$_lab1)',
 'ut_lab2',
 'act_lab2',
 'actq1_lab2',
 'mean(qavt$_lab2)',
 'avgtime_lab2',
 'act_lab3',
 'rt_lab3',
 'rtr_lab3',
 'cer_lab3',
 'actq2_lab3',
 'rt_lab4',
 'rtr_lab4',
 'cer_lab4',
 'actq2_lab4',
 'mean(qavt$_lab4)']

In [None]:
dataset = datalab1[[TARGET] + selected_features_rfr_1].join(datalab2[selected_features_rfr_2]).join(datalab3[selected_features_rfr_3]).join(datalab4[selected_features_rfr_4])
run_process(dataset,grid_rfr)

Fitting 5 folds for each of 24 candidates, totalling 120 fits
R2-test-fit: 0.23339601674518978
R2-test 0.16670798002677523
MSE-test 2.1195481071428572
Best params: {'criterion': 'mse', 'max_features': 'sqrt', 'n_estimators': 50}


['rtr_lab1',
 'actq1_lab1',
 'actq3_lab1',
 'mean(qmsr$_lab1)',
 'mean(qc$_lab1)',
 'ut_lab2',
 'act_lab2',
 'actq1_lab2',
 'mean(qavt$_lab2)',
 'avgtime_lab2',
 'act_lab3',
 'rt_lab3',
 'rtr_lab3',
 'cer_lab3',
 'actq2_lab3',
 'rt_lab4',
 'rtr_lab4',
 'cer_lab4',
 'actq2_lab4',
 'mean(qavt$_lab4)']

In [None]:
dataset = datalab1[[TARGET] + selected_features_rfr_1].join(datalab2[selected_features_rfr_2]).join(datalab3[selected_features_rfr_3]).join(datalab4[selected_features_rfr_4])
run_process(dataset,grid_rfr)

Fitting 5 folds for each of 24 candidates, totalling 120 fits
R2-test-fit: 0.2245456730943573
R2-test 0.3165732191338049
MSE-test 1.9219487068452379
Best params: {'criterion': 'mse', 'max_features': 'sqrt', 'n_estimators': 400}


['rtr_lab1',
 'actq1_lab1',
 'actq3_lab1',
 'mean(qmsr$_lab1)',
 'mean(qc$_lab1)',
 'ut_lab2',
 'act_lab2',
 'actq1_lab2',
 'mean(qavt$_lab2)',
 'avgtime_lab2',
 'act_lab3',
 'rt_lab3',
 'rtr_lab3',
 'cer_lab3',
 'actq2_lab3',
 'rt_lab4',
 'rtr_lab4',
 'cer_lab4',
 'actq2_lab4',
 'mean(qavt$_lab4)']

In [None]:
dataset = datalab1[[TARGET] + selected_features_rfr_1].join(datalab2[selected_features_rfr_2]).join(datalab3[selected_features_rfr_3]).join(datalab4[selected_features_rfr_4])
run_process(dataset,grid_rfr)

Fitting 5 folds for each of 24 candidates, totalling 120 fits
R2-test-fit: 0.25409295192745696
R2-test 0.14114809115218596
MSE-test 1.8609197470238104
Best params: {'criterion': 'mse', 'max_features': 'log2', 'n_estimators': 100}


['rtr_lab1',
 'actq1_lab1',
 'actq3_lab1',
 'mean(qmsr$_lab1)',
 'mean(qc$_lab1)',
 'ut_lab2',
 'act_lab2',
 'actq1_lab2',
 'mean(qavt$_lab2)',
 'avgtime_lab2',
 'act_lab3',
 'rt_lab3',
 'rtr_lab3',
 'cer_lab3',
 'actq2_lab3',
 'rt_lab4',
 'rtr_lab4',
 'cer_lab4',
 'actq2_lab4',
 'mean(qavt$_lab4)']

In [None]:
dataset = datalab1[[TARGET] + selected_features_rfr_1].join(datalab2[selected_features_rfr_2]).join(datalab3[selected_features_rfr_3]).join(datalab4[selected_features_rfr_4])
run_process(dataset,grid_rfr)

Fitting 5 folds for each of 24 candidates, totalling 120 fits
R2-test-fit: 0.22610258825938678
R2-test 0.29629842289854136
MSE-test 1.81886213374256
Best params: {'criterion': 'mse', 'max_features': 'log2', 'n_estimators': 400}


['rtr_lab1',
 'actq1_lab1',
 'actq3_lab1',
 'mean(qmsr$_lab1)',
 'mean(qc$_lab1)',
 'ut_lab2',
 'act_lab2',
 'actq1_lab2',
 'mean(qavt$_lab2)',
 'avgtime_lab2',
 'act_lab3',
 'rt_lab3',
 'rtr_lab3',
 'cer_lab3',
 'actq2_lab3',
 'rt_lab4',
 'rtr_lab4',
 'cer_lab4',
 'actq2_lab4',
 'mean(qavt$_lab4)']



---



In [None]:
#@title **Linear Regression**

from sklearn.linear_model import LinearRegression
 
# GradientBoostingRegressor / RandomForestRegressor / SVR(kernel='linear')
sel_estimator = GradientBoostingRegressor(random_state=random_state)
 
# RFE / SelectFromModel
selector = RFE(sel_estimator)
estimator = LinearRegression()

pipe = Pipeline([
    ('sel', selector),
    ('est', estimator)
])
 
# params = {'est__n_jobs': [-1], 
#           'est__normalize': [True], 
#           'sel__estimator__learning_rate': [0.1], 
#           'sel__estimator__n_estimators': [100], 
#           'sel__max_features': [10], 
#           'sel__prefit': [False]}

params = {
    'sel__n_features_to_select' : [5],
    'sel__step'                 : [1,2],
    'est__n_jobs'               : [-1],
}
 
grid_lr = GridSearchCV(estimator=pipe,
                       param_grid=params,
                       scoring='r2',
                       verbose=1,
                       n_jobs=-1,
                       return_train_score=True,
                       cv=KFold(n_splits=5, shuffle=True))

In [None]:
selected_features_lr_1 = run_process(datalab1,grid_lr)

Fitting 5 folds for each of 2 candidates, totalling 10 fits


[Parallel(n_jobs=-1)]: Using backend LokyBackend with 2 concurrent workers.
[Parallel(n_jobs=-1)]: Done  10 out of  10 | elapsed:   12.5s finished


R2-test-fit: 0.02811225355053535
R2-test 0.032558596746795065
MSE-test 2.5196610989325885
Best params: {'est__n_jobs': -1, 'sel__n_features_to_select': 5, 'sel__step': 1}
Selected features: ['ut_lab1', 'actq1_lab1', 'actq3_lab1', 'mean(qmsr$_lab1)', 'avgtime_lab1']


In [None]:
selected_features_lr_1 = run_process(datalab1,grid_lr)

Fitting 5 folds for each of 2 candidates, totalling 10 fits
R2-test-fit: 0.03897143860883288
R2-test 0.004269003431778162
MSE-test 2.417052323166249
Best params: {'est__n_jobs': -1, 'sel__n_features_to_select': 5, 'sel__step': 1}
Selected features: ['ctr_lab1', 'rtr_lab1', 'actq1_lab1', 'actq3_lab1', 'mean(qmsr$_lab1)']


In [None]:
selected_features_lr_1 = run_process(datalab1,grid_lr)

Fitting 5 folds for each of 2 candidates, totalling 10 fits
R2-test-fit: 0.01836910463115362
R2-test -0.0351778738876205
MSE-test 2.087744784828418
Best params: {'est__n_jobs': -1, 'sel__n_features_to_select': 5, 'sel__step': 1}
Selected features: ['act_lab1', 'rtr_lab1', 'actq3_lab1', 'mean(qmsr$_lab1)', 'mean(qc$_lab1)']


In [None]:
selected_features_lr_1 = run_process(datalab1,grid_lr)

Fitting 5 folds for each of 2 candidates, totalling 10 fits
R2-test-fit: -0.016888356437965758
R2-test -0.072736786954678
MSE-test 2.3794821493071088
Best params: {'est__n_jobs': -1, 'sel__n_features_to_select': 5, 'sel__step': 1}
Selected features: ['rtr_lab1', 'cer_lab1', 'actq1_lab1', 'actq3_lab1', 'mean(qmsr$_lab1)']


In [None]:
selected_features_lr_1 = run_process(datalab1,grid_lr)

Fitting 5 folds for each of 2 candidates, totalling 10 fits
R2-test-fit: 0.031864327359388
R2-test -0.1664606626861289
MSE-test 2.7362078241077707
Best params: {'est__n_jobs': -1, 'sel__n_features_to_select': 5, 'sel__step': 1}
Selected features: ['rt_lab1', 'ctr_lab1', 'cer_lab1', 'actq1_lab1', 'actq3_lab1']


In [None]:
selected_features_lr_1 = run_process(datalab1,grid_lr)

Fitting 5 folds for each of 2 candidates, totalling 10 fits
R2-test-fit: -0.015313234783943197
R2-test -0.02341772855642965
MSE-test 3.108214716784758
Best params: {'est__n_jobs': -1, 'sel__n_features_to_select': 5, 'sel__step': 2}
Selected features: ['rt_lab1', 'ctr_lab1', 'actq1_lab1', 'actq3_lab1', 'avgtime_lab1']


In [None]:
selected_features_lr_1 = run_process(datalab1,grid_lr)

Fitting 5 folds for each of 2 candidates, totalling 10 fits
R2-test-fit: 0.0006082950578217616
R2-test -0.046412203405714836
MSE-test 2.188859717264865
Best params: {'est__n_jobs': -1, 'sel__n_features_to_select': 5, 'sel__step': 2}
Selected features: ['rt_lab1', 'rtr_lab1', 'cer_lab1', 'actq3_lab1', 'mean(qmsr$_lab1)']


In [None]:
selected_features_lr_1 = run_process(datalab1,grid_lr)

Fitting 5 folds for each of 2 candidates, totalling 10 fits
R2-test-fit: 0.01726029461881915
R2-test -0.161316514713018
MSE-test 2.583963808227975
Best params: {'est__n_jobs': -1, 'sel__n_features_to_select': 5, 'sel__step': 2}
Selected features: ['ct_lab1', 'actq1_lab1', 'actq3_lab1', 'mean(qavt$_lab1)', 'mean(qmsr$_lab1)']


In [None]:
selected_features_lr_1 = run_process(datalab1,grid_lr)

Fitting 5 folds for each of 2 candidates, totalling 10 fits
R2-test-fit: -0.07246426008578868
R2-test 0.044227075998590326
MSE-test 2.421602954766893
Best params: {'est__n_jobs': -1, 'sel__n_features_to_select': 5, 'sel__step': 1}
Selected features: ['cer_lab1', 'actq1_lab1', 'actq3_lab1', 'mean(qmsr$_lab1)', 'mean(qc$_lab1)']


In [None]:
selected_features_lr_1 = run_process(datalab1,grid_lr)

Fitting 5 folds for each of 2 candidates, totalling 10 fits
R2-test-fit: 0.01283722159498144
R2-test -0.01219173166213916
MSE-test 2.573386661691931
Best params: {'est__n_jobs': -1, 'sel__n_features_to_select': 5, 'sel__step': 1}
Selected features: ['ut_lab1', 'rtr_lab1', 'actq1_lab1', 'actq3_lab1', 'mean(qmsr$_lab1)']




---



In [None]:
selected_features_lr_2 = run_process(datalab2,grid_lr)

Fitting 5 folds for each of 2 candidates, totalling 10 fits


[Parallel(n_jobs=-1)]: Using backend LokyBackend with 2 concurrent workers.
[Parallel(n_jobs=-1)]: Done  10 out of  10 | elapsed:   12.8s finished


R2-test-fit: -0.018461526297947884
R2-test -0.01656735636802731
MSE-test 2.728017786168922
Best params: {'est__n_jobs': -1, 'sel__n_features_to_select': 5, 'sel__step': 2}
Selected features: ['actq1_lab2', 'actq3_lab2', 'mean(qact$_lab2)', 'mean(qavt$_lab2)', 'avgtime_lab2']


In [None]:
selected_features_lr_2 = run_process(datalab2,grid_lr)

Fitting 5 folds for each of 2 candidates, totalling 10 fits


[Parallel(n_jobs=-1)]: Using backend LokyBackend with 2 concurrent workers.
[Parallel(n_jobs=-1)]: Done  10 out of  10 | elapsed:   11.4s finished


R2-test-fit: -0.007773403567338933
R2-test 0.0021815699112528453
MSE-test 2.5931524128877563
Best params: {'est__n_jobs': -1, 'sel__n_features_to_select': 5, 'sel__step': 2}
Selected features: ['rt_lab2', 'actq1_lab2', 'actq3_lab2', 'mean(qavt$_lab2)', 'sum(qat$_lab2)']


In [None]:
selected_features_lr_2 = run_process(datalab2,grid_lr)

Fitting 5 folds for each of 2 candidates, totalling 10 fits


[Parallel(n_jobs=-1)]: Using backend LokyBackend with 2 concurrent workers.
[Parallel(n_jobs=-1)]: Done  10 out of  10 | elapsed:   11.4s finished


R2-test-fit: -0.05430646627827982
R2-test -0.004493133035586405
MSE-test 2.2068622310502883
Best params: {'est__n_jobs': -1, 'sel__n_features_to_select': 5, 'sel__step': 2}
Selected features: ['actq1_lab2', 'actq3_lab2', 'mean(qact$_lab2)', 'mean(qavt$_lab2)', 'mean(qmsr$_lab2)']


In [None]:
selected_features_lr_2 = run_process(datalab2,grid_lr)

Fitting 5 folds for each of 2 candidates, totalling 10 fits


[Parallel(n_jobs=-1)]: Using backend LokyBackend with 2 concurrent workers.
[Parallel(n_jobs=-1)]: Done  10 out of  10 | elapsed:   11.6s finished


R2-test-fit: -0.01116308943135631
R2-test -0.09358823440447739
MSE-test 2.8867796259404037
Best params: {'est__n_jobs': -1, 'sel__n_features_to_select': 5, 'sel__step': 1}
Selected features: ['ct_lab2', 'rt_lab2', 'actq1_lab2', 'actq3_lab2', 'mean(qmsr$_lab2)']


In [None]:
selected_features_lr_2 = run_process(datalab2,grid_lr)

Fitting 5 folds for each of 2 candidates, totalling 10 fits


[Parallel(n_jobs=-1)]: Using backend LokyBackend with 2 concurrent workers.
[Parallel(n_jobs=-1)]: Done  10 out of  10 | elapsed:   11.5s finished


R2-test-fit: -0.1206116023011315
R2-test -0.011551057319366675
MSE-test 2.3917258136634243
Best params: {'est__n_jobs': -1, 'sel__n_features_to_select': 5, 'sel__step': 1}
Selected features: ['rtr_lab2', 'actq1_lab2', 'actq3_lab2', 'mean(qact$_lab2)', 'avgtime_lab2']


In [None]:
selected_features_lr_2 = run_process(datalab2,grid_lr)

Fitting 5 folds for each of 2 candidates, totalling 10 fits


[Parallel(n_jobs=-1)]: Using backend LokyBackend with 2 concurrent workers.
[Parallel(n_jobs=-1)]: Done  10 out of  10 | elapsed:   11.4s finished


R2-test-fit: -0.02593232376933572
R2-test -0.0029205063247796925
MSE-test 2.783499546633971
Best params: {'est__n_jobs': -1, 'sel__n_features_to_select': 5, 'sel__step': 2}
Selected features: ['ut_lab2', 'rt_lab2', 'actq2_lab2', 'actq3_lab2', 'avgtime_lab2']


In [None]:
selected_features_lr_2 = run_process(datalab2,grid_lr)

Fitting 5 folds for each of 2 candidates, totalling 10 fits


[Parallel(n_jobs=-1)]: Using backend LokyBackend with 2 concurrent workers.
[Parallel(n_jobs=-1)]: Done  10 out of  10 | elapsed:   11.5s finished


R2-test-fit: -0.05192043074153698
R2-test -0.048880376819264715
MSE-test 2.768709730396985
Best params: {'est__n_jobs': -1, 'sel__n_features_to_select': 5, 'sel__step': 1}
Selected features: ['rt_lab2', 'rtr_lab2', 'actq1_lab2', 'mean(qavt$_lab2)', 'mean(qc$_lab2)']


In [None]:
selected_features_lr_2 = run_process(datalab2,grid_lr)

Fitting 5 folds for each of 2 candidates, totalling 10 fits


[Parallel(n_jobs=-1)]: Using backend LokyBackend with 2 concurrent workers.
[Parallel(n_jobs=-1)]: Done  10 out of  10 | elapsed:   11.6s finished


R2-test-fit: -0.0714844975712177
R2-test -0.055959025146244956
MSE-test 2.8695866093217424
Best params: {'est__n_jobs': -1, 'sel__n_features_to_select': 5, 'sel__step': 1}
Selected features: ['rtr_lab2', 'actq1_lab2', 'actq3_lab2', 'mean(qavt$_lab2)', 'avgtime_lab2']


In [None]:
selected_features_lr_2 = run_process(datalab2,grid_lr)

Fitting 5 folds for each of 2 candidates, totalling 10 fits


[Parallel(n_jobs=-1)]: Using backend LokyBackend with 2 concurrent workers.
[Parallel(n_jobs=-1)]: Done  10 out of  10 | elapsed:   11.5s finished


R2-test-fit: -0.0651951168662043
R2-test -0.01142981763075124
MSE-test 2.5371307013634965
Best params: {'est__n_jobs': -1, 'sel__n_features_to_select': 5, 'sel__step': 2}
Selected features: ['ct_lab2', 'rt_lab2', 'actq3_lab2', 'mean(qavt$_lab2)', 'mean(qmsr$_lab2)']


In [None]:
selected_features_lr_2 = run_process(datalab2,grid_lr)

Fitting 5 folds for each of 2 candidates, totalling 10 fits


[Parallel(n_jobs=-1)]: Using backend LokyBackend with 2 concurrent workers.
[Parallel(n_jobs=-1)]: Done  10 out of  10 | elapsed:   11.4s finished


R2-test-fit: 0.003965659978402014
R2-test -0.08150860925278214
MSE-test 2.5136932429176713
Best params: {'est__n_jobs': -1, 'sel__n_features_to_select': 5, 'sel__step': 1}
Selected features: ['act_lab2', 'actq1_lab2', 'actq3_lab2', 'mean(qmsr$_lab2)', 'avgtime_lab2']




---



In [None]:
selected_features_lr_3 = run_process(datalab3,grid_lr)

Fitting 5 folds for each of 2 candidates, totalling 10 fits


[Parallel(n_jobs=-1)]: Using backend LokyBackend with 2 concurrent workers.
[Parallel(n_jobs=-1)]: Done  10 out of  10 | elapsed:   12.3s finished


R2-test-fit: -0.018753894671260762
R2-test -0.036618679024586376
MSE-test 2.193674863056382
Best params: {'est__n_jobs': -1, 'sel__n_features_to_select': 5, 'sel__step': 2}
Selected features: ['ut_lab3', 'act_lab3', 'rt_lab3', 'actq1_lab3', 'mean(qc$_lab3)']


In [None]:
selected_features_lr_3 = run_process(datalab3,grid_lr)

Fitting 5 folds for each of 2 candidates, totalling 10 fits


[Parallel(n_jobs=-1)]: Using backend LokyBackend with 2 concurrent workers.
[Parallel(n_jobs=-1)]: Done  10 out of  10 | elapsed:   11.0s finished


R2-test-fit: -0.004440166709342819
R2-test 0.07991681328798839
MSE-test 2.146431435960078
Best params: {'est__n_jobs': -1, 'sel__n_features_to_select': 5, 'sel__step': 1}
Selected features: ['ut_lab3', 'rt_lab3', 'actq1_lab3', 'mean(qact$_lab3)', 'avgtime_lab3']


In [None]:
selected_features_lr_3 = run_process(datalab3,grid_lr)

Fitting 5 folds for each of 2 candidates, totalling 10 fits


[Parallel(n_jobs=-1)]: Using backend LokyBackend with 2 concurrent workers.
[Parallel(n_jobs=-1)]: Done  10 out of  10 | elapsed:   11.1s finished


R2-test-fit: 0.08125987552270511
R2-test 0.02573825965896326
MSE-test 2.117440735447757
Best params: {'est__n_jobs': -1, 'sel__n_features_to_select': 5, 'sel__step': 1}
Selected features: ['ut_lab3', 'rt_lab3', 'cer_lab3', 'actq1_lab3', 'mean(qmsr$_lab3)']


In [None]:
selected_features_lr_3 = run_process(datalab3,grid_lr)

Fitting 5 folds for each of 2 candidates, totalling 10 fits


[Parallel(n_jobs=-1)]: Using backend LokyBackend with 2 concurrent workers.
[Parallel(n_jobs=-1)]: Done  10 out of  10 | elapsed:   11.0s finished


R2-test-fit: 0.019140204136254724
R2-test 0.008802314475705342
MSE-test 2.6665279223885143
Best params: {'est__n_jobs': -1, 'sel__n_features_to_select': 5, 'sel__step': 2}
Selected features: ['ut_lab3', 'act_lab3', 'rt_lab3', 'err_lab3', 'actq1_lab3']


In [None]:
selected_features_lr_3 = run_process(datalab3,grid_lr)

Fitting 5 folds for each of 2 candidates, totalling 10 fits


[Parallel(n_jobs=-1)]: Using backend LokyBackend with 2 concurrent workers.
[Parallel(n_jobs=-1)]: Done  10 out of  10 | elapsed:   11.2s finished


R2-test-fit: 0.04813360498324746
R2-test -0.09553660911426132
MSE-test 2.561914534097449
Best params: {'est__n_jobs': -1, 'sel__n_features_to_select': 5, 'sel__step': 1}
Selected features: ['ut_lab3', 'rt_lab3', 'cer_lab3', 'actq1_lab3', 'mean(qact$_lab3)']


In [None]:
selected_features_lr_3 = run_process(datalab3,grid_lr)

Fitting 5 folds for each of 2 candidates, totalling 10 fits


[Parallel(n_jobs=-1)]: Using backend LokyBackend with 2 concurrent workers.
[Parallel(n_jobs=-1)]: Done  10 out of  10 | elapsed:   11.1s finished


R2-test-fit: 0.049884782524431494
R2-test -0.17097118403651224
MSE-test 2.7892198376738415
Best params: {'est__n_jobs': -1, 'sel__n_features_to_select': 5, 'sel__step': 2}
Selected features: ['ut_lab3', 'act_lab3', 'rt_lab3', 'rtr_lab3', 'actq1_lab3']


In [None]:
selected_features_lr_3 = run_process(datalab3,grid_lr)

Fitting 5 folds for each of 2 candidates, totalling 10 fits


[Parallel(n_jobs=-1)]: Using backend LokyBackend with 2 concurrent workers.
[Parallel(n_jobs=-1)]: Done  10 out of  10 | elapsed:   11.1s finished


R2-test-fit: 0.07901984112542626
R2-test 0.09808442468200484
MSE-test 2.466566218560531
Best params: {'est__n_jobs': -1, 'sel__n_features_to_select': 5, 'sel__step': 1}
Selected features: ['rt_lab3', 'cer_lab3', 'actq1_lab3', 'mean(qavt$_lab3)', 'avgtime_lab3']


In [None]:
selected_features_lr_3 = run_process(datalab3,grid_lr)

Fitting 5 folds for each of 2 candidates, totalling 10 fits


[Parallel(n_jobs=-1)]: Using backend LokyBackend with 2 concurrent workers.
[Parallel(n_jobs=-1)]: Done  10 out of  10 | elapsed:   11.2s finished


R2-test-fit: 0.0156938361456719
R2-test 0.24565067450876066
MSE-test 2.1057344436146046
Best params: {'est__n_jobs': -1, 'sel__n_features_to_select': 5, 'sel__step': 1}
Selected features: ['g_lab3', 'rt_lab3', 'actq2_lab3', 'mean(qact$_lab3)', 'mean(qmsr$_lab3)']


In [None]:
selected_features_lr_3 = run_process(datalab3,grid_lr)

Fitting 5 folds for each of 2 candidates, totalling 10 fits


[Parallel(n_jobs=-1)]: Using backend LokyBackend with 2 concurrent workers.
[Parallel(n_jobs=-1)]: Done  10 out of  10 | elapsed:   11.1s finished


R2-test-fit: 0.06193559239384365
R2-test 0.14678473679200843
MSE-test 2.2711414959040277
Best params: {'est__n_jobs': -1, 'sel__n_features_to_select': 5, 'sel__step': 1}
Selected features: ['ut_lab3', 'rt_lab3', 'err_lab3', 'actq1_lab3', 'avgtime_lab3']


In [None]:
selected_features_lr_3 = run_process(datalab3,grid_lr)

Fitting 5 folds for each of 2 candidates, totalling 10 fits


[Parallel(n_jobs=-1)]: Using backend LokyBackend with 2 concurrent workers.
[Parallel(n_jobs=-1)]: Done  10 out of  10 | elapsed:   11.2s finished


R2-test-fit: 0.09405118309763708
R2-test -0.0868456089935159
MSE-test 3.0897005932879864
Best params: {'est__n_jobs': -1, 'sel__n_features_to_select': 5, 'sel__step': 2}
Selected features: ['ut_lab3', 'cer_lab3', 'actq1_lab3', 'max(qat$_lab3)', 'mean(qact$_lab3)']




---



In [None]:
selected_features_lr_4 = run_process(datalab4,grid_lr)

Fitting 5 folds for each of 2 candidates, totalling 10 fits


[Parallel(n_jobs=-1)]: Using backend LokyBackend with 2 concurrent workers.
[Parallel(n_jobs=-1)]: Done  10 out of  10 | elapsed:   11.8s finished


R2-test-fit: 0.10961748103163853
R2-test -0.08406250297935403
MSE-test 2.714640536686722
Best params: {'est__n_jobs': -1, 'sel__n_features_to_select': 5, 'sel__step': 2}
Selected features: ['g_lab4', 'rt_lab4', 'rtr_lab4', 'err_lab4', 'mean(qmsr$_lab4)']


In [None]:
selected_features_lr_4 = run_process(datalab4,grid_lr)

Fitting 5 folds for each of 2 candidates, totalling 10 fits


[Parallel(n_jobs=-1)]: Using backend LokyBackend with 2 concurrent workers.
[Parallel(n_jobs=-1)]: Done  10 out of  10 | elapsed:   10.6s finished


R2-test-fit: 0.02417530486505002
R2-test 0.047913569472122
MSE-test 2.2944419405263337
Best params: {'est__n_jobs': -1, 'sel__n_features_to_select': 5, 'sel__step': 2}
Selected features: ['norm_log(dis_lab4)', 'rt_lab4', 'rtr_lab4', 'err_lab4', 'actq2_lab4']


In [None]:
selected_features_lr_4 = run_process(datalab4,grid_lr)

Fitting 5 folds for each of 2 candidates, totalling 10 fits


[Parallel(n_jobs=-1)]: Using backend LokyBackend with 2 concurrent workers.
[Parallel(n_jobs=-1)]: Done  10 out of  10 | elapsed:   10.4s finished


R2-test-fit: 0.14429264908363348
R2-test 0.17428692006586963
MSE-test 1.9188218608654248
Best params: {'est__n_jobs': -1, 'sel__n_features_to_select': 5, 'sel__step': 1}
Selected features: ['g_lab4', 'rt_lab4', 'err_lab4', 'cer_lab4', 'actq1_lab4']


In [None]:
selected_features_lr_4 = run_process(datalab4,grid_lr)

Fitting 5 folds for each of 2 candidates, totalling 10 fits


[Parallel(n_jobs=-1)]: Using backend LokyBackend with 2 concurrent workers.
[Parallel(n_jobs=-1)]: Done  10 out of  10 | elapsed:   10.4s finished


R2-test-fit: 0.04990210003970279
R2-test 0.1631059458143865
MSE-test 2.4667674636059678
Best params: {'est__n_jobs': -1, 'sel__n_features_to_select': 5, 'sel__step': 1}
Selected features: ['rt_lab4', 'cer_lab4', 'actq1_lab4', 'mean(qavt$_lab4)', 'sum(qat$_lab4)']


In [None]:
selected_features_lr_4 = run_process(datalab4,grid_lr)

Fitting 5 folds for each of 2 candidates, totalling 10 fits


[Parallel(n_jobs=-1)]: Using backend LokyBackend with 2 concurrent workers.
[Parallel(n_jobs=-1)]: Done  10 out of  10 | elapsed:   10.5s finished


R2-test-fit: 0.07181582605790733
R2-test 0.04539439920541622
MSE-test 2.4541102523239036
Best params: {'est__n_jobs': -1, 'sel__n_features_to_select': 5, 'sel__step': 1}
Selected features: ['act_lab4', 'rt_lab4', 'cer_lab4', 'actq1_lab4', 'mean(qc$_lab4)']


In [None]:
selected_features_lr_4 = run_process(datalab4,grid_lr)

Fitting 5 folds for each of 2 candidates, totalling 10 fits


[Parallel(n_jobs=-1)]: Using backend LokyBackend with 2 concurrent workers.
[Parallel(n_jobs=-1)]: Done  10 out of  10 | elapsed:   10.6s finished


R2-test-fit: 0.1378296418697363
R2-test 0.040238021597752915
MSE-test 1.9367207124060317
Best params: {'est__n_jobs': -1, 'sel__n_features_to_select': 5, 'sel__step': 1}
Selected features: ['g_lab4', 'rt_lab4', 'cer_lab4', 'mean(qavt$_lab4)', 'mean(qc$_lab4)']


In [None]:
selected_features_lr_4 = run_process(datalab4,grid_lr)

Fitting 5 folds for each of 2 candidates, totalling 10 fits


[Parallel(n_jobs=-1)]: Using backend LokyBackend with 2 concurrent workers.
[Parallel(n_jobs=-1)]: Done  10 out of  10 | elapsed:   10.5s finished


R2-test-fit: 0.17125830229583766
R2-test 0.18716368014853402
MSE-test 1.9397974171929793
Best params: {'est__n_jobs': -1, 'sel__n_features_to_select': 5, 'sel__step': 2}
Selected features: ['rt_lab4', 'rtr_lab4', 'err_lab4', 'cer_lab4', 'actq1_lab4']


In [None]:
selected_features_lr_4 = run_process(datalab4,grid_lr)

Fitting 5 folds for each of 2 candidates, totalling 10 fits


[Parallel(n_jobs=-1)]: Using backend LokyBackend with 2 concurrent workers.
[Parallel(n_jobs=-1)]: Done  10 out of  10 | elapsed:   10.5s finished


R2-test-fit: 0.15394968300004638
R2-test 0.22039316218095983
MSE-test 2.113539715414571
Best params: {'est__n_jobs': -1, 'sel__n_features_to_select': 5, 'sel__step': 1}
Selected features: ['rt_lab4', 'rtr_lab4', 'err_lab4', 'cer_lab4', 'mean(qc$_lab4)']


In [None]:
selected_features_lr_4 = run_process(datalab4,grid_lr)

Fitting 5 folds for each of 2 candidates, totalling 10 fits


[Parallel(n_jobs=-1)]: Using backend LokyBackend with 2 concurrent workers.
[Parallel(n_jobs=-1)]: Done  10 out of  10 | elapsed:   10.6s finished


R2-test-fit: -0.0032660208455336237
R2-test 0.17636202791941824
MSE-test 2.0575015829340364
Best params: {'est__n_jobs': -1, 'sel__n_features_to_select': 5, 'sel__step': 2}
Selected features: ['g_lab4', 'act_lab4', 'actq1_lab4', 'mean(qmsr$_lab4)', 'mean(qc$_lab4)']


In [None]:
selected_features_lr_4 = run_process(datalab4,grid_lr)

Fitting 5 folds for each of 2 candidates, totalling 10 fits


[Parallel(n_jobs=-1)]: Using backend LokyBackend with 2 concurrent workers.
[Parallel(n_jobs=-1)]: Done  10 out of  10 | elapsed:   10.7s finished


R2-test-fit: 0.13889850176655444
R2-test 0.16683914167981564
MSE-test 2.084583581546277
Best params: {'est__n_jobs': -1, 'sel__n_features_to_select': 5, 'sel__step': 1}
Selected features: ['rt_lab4', 'err_lab4', 'cer_lab4', 'actq1_lab4', 'mean(qc$_lab4)']




---



In [None]:
estimator = LinearRegression()
 
params = {
    'n_jobs'    : [-1],
}
 
grid_lr = GridSearchCV(estimator=estimator,
                       param_grid=params,
                       scoring='r2',
                       verbose=1,
                       n_jobs=-1,
                       return_train_score=True,
                       cv=KFold(n_splits=5, shuffle=True))

In [None]:
selected_features_lr_1 = ['actq3_lab1','actq1_lab1','mean(qmsr$_lab1)','rtr_lab1','cer_lab1']
selected_features_lr_2 = ['actq3_lab2','actq1_lab2','mean(qavt$_lab2)','avgtime_lab2','rt_lab2']
selected_features_lr_3 = ['rt_lab3','actq1_lab3','ut_lab3','mean(qact$_lab3)','cer_lab3']
selected_features_lr_4 = ['rt_lab4','cer_lab4','err_lab4','actq1_lab4','mean(qc$_lab4)']

1_2

In [None]:
dataset = datalab1[[TARGET] + selected_features_lr_1].join(datalab2[selected_features_lr_2])
run_process(dataset,grid_lr)

Fitting 5 folds for each of 1 candidates, totalling 5 fits


[Parallel(n_jobs=-1)]: Using backend LokyBackend with 2 concurrent workers.


R2-test-fit: 0.006911971881848245
R2-test -0.036086090944452476
MSE-test 2.317345083670907
Best params: {'n_jobs': -1}


[Parallel(n_jobs=-1)]: Done   5 out of   5 | elapsed:    1.2s finished


['actq3_lab1',
 'actq1_lab1',
 'mean(qmsr$_lab1)',
 'rtr_lab1',
 'cer_lab1',
 'actq3_lab2',
 'actq1_lab2',
 'mean(qavt$_lab2)',
 'avgtime_lab2',
 'rt_lab2']

In [None]:
dataset = datalab1[[TARGET] + selected_features_lr_1].join(datalab2[selected_features_lr_2])
run_process(dataset,grid_lr)

Fitting 5 folds for each of 1 candidates, totalling 5 fits
R2-test-fit: -0.003540234460532088
R2-test 0.0794383847029313
MSE-test 2.5780813366497703
Best params: {'n_jobs': -1}


[Parallel(n_jobs=-1)]: Using backend LokyBackend with 2 concurrent workers.
[Parallel(n_jobs=-1)]: Done   5 out of   5 | elapsed:    0.0s finished


['actq3_lab1',
 'actq1_lab1',
 'mean(qmsr$_lab1)',
 'rtr_lab1',
 'cer_lab1',
 'actq3_lab2',
 'actq1_lab2',
 'mean(qavt$_lab2)',
 'avgtime_lab2',
 'rt_lab2']

In [None]:
dataset = datalab1[[TARGET] + selected_features_lr_1].join(datalab2[selected_features_lr_2])
run_process(dataset,grid_lr)

Fitting 5 folds for each of 1 candidates, totalling 5 fits
R2-test-fit: -0.046590123398674944
R2-test -0.09455756729624443
MSE-test 3.0911462928259437
Best params: {'n_jobs': -1}


[Parallel(n_jobs=-1)]: Using backend LokyBackend with 2 concurrent workers.
[Parallel(n_jobs=-1)]: Done   5 out of   5 | elapsed:    0.0s finished


['actq3_lab1',
 'actq1_lab1',
 'mean(qmsr$_lab1)',
 'rtr_lab1',
 'cer_lab1',
 'actq3_lab2',
 'actq1_lab2',
 'mean(qavt$_lab2)',
 'avgtime_lab2',
 'rt_lab2']

In [None]:
dataset = datalab1[[TARGET] + selected_features_lr_1].join(datalab2[selected_features_lr_2])
run_process(dataset,grid_lr)

Fitting 5 folds for each of 1 candidates, totalling 5 fits
R2-test-fit: 0.01494113936741721
R2-test -0.013487881409562696
MSE-test 2.413164056043086
Best params: {'n_jobs': -1}


[Parallel(n_jobs=-1)]: Using backend LokyBackend with 2 concurrent workers.
[Parallel(n_jobs=-1)]: Done   5 out of   5 | elapsed:    0.0s finished


['actq3_lab1',
 'actq1_lab1',
 'mean(qmsr$_lab1)',
 'rtr_lab1',
 'cer_lab1',
 'actq3_lab2',
 'actq1_lab2',
 'mean(qavt$_lab2)',
 'avgtime_lab2',
 'rt_lab2']

In [None]:
dataset = datalab1[[TARGET] + selected_features_lr_1].join(datalab2[selected_features_lr_2])
run_process(dataset,grid_lr)

Fitting 5 folds for each of 1 candidates, totalling 5 fits
R2-test-fit: -0.029978878483077166
R2-test -0.09356225342973579
MSE-test 2.5596454965971103
Best params: {'n_jobs': -1}


[Parallel(n_jobs=-1)]: Using backend LokyBackend with 2 concurrent workers.
[Parallel(n_jobs=-1)]: Done   5 out of   5 | elapsed:    0.0s finished


['actq3_lab1',
 'actq1_lab1',
 'mean(qmsr$_lab1)',
 'rtr_lab1',
 'cer_lab1',
 'actq3_lab2',
 'actq1_lab2',
 'mean(qavt$_lab2)',
 'avgtime_lab2',
 'rt_lab2']

In [None]:
dataset = datalab1[[TARGET] + selected_features_lr_1].join(datalab2[selected_features_lr_2])
run_process(dataset,grid_lr)

Fitting 5 folds for each of 1 candidates, totalling 5 fits


[Parallel(n_jobs=-1)]: Using backend LokyBackend with 2 concurrent workers.


R2-test-fit: -0.02061660725764882
R2-test -0.2912312061511111
MSE-test 3.081248045059268
Best params: {'n_jobs': -1}


[Parallel(n_jobs=-1)]: Done   5 out of   5 | elapsed:    0.0s finished


['actq3_lab1',
 'actq1_lab1',
 'mean(qmsr$_lab1)',
 'rtr_lab1',
 'cer_lab1',
 'actq3_lab2',
 'actq1_lab2',
 'mean(qavt$_lab2)',
 'avgtime_lab2',
 'rt_lab2']

In [None]:
dataset = datalab1[[TARGET] + selected_features_lr_1].join(datalab2[selected_features_lr_2])
run_process(dataset,grid_lr)

Fitting 5 folds for each of 1 candidates, totalling 5 fits


[Parallel(n_jobs=-1)]: Using backend LokyBackend with 2 concurrent workers.


R2-test-fit: 0.026025901495438774
R2-test -0.011473874863089595
MSE-test 2.650700890786687
Best params: {'n_jobs': -1}


[Parallel(n_jobs=-1)]: Done   5 out of   5 | elapsed:    0.0s finished


['actq3_lab1',
 'actq1_lab1',
 'mean(qmsr$_lab1)',
 'rtr_lab1',
 'cer_lab1',
 'actq3_lab2',
 'actq1_lab2',
 'mean(qavt$_lab2)',
 'avgtime_lab2',
 'rt_lab2']

In [None]:
dataset = datalab1[[TARGET] + selected_features_lr_1].join(datalab2[selected_features_lr_2])
run_process(dataset,grid_lr)

Fitting 5 folds for each of 1 candidates, totalling 5 fits


[Parallel(n_jobs=-1)]: Using backend LokyBackend with 2 concurrent workers.


R2-test-fit: -0.009699739648013295
R2-test 0.08507543469984125
MSE-test 2.1607507383692717
Best params: {'n_jobs': -1}


[Parallel(n_jobs=-1)]: Done   5 out of   5 | elapsed:    0.0s finished


['actq3_lab1',
 'actq1_lab1',
 'mean(qmsr$_lab1)',
 'rtr_lab1',
 'cer_lab1',
 'actq3_lab2',
 'actq1_lab2',
 'mean(qavt$_lab2)',
 'avgtime_lab2',
 'rt_lab2']

In [None]:
dataset = datalab1[[TARGET] + selected_features_lr_1].join(datalab2[selected_features_lr_2])
run_process(dataset,grid_lr)

Fitting 5 folds for each of 1 candidates, totalling 5 fits


[Parallel(n_jobs=-1)]: Using backend LokyBackend with 2 concurrent workers.
[Parallel(n_jobs=-1)]: Done   5 out of   5 | elapsed:    0.0s finished


R2-test-fit: -0.068743834194177
R2-test 0.008960301171420104
MSE-test 2.4510015730681665
Best params: {'n_jobs': -1}


['actq3_lab1',
 'actq1_lab1',
 'mean(qmsr$_lab1)',
 'rtr_lab1',
 'cer_lab1',
 'actq3_lab2',
 'actq1_lab2',
 'mean(qavt$_lab2)',
 'avgtime_lab2',
 'rt_lab2']

In [None]:
dataset = datalab1[[TARGET] + selected_features_lr_1].join(datalab2[selected_features_lr_2])
run_process(dataset,grid_lr)

Fitting 5 folds for each of 1 candidates, totalling 5 fits


[Parallel(n_jobs=-1)]: Using backend LokyBackend with 2 concurrent workers.
[Parallel(n_jobs=-1)]: Done   5 out of   5 | elapsed:    0.0s finished


R2-test-fit: 0.0009485423355833023
R2-test -0.13710154890430148
MSE-test 2.5407108704484296
Best params: {'n_jobs': -1}


['actq3_lab1',
 'actq1_lab1',
 'mean(qmsr$_lab1)',
 'rtr_lab1',
 'cer_lab1',
 'actq3_lab2',
 'actq1_lab2',
 'mean(qavt$_lab2)',
 'avgtime_lab2',
 'rt_lab2']



---



1_2_3

In [None]:
dataset = datalab1[[TARGET] + selected_features_lr_1].join(datalab2[selected_features_lr_2]).join(datalab3[selected_features_lr_3])
run_process(dataset,grid_lr)

Fitting 5 folds for each of 1 candidates, totalling 5 fits
R2-test-fit: 0.07280532021956979
R2-test 0.12141717161565224
MSE-test 2.3262559793782014
Best params: {'n_jobs': -1}


[Parallel(n_jobs=-1)]: Using backend LokyBackend with 2 concurrent workers.
[Parallel(n_jobs=-1)]: Done   5 out of   5 | elapsed:    0.0s finished


['actq3_lab1',
 'actq1_lab1',
 'mean(qmsr$_lab1)',
 'rtr_lab1',
 'cer_lab1',
 'actq3_lab2',
 'actq1_lab2',
 'mean(qavt$_lab2)',
 'avgtime_lab2',
 'rt_lab2',
 'rt_lab3',
 'actq1_lab3',
 'ut_lab3',
 'mean(qact$_lab3)',
 'cer_lab3']

In [None]:
dataset = datalab1[[TARGET] + selected_features_lr_1].join(datalab2[selected_features_lr_2]).join(datalab3[selected_features_lr_3])
run_process(dataset,grid_lr)

Fitting 5 folds for each of 1 candidates, totalling 5 fits
R2-test-fit: 5.830295615796288e-05
R2-test 0.012427536060766076
MSE-test 2.4140726711615565
Best params: {'n_jobs': -1}


[Parallel(n_jobs=-1)]: Using backend LokyBackend with 2 concurrent workers.
[Parallel(n_jobs=-1)]: Done   5 out of   5 | elapsed:    0.0s finished


['actq3_lab1',
 'actq1_lab1',
 'mean(qmsr$_lab1)',
 'rtr_lab1',
 'cer_lab1',
 'actq3_lab2',
 'actq1_lab2',
 'mean(qavt$_lab2)',
 'avgtime_lab2',
 'rt_lab2',
 'rt_lab3',
 'actq1_lab3',
 'ut_lab3',
 'mean(qact$_lab3)',
 'cer_lab3']

In [None]:
dataset = datalab1[[TARGET] + selected_features_lr_1].join(datalab2[selected_features_lr_2]).join(datalab3[selected_features_lr_3])
run_process(dataset,grid_lr)

Fitting 5 folds for each of 1 candidates, totalling 5 fits
R2-test-fit: 0.044320763610744794
R2-test 0.06863106085845805
MSE-test 2.2071133914849135
Best params: {'n_jobs': -1}


[Parallel(n_jobs=-1)]: Using backend LokyBackend with 2 concurrent workers.
[Parallel(n_jobs=-1)]: Done   5 out of   5 | elapsed:    0.0s finished


['actq3_lab1',
 'actq1_lab1',
 'mean(qmsr$_lab1)',
 'rtr_lab1',
 'cer_lab1',
 'actq3_lab2',
 'actq1_lab2',
 'mean(qavt$_lab2)',
 'avgtime_lab2',
 'rt_lab2',
 'rt_lab3',
 'actq1_lab3',
 'ut_lab3',
 'mean(qact$_lab3)',
 'cer_lab3']

In [None]:
dataset = datalab1[[TARGET] + selected_features_lr_1].join(datalab2[selected_features_lr_2]).join(datalab3[selected_features_lr_3])
run_process(dataset,grid_lr)

Fitting 5 folds for each of 1 candidates, totalling 5 fits
R2-test-fit: -0.012095135878418373
R2-test -0.10484859642135258
MSE-test 2.7897000371370266
Best params: {'n_jobs': -1}


[Parallel(n_jobs=-1)]: Using backend LokyBackend with 2 concurrent workers.
[Parallel(n_jobs=-1)]: Done   5 out of   5 | elapsed:    0.0s finished


['actq3_lab1',
 'actq1_lab1',
 'mean(qmsr$_lab1)',
 'rtr_lab1',
 'cer_lab1',
 'actq3_lab2',
 'actq1_lab2',
 'mean(qavt$_lab2)',
 'avgtime_lab2',
 'rt_lab2',
 'rt_lab3',
 'actq1_lab3',
 'ut_lab3',
 'mean(qact$_lab3)',
 'cer_lab3']

In [None]:
dataset = datalab1[[TARGET] + selected_features_lr_1].join(datalab2[selected_features_lr_2]).join(datalab3[selected_features_lr_3])
run_process(dataset,grid_lr)

Fitting 5 folds for each of 1 candidates, totalling 5 fits
R2-test-fit: -0.004509247793069604
R2-test 0.08611742188209426
MSE-test 2.382789514680097
Best params: {'n_jobs': -1}


[Parallel(n_jobs=-1)]: Using backend LokyBackend with 2 concurrent workers.
[Parallel(n_jobs=-1)]: Done   5 out of   5 | elapsed:    0.0s finished


['actq3_lab1',
 'actq1_lab1',
 'mean(qmsr$_lab1)',
 'rtr_lab1',
 'cer_lab1',
 'actq3_lab2',
 'actq1_lab2',
 'mean(qavt$_lab2)',
 'avgtime_lab2',
 'rt_lab2',
 'rt_lab3',
 'actq1_lab3',
 'ut_lab3',
 'mean(qact$_lab3)',
 'cer_lab3']

In [None]:
dataset = datalab1[[TARGET] + selected_features_lr_1].join(datalab2[selected_features_lr_2]).join(datalab3[selected_features_lr_3])
run_process(dataset,grid_lr)

Fitting 5 folds for each of 1 candidates, totalling 5 fits
R2-test-fit: -0.03789042601758361
R2-test -0.13072142250733276
MSE-test 2.775054141731726
Best params: {'n_jobs': -1}


[Parallel(n_jobs=-1)]: Using backend LokyBackend with 2 concurrent workers.
[Parallel(n_jobs=-1)]: Done   5 out of   5 | elapsed:    0.0s finished


['actq3_lab1',
 'actq1_lab1',
 'mean(qmsr$_lab1)',
 'rtr_lab1',
 'cer_lab1',
 'actq3_lab2',
 'actq1_lab2',
 'mean(qavt$_lab2)',
 'avgtime_lab2',
 'rt_lab2',
 'rt_lab3',
 'actq1_lab3',
 'ut_lab3',
 'mean(qact$_lab3)',
 'cer_lab3']

In [None]:
dataset = datalab1[[TARGET] + selected_features_lr_1].join(datalab2[selected_features_lr_2]).join(datalab3[selected_features_lr_3])
run_process(dataset,grid_lr)

Fitting 5 folds for each of 1 candidates, totalling 5 fits
R2-test-fit: 0.036234337665218705
R2-test 0.01943093799897322
MSE-test 2.4445363669576685
Best params: {'n_jobs': -1}


[Parallel(n_jobs=-1)]: Using backend LokyBackend with 2 concurrent workers.
[Parallel(n_jobs=-1)]: Done   5 out of   5 | elapsed:    0.0s finished


['actq3_lab1',
 'actq1_lab1',
 'mean(qmsr$_lab1)',
 'rtr_lab1',
 'cer_lab1',
 'actq3_lab2',
 'actq1_lab2',
 'mean(qavt$_lab2)',
 'avgtime_lab2',
 'rt_lab2',
 'rt_lab3',
 'actq1_lab3',
 'ut_lab3',
 'mean(qact$_lab3)',
 'cer_lab3']

In [None]:
dataset = datalab1[[TARGET] + selected_features_lr_1].join(datalab2[selected_features_lr_2]).join(datalab3[selected_features_lr_3])
run_process(dataset,grid_lr)

Fitting 5 folds for each of 1 candidates, totalling 5 fits
R2-test-fit: 0.004192329211226786
R2-test 0.016468642925129506
MSE-test 2.175581885746646
Best params: {'n_jobs': -1}


[Parallel(n_jobs=-1)]: Using backend LokyBackend with 2 concurrent workers.
[Parallel(n_jobs=-1)]: Done   5 out of   5 | elapsed:    0.0s finished


['actq3_lab1',
 'actq1_lab1',
 'mean(qmsr$_lab1)',
 'rtr_lab1',
 'cer_lab1',
 'actq3_lab2',
 'actq1_lab2',
 'mean(qavt$_lab2)',
 'avgtime_lab2',
 'rt_lab2',
 'rt_lab3',
 'actq1_lab3',
 'ut_lab3',
 'mean(qact$_lab3)',
 'cer_lab3']

In [None]:
dataset = datalab1[[TARGET] + selected_features_lr_1].join(datalab2[selected_features_lr_2]).join(datalab3[selected_features_lr_3])
run_process(dataset,grid_lr)

Fitting 5 folds for each of 1 candidates, totalling 5 fits


[Parallel(n_jobs=-1)]: Using backend LokyBackend with 2 concurrent workers.
[Parallel(n_jobs=-1)]: Done   5 out of   5 | elapsed:    0.0s finished


R2-test-fit: 0.03902897311234281
R2-test -0.06618909207438994
MSE-test 2.9331634819395886
Best params: {'n_jobs': -1}


['actq3_lab1',
 'actq1_lab1',
 'mean(qmsr$_lab1)',
 'rtr_lab1',
 'cer_lab1',
 'actq3_lab2',
 'actq1_lab2',
 'mean(qavt$_lab2)',
 'avgtime_lab2',
 'rt_lab2',
 'rt_lab3',
 'actq1_lab3',
 'ut_lab3',
 'mean(qact$_lab3)',
 'cer_lab3']

In [None]:
dataset = datalab1[[TARGET] + selected_features_lr_1].join(datalab2[selected_features_lr_2]).join(datalab3[selected_features_lr_3])
run_process(dataset,grid_lr)

Fitting 5 folds for each of 1 candidates, totalling 5 fits


[Parallel(n_jobs=-1)]: Using backend LokyBackend with 2 concurrent workers.
[Parallel(n_jobs=-1)]: Done   5 out of   5 | elapsed:    0.0s finished


R2-test-fit: 0.0742841863991344
R2-test 0.03739365033290498
MSE-test 2.413619461558209
Best params: {'n_jobs': -1}


['actq3_lab1',
 'actq1_lab1',
 'mean(qmsr$_lab1)',
 'rtr_lab1',
 'cer_lab1',
 'actq3_lab2',
 'actq1_lab2',
 'mean(qavt$_lab2)',
 'avgtime_lab2',
 'rt_lab2',
 'rt_lab3',
 'actq1_lab3',
 'ut_lab3',
 'mean(qact$_lab3)',
 'cer_lab3']



---



1_2_3_4

In [None]:
dataset = datalab1[[TARGET] + selected_features_lr_1].join(datalab2[selected_features_lr_2]).join(datalab3[selected_features_lr_3]).join(datalab4[selected_features_lr_4])
run_process(dataset,grid_lr)

Fitting 5 folds for each of 1 candidates, totalling 5 fits
R2-test-fit: 0.07159460170533863
R2-test 0.17405937131044213
MSE-test 1.942184873533853
Best params: {'n_jobs': -1}


[Parallel(n_jobs=-1)]: Using backend LokyBackend with 2 concurrent workers.
[Parallel(n_jobs=-1)]: Done   5 out of   5 | elapsed:    0.0s finished


['actq3_lab1',
 'actq1_lab1',
 'mean(qmsr$_lab1)',
 'rtr_lab1',
 'cer_lab1',
 'actq3_lab2',
 'actq1_lab2',
 'mean(qavt$_lab2)',
 'avgtime_lab2',
 'rt_lab2',
 'rt_lab3',
 'actq1_lab3',
 'ut_lab3',
 'mean(qact$_lab3)',
 'cer_lab3',
 'rt_lab4',
 'cer_lab4',
 'err_lab4',
 'actq1_lab4',
 'mean(qc$_lab4)']

In [None]:
dataset = datalab1[[TARGET] + selected_features_lr_1].join(datalab2[selected_features_lr_2]).join(datalab3[selected_features_lr_3]).join(datalab4[selected_features_lr_4])
run_process(dataset,grid_lr)

Fitting 5 folds for each of 1 candidates, totalling 5 fits
R2-test-fit: 0.13712423030689774
R2-test 0.19019282289091122
MSE-test 2.20798787288616
Best params: {'n_jobs': -1}


[Parallel(n_jobs=-1)]: Using backend LokyBackend with 2 concurrent workers.
[Parallel(n_jobs=-1)]: Done   5 out of   5 | elapsed:    0.0s finished


['actq3_lab1',
 'actq1_lab1',
 'mean(qmsr$_lab1)',
 'rtr_lab1',
 'cer_lab1',
 'actq3_lab2',
 'actq1_lab2',
 'mean(qavt$_lab2)',
 'avgtime_lab2',
 'rt_lab2',
 'rt_lab3',
 'actq1_lab3',
 'ut_lab3',
 'mean(qact$_lab3)',
 'cer_lab3',
 'rt_lab4',
 'cer_lab4',
 'err_lab4',
 'actq1_lab4',
 'mean(qc$_lab4)']

In [None]:
dataset = datalab1[[TARGET] + selected_features_lr_1].join(datalab2[selected_features_lr_2]).join(datalab3[selected_features_lr_3]).join(datalab4[selected_features_lr_4])
run_process(dataset,grid_lr)

Fitting 5 folds for each of 1 candidates, totalling 5 fits
R2-test-fit: 0.08485515397573942
R2-test 0.17004986401493094
MSE-test 2.0482862947366565
Best params: {'n_jobs': -1}


[Parallel(n_jobs=-1)]: Using backend LokyBackend with 2 concurrent workers.
[Parallel(n_jobs=-1)]: Done   5 out of   5 | elapsed:    0.0s finished


['actq3_lab1',
 'actq1_lab1',
 'mean(qmsr$_lab1)',
 'rtr_lab1',
 'cer_lab1',
 'actq3_lab2',
 'actq1_lab2',
 'mean(qavt$_lab2)',
 'avgtime_lab2',
 'rt_lab2',
 'rt_lab3',
 'actq1_lab3',
 'ut_lab3',
 'mean(qact$_lab3)',
 'cer_lab3',
 'rt_lab4',
 'cer_lab4',
 'err_lab4',
 'actq1_lab4',
 'mean(qc$_lab4)']

In [None]:
dataset = datalab1[[TARGET] + selected_features_lr_1].join(datalab2[selected_features_lr_2]).join(datalab3[selected_features_lr_3]).join(datalab4[selected_features_lr_4])
run_process(dataset,grid_lr)

Fitting 5 folds for each of 1 candidates, totalling 5 fits
R2-test-fit: 0.2006250060442661
R2-test 0.11536931211314372
MSE-test 2.4023173759908745
Best params: {'n_jobs': -1}


[Parallel(n_jobs=-1)]: Using backend LokyBackend with 2 concurrent workers.
[Parallel(n_jobs=-1)]: Done   5 out of   5 | elapsed:    0.0s finished


['actq3_lab1',
 'actq1_lab1',
 'mean(qmsr$_lab1)',
 'rtr_lab1',
 'cer_lab1',
 'actq3_lab2',
 'actq1_lab2',
 'mean(qavt$_lab2)',
 'avgtime_lab2',
 'rt_lab2',
 'rt_lab3',
 'actq1_lab3',
 'ut_lab3',
 'mean(qact$_lab3)',
 'cer_lab3',
 'rt_lab4',
 'cer_lab4',
 'err_lab4',
 'actq1_lab4',
 'mean(qc$_lab4)']

In [None]:
dataset = datalab1[[TARGET] + selected_features_lr_1].join(datalab2[selected_features_lr_2]).join(datalab3[selected_features_lr_3]).join(datalab4[selected_features_lr_4])
run_process(dataset,grid_lr)

Fitting 5 folds for each of 1 candidates, totalling 5 fits


[Parallel(n_jobs=-1)]: Using backend LokyBackend with 2 concurrent workers.


R2-test-fit: 0.0876863296626134
R2-test 0.2095709912800927
MSE-test 1.6182577664266673
Best params: {'n_jobs': -1}


[Parallel(n_jobs=-1)]: Done   5 out of   5 | elapsed:    0.0s finished


['actq3_lab1',
 'actq1_lab1',
 'mean(qmsr$_lab1)',
 'rtr_lab1',
 'cer_lab1',
 'actq3_lab2',
 'actq1_lab2',
 'mean(qavt$_lab2)',
 'avgtime_lab2',
 'rt_lab2',
 'rt_lab3',
 'actq1_lab3',
 'ut_lab3',
 'mean(qact$_lab3)',
 'cer_lab3',
 'rt_lab4',
 'cer_lab4',
 'err_lab4',
 'actq1_lab4',
 'mean(qc$_lab4)']

In [None]:
dataset = datalab1[[TARGET] + selected_features_lr_1].join(datalab2[selected_features_lr_2]).join(datalab3[selected_features_lr_3]).join(datalab4[selected_features_lr_4])
run_process(dataset,grid_lr)

Fitting 5 folds for each of 1 candidates, totalling 5 fits
R2-test-fit: 0.1385503411617526
R2-test 0.1291393993575488
MSE-test 2.26177499844272
Best params: {'n_jobs': -1}


[Parallel(n_jobs=-1)]: Using backend LokyBackend with 2 concurrent workers.
[Parallel(n_jobs=-1)]: Done   5 out of   5 | elapsed:    0.0s finished


['actq3_lab1',
 'actq1_lab1',
 'mean(qmsr$_lab1)',
 'rtr_lab1',
 'cer_lab1',
 'actq3_lab2',
 'actq1_lab2',
 'mean(qavt$_lab2)',
 'avgtime_lab2',
 'rt_lab2',
 'rt_lab3',
 'actq1_lab3',
 'ut_lab3',
 'mean(qact$_lab3)',
 'cer_lab3',
 'rt_lab4',
 'cer_lab4',
 'err_lab4',
 'actq1_lab4',
 'mean(qc$_lab4)']

In [None]:
dataset = datalab1[[TARGET] + selected_features_lr_1].join(datalab2[selected_features_lr_2]).join(datalab3[selected_features_lr_3]).join(datalab4[selected_features_lr_4])
run_process(dataset,grid_lr)

Fitting 5 folds for each of 1 candidates, totalling 5 fits
R2-test-fit: 0.11783198781579604
R2-test 0.028345362118560424
MSE-test 2.0877971158508193
Best params: {'n_jobs': -1}


[Parallel(n_jobs=-1)]: Using backend LokyBackend with 2 concurrent workers.
[Parallel(n_jobs=-1)]: Done   5 out of   5 | elapsed:    0.0s finished


['actq3_lab1',
 'actq1_lab1',
 'mean(qmsr$_lab1)',
 'rtr_lab1',
 'cer_lab1',
 'actq3_lab2',
 'actq1_lab2',
 'mean(qavt$_lab2)',
 'avgtime_lab2',
 'rt_lab2',
 'rt_lab3',
 'actq1_lab3',
 'ut_lab3',
 'mean(qact$_lab3)',
 'cer_lab3',
 'rt_lab4',
 'cer_lab4',
 'err_lab4',
 'actq1_lab4',
 'mean(qc$_lab4)']

In [None]:
dataset = datalab1[[TARGET] + selected_features_lr_1].join(datalab2[selected_features_lr_2]).join(datalab3[selected_features_lr_3]).join(datalab4[selected_features_lr_4])
run_process(dataset,grid_lr)

[Parallel(n_jobs=-1)]: Using backend LokyBackend with 2 concurrent workers.


Fitting 5 folds for each of 1 candidates, totalling 5 fits
R2-test-fit: 0.15218574347801778
R2-test 0.1447160780650525
MSE-test 1.912049268903947
Best params: {'n_jobs': -1}


[Parallel(n_jobs=-1)]: Done   5 out of   5 | elapsed:    0.0s finished


['actq3_lab1',
 'actq1_lab1',
 'mean(qmsr$_lab1)',
 'rtr_lab1',
 'cer_lab1',
 'actq3_lab2',
 'actq1_lab2',
 'mean(qavt$_lab2)',
 'avgtime_lab2',
 'rt_lab2',
 'rt_lab3',
 'actq1_lab3',
 'ut_lab3',
 'mean(qact$_lab3)',
 'cer_lab3',
 'rt_lab4',
 'cer_lab4',
 'err_lab4',
 'actq1_lab4',
 'mean(qc$_lab4)']

In [None]:
dataset = datalab1[[TARGET] + selected_features_lr_1].join(datalab2[selected_features_lr_2]).join(datalab3[selected_features_lr_3]).join(datalab4[selected_features_lr_4])
run_process(dataset,grid_lr)

Fitting 5 folds for each of 1 candidates, totalling 5 fits
R2-test-fit: 0.19765417482762362
R2-test 0.0964875192844028
MSE-test 2.4087222095500955
Best params: {'n_jobs': -1}


[Parallel(n_jobs=-1)]: Using backend LokyBackend with 2 concurrent workers.
[Parallel(n_jobs=-1)]: Done   5 out of   5 | elapsed:    0.0s finished


['actq3_lab1',
 'actq1_lab1',
 'mean(qmsr$_lab1)',
 'rtr_lab1',
 'cer_lab1',
 'actq3_lab2',
 'actq1_lab2',
 'mean(qavt$_lab2)',
 'avgtime_lab2',
 'rt_lab2',
 'rt_lab3',
 'actq1_lab3',
 'ut_lab3',
 'mean(qact$_lab3)',
 'cer_lab3',
 'rt_lab4',
 'cer_lab4',
 'err_lab4',
 'actq1_lab4',
 'mean(qc$_lab4)']

In [None]:
dataset = datalab1[[TARGET] + selected_features_lr_1].join(datalab2[selected_features_lr_2]).join(datalab3[selected_features_lr_3]).join(datalab4[selected_features_lr_4])
run_process(dataset,grid_lr)

Fitting 5 folds for each of 1 candidates, totalling 5 fits
R2-test-fit: 0.13475044609413206
R2-test -0.051569875496652706
MSE-test 2.661000476068511
Best params: {'n_jobs': -1}


[Parallel(n_jobs=-1)]: Using backend LokyBackend with 2 concurrent workers.
[Parallel(n_jobs=-1)]: Done   5 out of   5 | elapsed:    0.0s finished


['actq3_lab1',
 'actq1_lab1',
 'mean(qmsr$_lab1)',
 'rtr_lab1',
 'cer_lab1',
 'actq3_lab2',
 'actq1_lab2',
 'mean(qavt$_lab2)',
 'avgtime_lab2',
 'rt_lab2',
 'rt_lab3',
 'actq1_lab3',
 'ut_lab3',
 'mean(qact$_lab3)',
 'cer_lab3',
 'rt_lab4',
 'cer_lab4',
 'err_lab4',
 'actq1_lab4',
 'mean(qc$_lab4)']



---



In [None]:
!apt-get install swig -y
!pip install Cython numpy
!pip install auto-sklearn

In [None]:
!pip install scikit-learn==0.23.0

In [None]:
!pip install dask distributed

In [None]:
#@title **ANN**

import keras
from keras.models import Sequential
from keras.layers import Dense
from keras.layers.core import Dense, Dropout, Flatten
from keras.optimizers import SGD
from keras.layers import Dropout
from keras.wrappers.scikit_learn import KerasRegressor
from sklearn.model_selection import RandomizedSearchCV

def create_model( nl1=1, nl2=1,  nl3=1, 
                 nn1=1000, nn2=500, nn3 = 200, lr=0.01, decay=0., l1=0.01, l2=0.01,
                act = 'relu', dropout=0, input_shape=25, output_shape=1):
    '''This is a model generating function so that we can search over neural net 
    parameters and architecture'''
    
    opt = 'SGD' # keras.optimizers.Adam(lr=lr, beta_1=0.9, beta_2=0.999,  decay=decay)
    reg = keras.regularizers.l1_l2(l1=l1, l2=l2)
                                                     
    model = Sequential()
    
    # for the firt layer we need to specify the input dimensions
    first=True
    
    for i in range(nl1):
        if first:
            model.add(Dense(nn1, input_dim=input_shape, activation=act, kernel_regularizer=reg))
            first=False
        else: 
            model.add(Dense(nn1, activation=act, kernel_regularizer=reg))
        if dropout!=0:
            model.add(Dropout(dropout))
            
    for i in range(nl2):
        if first:
            model.add(Dense(nn2, input_dim=input_shape, activation=act, kernel_regularizer=reg))
            first=False
        else: 
            model.add(Dense(nn2, activation=act, kernel_regularizer=reg))
        if dropout!=0:
            model.add(Dropout(dropout))
            
    for i in range(nl3):
        if first:
            model.add(Dense(nn3, input_dim=input_shape, activation=act, kernel_regularizer=reg))
            first=False
        else: 
            model.add(Dense(nn3, activation=act, kernel_regularizer=reg))
        if dropout!=0:
            model.add(Dropout(dropout))
            
    model.add(Dense(output_shape, activation='sigmoid'))
    model.compile(loss='mse', optimizer=opt, metrics=['mse'],)
    return model

# model class to use in the scikit random search CV 
model = KerasRegressor(build_fn=create_model, epochs=20, batch_size=20, verbose=1)

# learning algorithm parameters
lr=[1e-2, 1e-3, 1e-4]
decay=[1e-6,1e-9,0]

# activation
activation=['relu', 'sigmoid']

# numbers of layers
nl1 = [0,1,2,3]
nl2 = [0,1,2,3]
nl3 = [0,1,2,3]

# neurons in each layer
nn1=[20,50,100]
nn2=[10,40,70]
nn3=[5,15,30]
# nn1=[300,700,1400,2100]
# nn2=[100,400,800]
# nn3=[50,150,300]

# dropout and regularisation
dropout = [0, 0.1, 0.2, 0.3]
l1 = [0, 0.01, 0.003, 0.001, 0.0001]
l2 = [0, 0.01, 0.003, 0.001, 0.0001]

In [None]:
# GradientBoostingRegressor / RandomForestRegressor / SVR(kernel='linear')
sel_estimator = GradientBoostingRegressor(random_state=random_state)
 
# RFE / SelectFromModel
selector = RFE(sel_estimator)
estimator = model
 
pipe = Pipeline([
    ('sel', selector),
    ('est', estimator)
])

param_grid = {
    'sel__estimator__learning_rate': [0.05,0.1,0.2],
    'sel__n_features_to_select'    : [5],
    'est__nl1':            nl1,
    'est__nl2':            nl2,
    'est__nl3':            nl3,
    'est__nn1':            nn1,
    'est__nn2':            nn2,
    'est__nn3':            nn3,
    'est__act':            activation,
    'est__l1':             l1,
    'est__l2':             l2,
    'est__lr':             lr,
    'est__decay':          decay,
    'est__dropout':        dropout, 
    'est__input_shape':    [5],
    'est__output_shape':   [1]
}

rand_cv = RandomizedSearchCV(estimator=pipe,
                             param_distributions=param_grid,
                             verbose=100,
                             n_iter=10,
                             scoring='neg_mean_squared_error',
                             n_jobs=-1,
                             return_train_score=True,
                             cv=KFold(n_splits=5, shuffle=True))

In [None]:
run_process(datalab1, rand_cv)

Fitting 5 folds for each of 10 candidates, totalling 50 fits
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test-fit: -5.923303439476626
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test -7.056368827819824
MSE-test 6.411592354201742
Best params: {'sel__n_features_to_select': 5, 'sel__estimator__learning_rate': 0.1, 'est__output_shape': 1, 'est__nn3': 30, 'est__nn2': 40, 'est__nn1': 50, 'est__nl3': 1, 'est__nl2': 3, 'est__nl1': 2, 'est__lr': 0.001, 'est__l2': 0.003, 'est__l1': 0, 'est__input_shape': 5, 'est__dropout': 0, 'est__decay': 1e-06, 'est__act': 'relu'}
Selected features: ['ut_lab1', 'rtr_lab1', 'actq1_lab1', 

['ut_lab1', 'rtr_lab1', 'actq1_lab1', 'actq3_lab1', 'mean(qc$_lab1)']

In [None]:
run_process(datalab1, rand_cv)

Fitting 5 folds for each of 10 candidates, totalling 50 fits
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test-fit: -5.9258554070201
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test -7.106952667236328
MSE-test 6.644561882162838
Best params: {'sel__n_features_to_select': 5, 'sel__estimator__learning_rate': 0.2, 'est__output_shape': 1, 'est__nn3': 30, 'est__nn2': 10, 'est__nn1': 20, 'est__nl3': 2, 'est__nl2': 2, 'est__nl1': 2, 'est__lr': 0.01, 'est__l2': 0.001, 'est__l1': 0.001, 'est__input_shape': 5, 'est__dropout': 0.1, 'est__decay': 1e-06, 'est__act': 'relu'}
Selected features: ['ut_lab1', 'ctr_lab1', 'actq1_lab1

['ut_lab1', 'ctr_lab1', 'actq1_lab1', 'actq3_lab1', 'mean(qmsr$_lab1)']

In [None]:
run_process(datalab1, rand_cv)

Fitting 5 folds for each of 10 candidates, totalling 50 fits
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test-fit: -5.936426645465245
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test -10.874432563781738
MSE-test 5.652118969822092
Best params: {'sel__n_features_to_select': 5, 'sel__estimator__learning_rate': 0.05, 'est__output_shape': 1, 'est__nn3': 30, 'est__nn2': 70, 'est__nn1': 20, 'est__nl3': 3, 'est__nl2': 1, 'est__nl1': 0, 'est__lr': 0.001, 'est__l2': 0.0001, 'est__l1': 0.01, 'est__input_shape': 5, 'est__dropout': 0.1, 'est__decay': 1e-09, 'est__act': 'relu'}
Selected features: ['ctr_lab1', 'cer_lab1', 'actq

['ctr_lab1', 'cer_lab1', 'actq1_lab1', 'actq3_lab1', 'mean(qmsr$_lab1)']

In [None]:
run_process(datalab1, rand_cv)

Fitting 5 folds for each of 10 candidates, totalling 50 fits
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test-fit: -5.927009356216222
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test -6.854718208312988
MSE-test 6.558102731570438
Best params: {'sel__n_features_to_select': 5, 'sel__estimator__learning_rate': 0.1, 'est__output_shape': 1, 'est__nn3': 5, 'est__nn2': 40, 'est__nn1': 20, 'est__nl3': 1, 'est__nl2': 2, 'est__nl1': 2, 'est__lr': 0.001, 'est__l2': 0.003, 'est__l1': 0, 'est__input_shape': 5, 'est__dropout': 0.1, 'est__decay': 1e-06, 'est__act': 'relu'}
Selected features: ['ut_lab1', 'rt_lab1', 'actq1_lab1', 

['ut_lab1', 'rt_lab1', 'actq1_lab1', 'actq3_lab1', 'mean(qmsr$_lab1)']

In [None]:
run_process(datalab1, rand_cv)

Fitting 5 folds for each of 10 candidates, totalling 50 fits
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test-fit: -5.918343879459089
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test -11.860539436340332
MSE-test 6.010468995425837
Best params: {'sel__n_features_to_select': 5, 'sel__estimator__learning_rate': 0.05, 'est__output_shape': 1, 'est__nn3': 30, 'est__nn2': 40, 'est__nn1': 100, 'est__nl3': 1, 'est__nl2': 3, 'est__nl1': 2, 'est__lr': 0.001, 'est__l2': 0.001, 'est__l1': 0.003, 'est__input_shape': 5, 'est__dropout': 0, 'est__decay': 1e-06, 'est__act': 'relu'}
Selected features: ['ctr_lab1', 'actq1_lab1', 'act

['ctr_lab1', 'actq1_lab1', 'actq3_lab1', 'mean(qmsr$_lab1)', 'sum(qat$_lab1)']

In [None]:
run_process(datalab1, rand_cv)

Fitting 5 folds for each of 10 candidates, totalling 50 fits
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test-fit: -5.933888879874241
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test -21.48423194885254
MSE-test 5.708795652634326
Best params: {'sel__n_features_to_select': 5, 'sel__estimator__learning_rate': 0.1, 'est__output_shape': 1, 'est__nn3': 15, 'est__nn2': 40, 'est__nn1': 100, 'est__nl3': 0, 'est__nl2': 3, 'est__nl1': 2, 'est__lr': 0.001, 'est__l2': 0.01, 'est__l1': 0.01, 'est__input_shape': 5, 'est__dropout': 0.2, 'est__decay': 1e-09, 'est__act': 'sigmoid'}
Selected features: ['rtr_lab1', 'actq1_lab1', 'ac

['rtr_lab1', 'actq1_lab1', 'actq3_lab1', 'mean(qmsr$_lab1)', 'sum(qat$_lab1)']

In [None]:
run_process(datalab1, rand_cv)

Fitting 5 folds for each of 10 candidates, totalling 50 fits
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test-fit: -5.929686239745116
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test -6.813991546630859
MSE-test 6.253539401301734
Best params: {'sel__n_features_to_select': 5, 'sel__estimator__learning_rate': 0.2, 'est__output_shape': 1, 'est__nn3': 15, 'est__nn2': 10, 'est__nn1': 50, 'est__nl3': 3, 'est__nl2': 1, 'est__nl1': 2, 'est__lr': 0.01, 'est__l2': 0, 'est__l1': 0.001, 'est__input_shape': 5, 'est__dropout': 0.2, 'est__decay': 0, 'est__act': 'relu'}
Selected features: ['ctr_lab1', 'rtr_lab1', 'cer_lab1', 'act

['ctr_lab1', 'rtr_lab1', 'cer_lab1', 'actq1_lab1', 'actq3_lab1']

In [None]:
run_process(datalab1, rand_cv)

Fitting 5 folds for each of 10 candidates, totalling 50 fits
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test-fit: -5.925605766693848
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test -6.979732036590576
MSE-test 5.982978865412167
Best params: {'sel__n_features_to_select': 5, 'sel__estimator__learning_rate': 0.1, 'est__output_shape': 1, 'est__nn3': 30, 'est__nn2': 10, 'est__nn1': 50, 'est__nl3': 2, 'est__nl2': 3, 'est__nl1': 0, 'est__lr': 0.01, 'est__l2': 0.003, 'est__l1': 0.003, 'est__input_shape': 5, 'est__dropout': 0, 'est__decay': 0, 'est__act': 'relu'}
Selected features: ['rtr_lab1', 'cer_lab1', 'actq1_lab1', 

['rtr_lab1', 'cer_lab1', 'actq1_lab1', 'actq3_lab1', 'mean(qmsr$_lab1)']

In [None]:
run_process(datalab1, rand_cv)

Fitting 5 folds for each of 10 candidates, totalling 50 fits
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test-fit: -5.916838894362114
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test -8.500391960144043
MSE-test 7.207648012376789
Best params: {'sel__n_features_to_select': 5, 'sel__estimator__learning_rate': 0.1, 'est__output_shape': 1, 'est__nn3': 30, 'est__nn2': 70, 'est__nn1': 50, 'est__nl3': 3, 'est__nl2': 3, 'est__nl1': 2, 'est__lr': 0.01, 'est__l2': 0.003, 'est__l1': 0.0001, 'est__input_shape': 5, 'est__dropout': 0.3, 'est__decay': 1e-09, 'est__act': 'relu'}
Selected features: ['ut_lab1', 'ct_lab1', 'rt_lab1'

['ut_lab1', 'ct_lab1', 'rt_lab1', 'actq1_lab1', 'actq3_lab1']

In [None]:
run_process(datalab1, rand_cv)

Fitting 5 folds for each of 10 candidates, totalling 50 fits
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test-fit: -5.9228367533459965
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test -6.965287208557129
MSE-test 6.555714213191168
Best params: {'sel__n_features_to_select': 5, 'sel__estimator__learning_rate': 0.1, 'est__output_shape': 1, 'est__nn3': 30, 'est__nn2': 40, 'est__nn1': 100, 'est__nl3': 2, 'est__nl2': 3, 'est__nl1': 3, 'est__lr': 0.001, 'est__l2': 0.001, 'est__l1': 0, 'est__input_shape': 5, 'est__dropout': 0.2, 'est__decay': 1e-06, 'est__act': 'relu'}
Selected features: ['rt_lab1', 'rtr_lab1', 'actq1_lab

['rt_lab1', 'rtr_lab1', 'actq1_lab1', 'actq3_lab1', 'mean(qmsr$_lab1)']



---



In [None]:
run_process(datalab2, rand_cv)

Fitting 5 folds for each of 10 candidates, totalling 50 fits
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test-fit: -5.912453406891068
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test -7.445986270904541
MSE-test 5.847026207373182
Best params: {'sel__n_features_to_select': 5, 'sel__estimator__learning_rate': 0.2, 'est__output_shape': 1, 'est__nn3': 30, 'est__nn2': 70, 'est__nn1': 100, 'est__nl3': 3, 'est__nl2': 3, 'est__nl1': 0, 'est__lr': 0.01, 'est__l2': 0.0001, 'est__l1': 0.001, 'est__input_shape': 5, 'est__dropout': 0.3, 'est__decay': 1e-06, 'est__act': 'relu'}
Selected features: ['ut_lab2', 'actq1_lab2', 'actq

['ut_lab2', 'actq1_lab2', 'actq3_lab2', 'mean(qact$_lab2)', 'avgtime_lab2']

In [None]:
run_process(datalab2, rand_cv)

Fitting 5 folds for each of 10 candidates, totalling 50 fits
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test-fit: -5.917384506622694
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test -7.697447776794434
MSE-test 6.875908767372708
Best params: {'sel__n_features_to_select': 5, 'sel__estimator__learning_rate': 0.2, 'est__output_shape': 1, 'est__nn3': 5, 'est__nn2': 40, 'est__nn1': 50, 'est__nl3': 2, 'est__nl2': 0, 'est__nl1': 3, 'est__lr': 0.001, 'est__l2': 0.001, 'est__l1': 0.001, 'est__input_shape': 5, 'est__dropout': 0.1, 'est__decay': 1e-09, 'est__act': 'relu'}
Selected features: ['ut_lab2', 'ctr_lab2', 'actq1_la

['ut_lab2', 'ctr_lab2', 'actq1_lab2', 'actq3_lab2', 'mean(qmsr$_lab2)']

In [None]:
run_process(datalab2, rand_cv)

Fitting 5 folds for each of 10 candidates, totalling 50 fits
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test-fit: -5.93834031128469
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test -10.449772834777832
MSE-test 5.605559808154102
Best params: {'sel__n_features_to_select': 5, 'sel__estimator__learning_rate': 0.2, 'est__output_shape': 1, 'est__nn3': 5, 'est__nn2': 70, 'est__nn1': 50, 'est__nl3': 3, 'est__nl2': 2, 'est__nl1': 3, 'est__lr': 0.001, 'est__l2': 0.001, 'est__l1': 0.003, 'est__input_shape': 5, 'est__dropout': 0.2, 'est__decay': 0, 'est__act': 'relu'}
Selected features: ['act_lab2', 'actq1_lab2', 'actq3_lab

['act_lab2', 'actq1_lab2', 'actq3_lab2', 'mean(qavt$_lab2)', 'avgtime_lab2']

In [None]:
run_process(datalab2, rand_cv)

Fitting 5 folds for each of 10 candidates, totalling 50 fits
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test-fit: -5.9231076530314555
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test -7.350379467010498
MSE-test 5.503988235865399
Best params: {'sel__n_features_to_select': 5, 'sel__estimator__learning_rate': 0.05, 'est__output_shape': 1, 'est__nn3': 30, 'est__nn2': 10, 'est__nn1': 20, 'est__nl3': 3, 'est__nl2': 3, 'est__nl1': 3, 'est__lr': 0.001, 'est__l2': 0.0001, 'est__l1': 0.003, 'est__input_shape': 5, 'est__dropout': 0.2, 'est__decay': 1e-09, 'est__act': 'relu'}
Selected features: ['actq1_lab2', 'actq3_lab2', 

['actq1_lab2',
 'actq3_lab2',
 'mean(qact$_lab2)',
 'max(qme$_lab2)',
 'avgtime_lab2']

In [None]:
run_process(datalab2, rand_cv)

Fitting 5 folds for each of 10 candidates, totalling 50 fits
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test-fit: -5.9332081344107435
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test -8.12122917175293
MSE-test 4.969773375214392
Best params: {'sel__n_features_to_select': 5, 'sel__estimator__learning_rate': 0.1, 'est__output_shape': 1, 'est__nn3': 15, 'est__nn2': 70, 'est__nn1': 20, 'est__nl3': 2, 'est__nl2': 2, 'est__nl1': 0, 'est__lr': 0.001, 'est__l2': 0.01, 'est__l1': 0.003, 'est__input_shape': 5, 'est__dropout': 0.2, 'est__decay': 0, 'est__act': 'relu'}
Selected features: ['ut_lab2', 'rtr_lab2', 'actq1_lab2',

['ut_lab2', 'rtr_lab2', 'actq1_lab2', 'actq3_lab2', 'mean(qavt$_lab2)']

In [None]:
run_process(datalab2, rand_cv)

Fitting 5 folds for each of 10 candidates, totalling 50 fits
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test-fit: -5.921892392514841
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test -6.015786170959473
MSE-test 6.01578594276469
Best params: {'sel__n_features_to_select': 5, 'sel__estimator__learning_rate': 0.05, 'est__output_shape': 1, 'est__nn3': 30, 'est__nn2': 10, 'est__nn1': 50, 'est__nl3': 2, 'est__nl2': 0, 'est__nl1': 2, 'est__lr': 0.0001, 'est__l2': 0, 'est__l1': 0, 'est__input_shape': 5, 'est__dropout': 0.3, 'est__decay': 0, 'est__act': 'relu'}
Selected features: ['ct_lab2', 'rtr_lab2', 'actq1_lab2', 'actq

['ct_lab2', 'rtr_lab2', 'actq1_lab2', 'actq3_lab2', 'avgtime_lab2']

In [None]:
run_process(datalab2, rand_cv)

Fitting 5 folds for each of 10 candidates, totalling 50 fits
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test-fit: -5.919988275213578
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test -6.937684535980225
MSE-test 6.389940125838646
Best params: {'sel__n_features_to_select': 5, 'sel__estimator__learning_rate': 0.05, 'est__output_shape': 1, 'est__nn3': 30, 'est__nn2': 40, 'est__nn1': 50, 'est__nl3': 3, 'est__nl2': 0, 'est__nl1': 1, 'est__lr': 0.01, 'est__l2': 0.0001, 'est__l1': 0.001, 'est__input_shape': 5, 'est__dropout': 0, 'est__decay': 0, 'est__act': 'relu'}
Selected features: ['rt_lab2', 'actq2_lab2', 'actq3_lab2

['rt_lab2', 'actq2_lab2', 'actq3_lab2', 'max(qat$_lab2)', 'avgtime_lab2']

In [None]:
run_process(datalab2, rand_cv)

Fitting 5 folds for each of 10 candidates, totalling 50 fits
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test-fit: -5.9256723894232675
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test -7.306046962738037
MSE-test 5.589627618331404
Best params: {'sel__n_features_to_select': 5, 'sel__estimator__learning_rate': 0.2, 'est__output_shape': 1, 'est__nn3': 5, 'est__nn2': 70, 'est__nn1': 100, 'est__nl3': 0, 'est__nl2': 3, 'est__nl1': 1, 'est__lr': 0.001, 'est__l2': 0.0001, 'est__l1': 0.001, 'est__input_shape': 5, 'est__dropout': 0.1, 'est__decay': 0, 'est__act': 'sigmoid'}
Selected features: ['ct_lab2', 'err_lab2', 'actq1_

['ct_lab2', 'err_lab2', 'actq1_lab2', 'mean(qavt$_lab2)', 'avgtime_lab2']

In [None]:
run_process(datalab2, rand_cv)

Fitting 5 folds for each of 10 candidates, totalling 50 fits
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test-fit: -5.908403679619407
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test -6.253237247467041
MSE-test 6.232684761993369
Best params: {'sel__n_features_to_select': 5, 'sel__estimator__learning_rate': 0.05, 'est__output_shape': 1, 'est__nn3': 15, 'est__nn2': 70, 'est__nn1': 20, 'est__nl3': 3, 'est__nl2': 3, 'est__nl1': 0, 'est__lr': 0.0001, 'est__l2': 0.0001, 'est__l1': 0, 'est__input_shape': 5, 'est__dropout': 0.2, 'est__decay': 1e-06, 'est__act': 'relu'}
Selected features: ['act_lab2', 'rtr_lab2', 'actq1_l

['act_lab2', 'rtr_lab2', 'actq1_lab2', 'mean(qavt$_lab2)', 'avgtime_lab2']

In [None]:
run_process(datalab2, rand_cv)

Fitting 5 folds for each of 10 candidates, totalling 50 fits
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test-fit: -5.9206813617931955
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test -5.365689277648926
MSE-test 5.1888011969991945
Best params: {'sel__n_features_to_select': 5, 'sel__estimator__learning_rate': 0.1, 'est__output_shape': 1, 'est__nn3': 30, 'est__nn2': 40, 'est__nn1': 20, 'est__nl3': 0, 'est__nl2': 3, 'est__nl1': 1, 'est__lr': 0.01, 'est__l2': 0.001, 'est__l1': 0.0001, 'est__input_shape': 5, 'est__dropout': 0.1, 'est__decay': 1e-09, 'est__act': 'relu'}
Selected features: ['ut_lab2', 'act_lab2', 'actq3

['ut_lab2', 'act_lab2', 'actq3_lab2', 'mean(qmsr$_lab2)', 'avgtime_lab2']



---



In [None]:
run_process(datalab3, rand_cv)

Fitting 5 folds for each of 10 candidates, totalling 50 fits
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test-fit: -5.920140462853393
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test -5.531270503997803
MSE-test 4.821540572510062
Best params: {'sel__n_features_to_select': 5, 'sel__estimator__learning_rate': 0.1, 'est__output_shape': 1, 'est__nn3': 15, 'est__nn2': 70, 'est__nn1': 20, 'est__nl3': 0, 'est__nl2': 3, 'est__nl1': 2, 'est__lr': 0.001, 'est__l2': 0.003, 'est__l1': 0.0001, 'est__input_shape': 5, 'est__dropout': 0.3, 'est__decay': 0, 'est__act': 'sigmoid'}
Selected features: ['ut_lab3', 'act_lab3', 'rt_lab3

['ut_lab3', 'act_lab3', 'rt_lab3', 'actq2_lab3', 'avgtime_lab3']

In [None]:
run_process(datalab3, rand_cv)

Fitting 5 folds for each of 10 candidates, totalling 50 fits
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test-fit: -5.913329034622601
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test -7.094500541687012
MSE-test 5.5303557567620425
Best params: {'sel__n_features_to_select': 5, 'sel__estimator__learning_rate': 0.2, 'est__output_shape': 1, 'est__nn3': 30, 'est__nn2': 40, 'est__nn1': 50, 'est__nl3': 3, 'est__nl2': 0, 'est__nl1': 1, 'est__lr': 0.01, 'est__l2': 0.0001, 'est__l1': 0.003, 'est__input_shape': 5, 'est__dropout': 0.2, 'est__decay': 1e-09, 'est__act': 'relu'}
Selected features: ['act_lab3', 'rt_lab3', 'cer_la

['act_lab3', 'rt_lab3', 'cer_lab3', 'mean(qc$_lab3)', 'avgtime_lab3']

In [None]:
run_process(datalab3, rand_cv)

Fitting 5 folds for each of 10 candidates, totalling 50 fits
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test-fit: -5.929269555439978
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test -6.7596755027771
MSE-test 5.8206793748908385
Best params: {'sel__n_features_to_select': 5, 'sel__estimator__learning_rate': 0.05, 'est__output_shape': 1, 'est__nn3': 30, 'est__nn2': 70, 'est__nn1': 20, 'est__nl3': 2, 'est__nl2': 2, 'est__nl1': 0, 'est__lr': 0.0001, 'est__l2': 0, 'est__l1': 0.001, 'est__input_shape': 5, 'est__dropout': 0.1, 'est__decay': 1e-09, 'est__act': 'relu'}
Selected features: ['g_lab3', 'ut_lab3', 'act_lab3', '

['g_lab3', 'ut_lab3', 'act_lab3', 'actq3_lab3', 'avgtime_lab3']

In [None]:
run_process(datalab3, rand_cv)

Fitting 5 folds for each of 10 candidates, totalling 50 fits
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test-fit: -5.9224593840366655
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test -6.94298791885376
MSE-test 6.90213427440068
Best params: {'sel__n_features_to_select': 5, 'sel__estimator__learning_rate': 0.2, 'est__output_shape': 1, 'est__nn3': 15, 'est__nn2': 40, 'est__nn1': 50, 'est__nl3': 0, 'est__nl2': 0, 'est__nl1': 2, 'est__lr': 0.0001, 'est__l2': 0.0001, 'est__l1': 0.0001, 'est__input_shape': 5, 'est__dropout': 0.3, 'est__decay': 0, 'est__act': 'sigmoid'}
Selected features: ['ut_lab3', 'act_lab3', 'rt_lab

['ut_lab3', 'act_lab3', 'rt_lab3', 'actq1_lab3', 'sum(qat$_lab3)']

In [None]:
run_process(datalab3, rand_cv)

Fitting 5 folds for each of 10 candidates, totalling 50 fits
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test-fit: -5.9040772714912
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test -5.857508182525635
MSE-test 5.822901760813015
Best params: {'sel__n_features_to_select': 5, 'sel__estimator__learning_rate': 0.1, 'est__output_shape': 1, 'est__nn3': 15, 'est__nn2': 40, 'est__nn1': 100, 'est__nl3': 2, 'est__nl2': 2, 'est__nl1': 3, 'est__lr': 0.01, 'est__l2': 0.0001, 'est__l1': 0, 'est__input_shape': 5, 'est__dropout': 0.2, 'est__decay': 1e-09, 'est__act': 'relu'}
Selected features: ['ut_lab3', 'act_lab3', 'rt_lab3', 'a

['ut_lab3', 'act_lab3', 'rt_lab3', 'actq1_lab3', 'actq3_lab3']

In [None]:
run_process(datalab3, rand_cv)

Fitting 5 folds for each of 10 candidates, totalling 50 fits
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test-fit: -5.929092788896574
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test -6.519593715667725
MSE-test 6.442246311845945
Best params: {'sel__n_features_to_select': 5, 'sel__estimator__learning_rate': 0.1, 'est__output_shape': 1, 'est__nn3': 15, 'est__nn2': 40, 'est__nn1': 50, 'est__nl3': 0, 'est__nl2': 0, 'est__nl1': 3, 'est__lr': 0.001, 'est__l2': 0.0001, 'est__l1': 0.0001, 'est__input_shape': 5, 'est__dropout': 0.3, 'est__decay': 1e-06, 'est__act': 'relu'}
Selected features: ['ut_lab3', 'rt_lab3', 'cer_la

['ut_lab3', 'rt_lab3', 'cer_lab3', 'actq2_lab3', 'avgtime_lab3']

In [None]:
run_process(datalab3, rand_cv)

Fitting 5 folds for each of 10 candidates, totalling 50 fits
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test-fit: -5.9184795171642115
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test -5.730086803436279
MSE-test 5.456266632447529
Best params: {'sel__n_features_to_select': 5, 'sel__estimator__learning_rate': 0.2, 'est__output_shape': 1, 'est__nn3': 5, 'est__nn2': 40, 'est__nn1': 100, 'est__nl3': 0, 'est__nl2': 2, 'est__nl1': 3, 'est__lr': 0.0001, 'est__l2': 0.0001, 'est__l1': 0.0001, 'est__input_shape': 5, 'est__dropout': 0.1, 'est__decay': 1e-09, 'est__act': 'relu'}
Selected features: ['ut_lab3', 'rt_lab3', 'cer_

['ut_lab3', 'rt_lab3', 'cer_lab3', 'actq1_lab3', 'mean(qact$_lab3)']

In [None]:
run_process(datalab3, rand_cv)

Fitting 5 folds for each of 10 candidates, totalling 50 fits
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test-fit: -5.9203510092908065
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test -7.979729175567627
MSE-test 6.372183181067639
Best params: {'sel__n_features_to_select': 5, 'sel__estimator__learning_rate': 0.1, 'est__output_shape': 1, 'est__nn3': 30, 'est__nn2': 70, 'est__nn1': 50, 'est__nl3': 3, 'est__nl2': 3, 'est__nl1': 0, 'est__lr': 0.01, 'est__l2': 0.0001, 'est__l1': 0.001, 'est__input_shape': 5, 'est__dropout': 0.3, 'est__decay': 0, 'est__act': 'relu'}
Selected features: ['g_lab3', 'ut_lab3', 'act_lab3', '

['g_lab3', 'ut_lab3', 'act_lab3', 'rtr_lab3', 'actq1_lab3']

In [None]:
run_process(datalab3, rand_cv)

Fitting 5 folds for each of 10 candidates, totalling 50 fits
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test-fit: -5.926707916778894
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test -5.962094306945801
MSE-test 5.898590205641643
Best params: {'sel__n_features_to_select': 5, 'sel__estimator__learning_rate': 0.05, 'est__output_shape': 1, 'est__nn3': 30, 'est__nn2': 40, 'est__nn1': 20, 'est__nl3': 0, 'est__nl2': 2, 'est__nl1': 3, 'est__lr': 0.001, 'est__l2': 0.0001, 'est__l1': 0.0001, 'est__input_shape': 5, 'est__dropout': 0.3, 'est__decay': 0, 'est__act': 'sigmoid'}
Selected features: ['ut_lab3', 'cer_lab3', 'actq1

['ut_lab3', 'cer_lab3', 'actq1_lab3', 'mean(qact$_lab3)', 'avgtime_lab3']

In [None]:
run_process(datalab3, rand_cv)

Fitting 5 folds for each of 10 candidates, totalling 50 fits
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test-fit: -5.927691035297036
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test -6.402716636657715
MSE-test 6.313315179470624
Best params: {'sel__n_features_to_select': 5, 'sel__estimator__learning_rate': 0.05, 'est__output_shape': 1, 'est__nn3': 15, 'est__nn2': 40, 'est__nn1': 20, 'est__nl3': 2, 'est__nl2': 3, 'est__nl1': 3, 'est__lr': 0.0001, 'est__l2': 0, 'est__l1': 0.0001, 'est__input_shape': 5, 'est__dropout': 0.3, 'est__decay': 0, 'est__act': 'relu'}
Selected features: ['g_lab3', 'ut_lab3', 'act_lab3', 'ac

['g_lab3', 'ut_lab3', 'act_lab3', 'actq2_lab3', 'actq3_lab3']



---



In [None]:
run_process(datalab4, rand_cv)

Fitting 5 folds for each of 10 candidates, totalling 50 fits
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test-fit: -5.924451904583831
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test -5.738160133361816
MSE-test 5.610004427353571
Best params: {'sel__n_features_to_select': 5, 'sel__estimator__learning_rate': 0.2, 'est__output_shape': 1, 'est__nn3': 30, 'est__nn2': 10, 'est__nn1': 50, 'est__nl3': 3, 'est__nl2': 2, 'est__nl1': 0, 'est__lr': 0.0001, 'est__l2': 0.001, 'est__l1': 0.0001, 'est__input_shape': 5, 'est__dropout': 0.2, 'est__decay': 0, 'est__act': 'relu'}
Selected features: ['ut_lab4', 'rt_lab4', 'rtr_lab4',

['ut_lab4', 'rt_lab4', 'rtr_lab4', 'cer_lab4', 'mean(qc$_lab4)']

In [None]:
run_process(datalab4, rand_cv)

Fitting 5 folds for each of 10 candidates, totalling 50 fits
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test-fit: -5.930687980266312
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test -6.902947425842285
MSE-test 6.180248845881094
Best params: {'sel__n_features_to_select': 5, 'sel__estimator__learning_rate': 0.05, 'est__output_shape': 1, 'est__nn3': 15, 'est__nn2': 40, 'est__nn1': 20, 'est__nl3': 3, 'est__nl2': 0, 'est__nl1': 1, 'est__lr': 0.001, 'est__l2': 0.003, 'est__l1': 0.003, 'est__input_shape': 5, 'est__dropout': 0.3, 'est__decay': 1e-09, 'est__act': 'relu'}
Selected features: ['rtr_lab4', 'cer_lab4', 'actq1

['rtr_lab4', 'cer_lab4', 'actq1_lab4', 'mean(qavt$_lab4)', 'mean(qc$_lab4)']

In [None]:
run_process(datalab4, rand_cv)

Fitting 5 folds for each of 10 candidates, totalling 50 fits
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test-fit: -5.9251643733906425
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test -10.835164070129395
MSE-test 7.017088315442554
Best params: {'sel__n_features_to_select': 5, 'sel__estimator__learning_rate': 0.2, 'est__output_shape': 1, 'est__nn3': 30, 'est__nn2': 70, 'est__nn1': 50, 'est__nl3': 1, 'est__nl2': 3, 'est__nl1': 0, 'est__lr': 0.0001, 'est__l2': 0.0001, 'est__l1': 0.003, 'est__input_shape': 5, 'est__dropout': 0.2, 'est__decay': 0, 'est__act': 'relu'}
Selected features: ['act_lab4', 'rtr_lab4', 'cer_la

['act_lab4', 'rtr_lab4', 'cer_lab4', 'mean(qg$_lab4)', 'mean(qc$_lab4)']

In [None]:
run_process(datalab4, rand_cv)

Fitting 5 folds for each of 10 candidates, totalling 50 fits
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test-fit: -5.943975715360745
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test -9.176057815551758
MSE-test 6.381455677292427
Best params: {'sel__n_features_to_select': 5, 'sel__estimator__learning_rate': 0.2, 'est__output_shape': 1, 'est__nn3': 15, 'est__nn2': 40, 'est__nn1': 20, 'est__nl3': 0, 'est__nl2': 1, 'est__nl1': 3, 'est__lr': 0.01, 'est__l2': 0.001, 'est__l1': 0.01, 'est__input_shape': 5, 'est__dropout': 0.1, 'est__decay': 1e-06, 'est__act': 'sigmoid'}
Selected features: ['act_lab4', 'rt_lab4', 'rtr_la

['act_lab4', 'rt_lab4', 'rtr_lab4', 'actq1_lab4', 'mean(qc$_lab4)']

In [None]:
run_process(datalab4, rand_cv)

Fitting 5 folds for each of 10 candidates, totalling 50 fits
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test-fit: -5.924107865755802
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test -6.464548110961914
MSE-test 6.372787834448027
Best params: {'sel__n_features_to_select': 5, 'sel__estimator__learning_rate': 0.1, 'est__output_shape': 1, 'est__nn3': 15, 'est__nn2': 70, 'est__nn1': 20, 'est__nl3': 3, 'est__nl2': 2, 'est__nl1': 0, 'est__lr': 0.0001, 'est__l2': 0.0001, 'est__l1': 0.0001, 'est__input_shape': 5, 'est__dropout': 0.3, 'est__decay': 0, 'est__act': 'relu'}
Selected features: ['g_lab4', 'rt_lab4', 'rtr_lab4',

['g_lab4', 'rt_lab4', 'rtr_lab4', 'actq1_lab4', 'mean(qmsr$_lab4)']

In [None]:
run_process(datalab4, rand_cv)

Fitting 5 folds for each of 10 candidates, totalling 50 fits
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test-fit: -5.92782586829041
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test -5.660845756530762
MSE-test 5.175385180263577
Best params: {'sel__n_features_to_select': 5, 'sel__estimator__learning_rate': 0.1, 'est__output_shape': 1, 'est__nn3': 30, 'est__nn2': 70, 'est__nn1': 20, 'est__nl3': 3, 'est__nl2': 3, 'est__nl1': 2, 'est__lr': 0.0001, 'est__l2': 0.001, 'est__l1': 0.0001, 'est__input_shape': 5, 'est__dropout': 0.1, 'est__decay': 1e-09, 'est__act': 'relu'}
Selected features: ['norm_log(dis_lab4)', 'rt_lab4

['norm_log(dis_lab4)', 'rt_lab4', 'cer_lab4', 'actq1_lab4', 'mean(qavt$_lab4)']

In [None]:
run_process(datalab4, rand_cv)

Fitting 5 folds for each of 10 candidates, totalling 50 fits
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test-fit: -5.9196255736203645
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test -18.066213607788086
MSE-test 5.955807588537583
Best params: {'sel__n_features_to_select': 5, 'sel__estimator__learning_rate': 0.2, 'est__output_shape': 1, 'est__nn3': 30, 'est__nn2': 70, 'est__nn1': 50, 'est__nl3': 0, 'est__nl2': 3, 'est__nl1': 1, 'est__lr': 0.0001, 'est__l2': 0.0001, 'est__l1': 0.01, 'est__input_shape': 5, 'est__dropout': 0.2, 'est__decay': 0, 'est__act': 'sigmoid'}
Selected features: ['rt_lab4', 'cer_lab4', 'actq1

['rt_lab4', 'cer_lab4', 'actq1_lab4', 'mean(qavt$_lab4)', 'mean(qc$_lab4)']

In [None]:
run_process(datalab4, rand_cv)

Fitting 5 folds for each of 10 candidates, totalling 50 fits
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test-fit: -5.92215451436531
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test -5.260612487792969
MSE-test 5.260612471771458
Best params: {'sel__n_features_to_select': 5, 'sel__estimator__learning_rate': 0.2, 'est__output_shape': 1, 'est__nn3': 15, 'est__nn2': 70, 'est__nn1': 50, 'est__nl3': 1, 'est__nl2': 2, 'est__nl1': 1, 'est__lr': 0.01, 'est__l2': 0, 'est__l1': 0, 'est__input_shape': 5, 'est__dropout': 0.2, 'est__decay': 1e-09, 'est__act': 'relu'}
Selected features: ['rt_lab4', 'rtr_lab4', 'err_lab4', 'actq2

['rt_lab4', 'rtr_lab4', 'err_lab4', 'actq2_lab4', 'mean(qc$_lab4)']

In [None]:
run_process(datalab4, rand_cv)

Fitting 5 folds for each of 10 candidates, totalling 50 fits
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test-fit: -5.924832306296704
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test -7.804508686065674
MSE-test 5.423649537337166
Best params: {'sel__n_features_to_select': 5, 'sel__estimator__learning_rate': 0.1, 'est__output_shape': 1, 'est__nn3': 30, 'est__nn2': 10, 'est__nn1': 100, 'est__nl3': 1, 'est__nl2': 0, 'est__nl1': 3, 'est__lr': 0.01, 'est__l2': 0.01, 'est__l1': 0, 'est__input_shape': 5, 'est__dropout': 0.2, 'est__decay': 1e-09, 'est__act': 'relu'}
Selected features: ['rt_lab4', 'rtr_lab4', 'cer_lab4', '

['rt_lab4', 'rtr_lab4', 'cer_lab4', 'actq1_lab4', 'mean(qc$_lab4)']

In [None]:
run_process(datalab4, rand_cv)

Fitting 5 folds for each of 10 candidates, totalling 50 fits
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test-fit: -5.912812298011652
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test -6.652135848999023
MSE-test 5.40929847260508
Best params: {'sel__n_features_to_select': 5, 'sel__estimator__learning_rate': 0.05, 'est__output_shape': 1, 'est__nn3': 30, 'est__nn2': 40, 'est__nn1': 50, 'est__nl3': 2, 'est__nl2': 1, 'est__nl1': 3, 'est__lr': 0.0001, 'est__l2': 0.0001, 'est__l1': 0.001, 'est__input_shape': 5, 'est__dropout': 0.3, 'est__decay': 1e-09, 'est__act': 'relu'}
Selected features: ['rt_lab4', 'err_lab4', 'cer_l

['rt_lab4', 'err_lab4', 'cer_lab4', 'actq1_lab4', 'mean(qc$_lab4)']

In [None]:
estimator = model

param_grid = {
    'nl1':            nl1,
    'nl2':            nl2,
    'nl3':            nl3,
    'nn1':            nn1,
    'nn2':            nn2,
    'nn3':            nn3,
    'act':            activation,
    'l1':             l1,
    'l2':             l2,
    'lr':             lr,
    'decay':          decay,
    'dropout':        dropout, 
    'input_shape':    [20],
    'output_shape':   [1]
}

rand_cv = RandomizedSearchCV(estimator=estimator,
                             param_distributions=param_grid,
                             verbose=100,
                             n_iter=10,
                             scoring='neg_mean_squared_error',
                             n_jobs=-1,
                             return_train_score=True,
                             cv=KFold(n_splits=5, shuffle=True))

In [None]:
selected_features_ann_1 = ['actq3_lab1','actq1_lab1','mean(qmsr$_lab1)','rtr_lab1','cer_lab1']
selected_features_ann_2 = ['actq3_lab2','actq1_lab2','mean(qavt$_lab2)','avgtime_lab2','rt_lab2']
selected_features_ann_3 = ['rt_lab3','actq1_lab3','ut_lab3','mean(qact$_lab3)','cer_lab3']
selected_features_ann_4 = ['rt_lab4','cer_lab4','err_lab4','actq1_lab4','mean(qc$_lab4)']

1_2

In [None]:
dataset = datalab1[[TARGET] + selected_features_ann_1].join(datalab2[selected_features_ann_2])
run_process(dataset,rand_cv)

Fitting 5 folds for each of 10 candidates, totalling 50 fits
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test-fit: -5.914448891854319
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test -6.147817611694336
MSE-test 5.805909549324682
Best params: {'output_shape': 1, 'nn3': 30, 'nn2': 40, 'nn1': 100, 'nl3': 2, 'nl2': 0, 'nl1': 2, 'lr': 0.01, 'l2': 0.001, 'l1': 0.0001, 'input_shape': 10, 'dropout': 0, 'decay': 1e-09, 'act': 'relu'}


['actq3_lab1',
 'actq1_lab1',
 'mean(qmsr$_lab1)',
 'rtr_lab1',
 'cer_lab1',
 'actq3_lab2',
 'actq1_lab2',
 'mean(qavt$_lab2)',
 'avgtime_lab2',
 'rt_lab2']

In [None]:
dataset = datalab1[[TARGET] + selected_features_ann_1].join(datalab2[selected_features_ann_2])
run_process(dataset,rand_cv)

Fitting 5 folds for each of 10 candidates, totalling 50 fits
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test-fit: -5.9262324817175145
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test -6.819202423095703
MSE-test 6.0503530130831
Best params: {'output_shape': 1, 'nn3': 30, 'nn2': 70, 'nn1': 100, 'nl3': 0, 'nl2': 1, 'nl1': 1, 'lr': 0.0001, 'l2': 0.0001, 'l1': 0.001, 'input_shape': 10, 'dropout': 0, 'decay': 0, 'act': 'sigmoid'}


['actq3_lab1',
 'actq1_lab1',
 'mean(qmsr$_lab1)',
 'rtr_lab1',
 'cer_lab1',
 'actq3_lab2',
 'actq1_lab2',
 'mean(qavt$_lab2)',
 'avgtime_lab2',
 'rt_lab2']

In [None]:
dataset = datalab1[[TARGET] + selected_features_ann_1].join(datalab2[selected_features_ann_2])
run_process(dataset,rand_cv)

Fitting 5 folds for each of 10 candidates, totalling 50 fits
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test-fit: -5.917197743307329
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test -6.351170063018799
MSE-test 6.209518135388089
Best params: {'output_shape': 1, 'nn3': 5, 'nn2': 40, 'nn1': 20, 'nl3': 0, 'nl2': 3, 'nl1': 2, 'lr': 0.01, 'l2': 0.001, 'l1': 0, 'input_shape': 10, 'dropout': 0.1, 'decay': 1e-06, 'act': 'relu'}


['actq3_lab1',
 'actq1_lab1',
 'mean(qmsr$_lab1)',
 'rtr_lab1',
 'cer_lab1',
 'actq3_lab2',
 'actq1_lab2',
 'mean(qavt$_lab2)',
 'avgtime_lab2',
 'rt_lab2']

In [None]:
dataset = datalab1[[TARGET] + selected_features_ann_1].join(datalab2[selected_features_ann_2])
run_process(dataset,rand_cv)

Fitting 5 folds for each of 10 candidates, totalling 50 fits
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test-fit: -5.912251442993624
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test -7.034832000732422
MSE-test 6.915751719699644
Best params: {'output_shape': 1, 'nn3': 30, 'nn2': 70, 'nn1': 100, 'nl3': 0, 'nl2': 0, 'nl1': 2, 'lr': 0.001, 'l2': 0.001, 'l1': 0, 'input_shape': 10, 'dropout': 0.1, 'decay': 0, 'act': 'sigmoid'}


['actq3_lab1',
 'actq1_lab1',
 'mean(qmsr$_lab1)',
 'rtr_lab1',
 'cer_lab1',
 'actq3_lab2',
 'actq1_lab2',
 'mean(qavt$_lab2)',
 'avgtime_lab2',
 'rt_lab2']

In [None]:
dataset = datalab1[[TARGET] + selected_features_ann_1].join(datalab2[selected_features_ann_2])
run_process(dataset,rand_cv)

Fitting 5 folds for each of 10 candidates, totalling 50 fits
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test-fit: -5.9241500164555605
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test -5.59423303604126
MSE-test 5.2713025668986
Best params: {'output_shape': 1, 'nn3': 15, 'nn2': 40, 'nn1': 20, 'nl3': 2, 'nl2': 2, 'nl1': 0, 'lr': 0.001, 'l2': 0.003, 'l1': 0.0001, 'input_shape': 10, 'dropout': 0.1, 'decay': 1e-06, 'act': 'relu'}


['actq3_lab1',
 'actq1_lab1',
 'mean(qmsr$_lab1)',
 'rtr_lab1',
 'cer_lab1',
 'actq3_lab2',
 'actq1_lab2',
 'mean(qavt$_lab2)',
 'avgtime_lab2',
 'rt_lab2']

In [None]:
dataset = datalab1[[TARGET] + selected_features_ann_1].join(datalab2[selected_features_ann_2])
run_process(dataset,rand_cv)

Fitting 5 folds for each of 10 candidates, totalling 50 fits
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test-fit: -5.923447544610971
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test -8.684288024902344
MSE-test 5.0050803878888575
Best params: {'output_shape': 1, 'nn3': 30, 'nn2': 70, 'nn1': 100, 'nl3': 0, 'nl2': 2, 'nl1': 1, 'lr': 0.0001, 'l2': 0.0001, 'l1': 0.003, 'input_shape': 10, 'dropout': 0.3, 'decay': 1e-06, 'act': 'sigmoid'}


['actq3_lab1',
 'actq1_lab1',
 'mean(qmsr$_lab1)',
 'rtr_lab1',
 'cer_lab1',
 'actq3_lab2',
 'actq1_lab2',
 'mean(qavt$_lab2)',
 'avgtime_lab2',
 'rt_lab2']

In [None]:
dataset = datalab1[[TARGET] + selected_features_ann_1].join(datalab2[selected_features_ann_2])
run_process(dataset,rand_cv)

Fitting 5 folds for each of 10 candidates, totalling 50 fits
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test-fit: -5.907331914757108
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test -6.631399154663086
MSE-test 5.502857847292539
Best params: {'output_shape': 1, 'nn3': 30, 'nn2': 70, 'nn1': 20, 'nl3': 2, 'nl2': 2, 'nl1': 1, 'lr': 0.0001, 'l2': 0, 'l1': 0.001, 'input_shape': 10, 'dropout': 0, 'decay': 1e-06, 'act': 'relu'}


['actq3_lab1',
 'actq1_lab1',
 'mean(qmsr$_lab1)',
 'rtr_lab1',
 'cer_lab1',
 'actq3_lab2',
 'actq1_lab2',
 'mean(qavt$_lab2)',
 'avgtime_lab2',
 'rt_lab2']

In [None]:
dataset = datalab1[[TARGET] + selected_features_ann_1].join(datalab2[selected_features_ann_2])
run_process(dataset,rand_cv)

Fitting 5 folds for each of 10 candidates, totalling 50 fits
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test-fit: -5.9294097511859105
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test -5.999378204345703
MSE-test 4.702004105167467
Best params: {'output_shape': 1, 'nn3': 15, 'nn2': 70, 'nn1': 20, 'nl3': 0, 'nl2': 3, 'nl1': 2, 'lr': 0.001, 'l2': 0, 'l1': 0.001, 'input_shape': 10, 'dropout': 0.3, 'decay': 1e-09, 'act': 'sigmoid'}


['actq3_lab1',
 'actq1_lab1',
 'mean(qmsr$_lab1)',
 'rtr_lab1',
 'cer_lab1',
 'actq3_lab2',
 'actq1_lab2',
 'mean(qavt$_lab2)',
 'avgtime_lab2',
 'rt_lab2']

In [None]:
dataset = datalab1[[TARGET] + selected_features_ann_1].join(datalab2[selected_features_ann_2])
run_process(dataset,rand_cv)

Fitting 5 folds for each of 10 candidates, totalling 50 fits
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test-fit: -5.922592611682122
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test -6.083332061767578
MSE-test 5.361429457583458
Best params: {'output_shape': 1, 'nn3': 15, 'nn2': 40, 'nn1': 20, 'nl3': 2, 'nl2': 1, 'nl1': 1, 'lr': 0.0001, 'l2': 0.01, 'l1': 0, 'input_shape': 10, 'dropout': 0.2, 'decay': 1e-09, 'act': 'relu'}


['actq3_lab1',
 'actq1_lab1',
 'mean(qmsr$_lab1)',
 'rtr_lab1',
 'cer_lab1',
 'actq3_lab2',
 'actq1_lab2',
 'mean(qavt$_lab2)',
 'avgtime_lab2',
 'rt_lab2']

In [None]:
dataset = datalab1[[TARGET] + selected_features_ann_1].join(datalab2[selected_features_ann_2])
run_process(dataset,rand_cv)

Fitting 5 folds for each of 10 candidates, totalling 50 fits
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test-fit: -5.926126723965541
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test -6.318737030029297
MSE-test 6.086149926593753
Best params: {'output_shape': 1, 'nn3': 15, 'nn2': 40, 'nn1': 20, 'nl3': 0, 'nl2': 1, 'nl1': 3, 'lr': 0.0001, 'l2': 0.003, 'l1': 0, 'input_shape': 10, 'dropout': 0.1, 'decay': 1e-09, 'act': 'relu'}


['actq3_lab1',
 'actq1_lab1',
 'mean(qmsr$_lab1)',
 'rtr_lab1',
 'cer_lab1',
 'actq3_lab2',
 'actq1_lab2',
 'mean(qavt$_lab2)',
 'avgtime_lab2',
 'rt_lab2']



---



1_2_3

In [None]:
dataset = datalab1[[TARGET] + selected_features_ann_1].join(datalab2[selected_features_ann_2]).join(datalab3[selected_features_ann_3])
run_process(dataset,rand_cv)

Fitting 5 folds for each of 10 candidates, totalling 50 fits
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test-fit: -5.942257119036137
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test -6.235172748565674
MSE-test 5.8096365725676105
Best params: {'output_shape': 1, 'nn3': 30, 'nn2': 40, 'nn1': 20, 'nl3': 0, 'nl2': 3, 'nl1': 1, 'lr': 0.01, 'l2': 0.003, 'l1': 0.0001, 'input_shape': 15, 'dropout': 0, 'decay': 0, 'act': 'sigmoid'}


['actq3_lab1',
 'actq1_lab1',
 'mean(qmsr$_lab1)',
 'rtr_lab1',
 'cer_lab1',
 'actq3_lab2',
 'actq1_lab2',
 'mean(qavt$_lab2)',
 'avgtime_lab2',
 'rt_lab2',
 'rt_lab3',
 'actq1_lab3',
 'ut_lab3',
 'mean(qact$_lab3)',
 'cer_lab3']

In [None]:
dataset = datalab1[[TARGET] + selected_features_ann_1].join(datalab2[selected_features_ann_2]).join(datalab3[selected_features_ann_3])
run_process(dataset,rand_cv)

Fitting 5 folds for each of 10 candidates, totalling 50 fits
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test-fit: -5.9144530134567255
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test -7.7043776512146
MSE-test 6.125266799825735
Best params: {'output_shape': 1, 'nn3': 15, 'nn2': 70, 'nn1': 20, 'nl3': 2, 'nl2': 3, 'nl1': 3, 'lr': 0.001, 'l2': 0, 'l1': 0.001, 'input_shape': 15, 'dropout': 0.2, 'decay': 1e-09, 'act': 'relu'}


['actq3_lab1',
 'actq1_lab1',
 'mean(qmsr$_lab1)',
 'rtr_lab1',
 'cer_lab1',
 'actq3_lab2',
 'actq1_lab2',
 'mean(qavt$_lab2)',
 'avgtime_lab2',
 'rt_lab2',
 'rt_lab3',
 'actq1_lab3',
 'ut_lab3',
 'mean(qact$_lab3)',
 'cer_lab3']

In [None]:
dataset = datalab1[[TARGET] + selected_features_ann_1].join(datalab2[selected_features_ann_2]).join(datalab3[selected_features_ann_3])
run_process(dataset,rand_cv)

Fitting 5 folds for each of 10 candidates, totalling 50 fits
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test-fit: -5.921640892976978
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test -12.183568000793457
MSE-test 6.507409505889915
Best params: {'output_shape': 1, 'nn3': 30, 'nn2': 70, 'nn1': 20, 'nl3': 1, 'nl2': 3, 'nl1': 0, 'lr': 0.0001, 'l2': 0.01, 'l1': 0.003, 'input_shape': 15, 'dropout': 0.2, 'decay': 0, 'act': 'relu'}


['actq3_lab1',
 'actq1_lab1',
 'mean(qmsr$_lab1)',
 'rtr_lab1',
 'cer_lab1',
 'actq3_lab2',
 'actq1_lab2',
 'mean(qavt$_lab2)',
 'avgtime_lab2',
 'rt_lab2',
 'rt_lab3',
 'actq1_lab3',
 'ut_lab3',
 'mean(qact$_lab3)',
 'cer_lab3']

In [None]:
dataset = datalab1[[TARGET] + selected_features_ann_1].join(datalab2[selected_features_ann_2]).join(datalab3[selected_features_ann_3])
run_process(dataset,rand_cv)

Fitting 5 folds for each of 10 candidates, totalling 50 fits
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test-fit: -5.916116805053997
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test -6.6438889503479
MSE-test 5.981943116582992
Best params: {'output_shape': 1, 'nn3': 5, 'nn2': 40, 'nn1': 100, 'nl3': 0, 'nl2': 2, 'nl1': 2, 'lr': 0.0001, 'l2': 0.003, 'l1': 0, 'input_shape': 15, 'dropout': 0.1, 'decay': 1e-09, 'act': 'relu'}


['actq3_lab1',
 'actq1_lab1',
 'mean(qmsr$_lab1)',
 'rtr_lab1',
 'cer_lab1',
 'actq3_lab2',
 'actq1_lab2',
 'mean(qavt$_lab2)',
 'avgtime_lab2',
 'rt_lab2',
 'rt_lab3',
 'actq1_lab3',
 'ut_lab3',
 'mean(qact$_lab3)',
 'cer_lab3']

In [None]:
dataset = datalab1[[TARGET] + selected_features_ann_1].join(datalab2[selected_features_ann_2]).join(datalab3[selected_features_ann_3])
run_process(dataset,rand_cv)

Fitting 5 folds for each of 10 candidates, totalling 50 fits
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test-fit: -5.915612985775448
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test -18.173477172851562
MSE-test 4.915467160343942
Best params: {'output_shape': 1, 'nn3': 30, 'nn2': 40, 'nn1': 50, 'nl3': 2, 'nl2': 2, 'nl1': 3, 'lr': 0.0001, 'l2': 0.0001, 'l1': 0.01, 'input_shape': 15, 'dropout': 0.2, 'decay': 0, 'act': 'relu'}


['actq3_lab1',
 'actq1_lab1',
 'mean(qmsr$_lab1)',
 'rtr_lab1',
 'cer_lab1',
 'actq3_lab2',
 'actq1_lab2',
 'mean(qavt$_lab2)',
 'avgtime_lab2',
 'rt_lab2',
 'rt_lab3',
 'actq1_lab3',
 'ut_lab3',
 'mean(qact$_lab3)',
 'cer_lab3']

In [None]:
dataset = datalab1[[TARGET] + selected_features_ann_1].join(datalab2[selected_features_ann_2]).join(datalab3[selected_features_ann_3])
run_process(dataset,rand_cv)

Fitting 5 folds for each of 10 candidates, totalling 50 fits
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test-fit: -5.921255698228536
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test -6.446985244750977
MSE-test 6.06316729344923
Best params: {'output_shape': 1, 'nn3': 15, 'nn2': 70, 'nn1': 50, 'nl3': 0, 'nl2': 1, 'nl1': 2, 'lr': 0.01, 'l2': 0.003, 'l1': 0, 'input_shape': 15, 'dropout': 0.1, 'decay': 1e-09, 'act': 'sigmoid'}


['actq3_lab1',
 'actq1_lab1',
 'mean(qmsr$_lab1)',
 'rtr_lab1',
 'cer_lab1',
 'actq3_lab2',
 'actq1_lab2',
 'mean(qavt$_lab2)',
 'avgtime_lab2',
 'rt_lab2',
 'rt_lab3',
 'actq1_lab3',
 'ut_lab3',
 'mean(qact$_lab3)',
 'cer_lab3']

In [None]:
dataset = datalab1[[TARGET] + selected_features_ann_1].join(datalab2[selected_features_ann_2]).join(datalab3[selected_features_ann_3])
run_process(dataset,rand_cv)

Fitting 5 folds for each of 10 candidates, totalling 50 fits
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test-fit: -5.9221207916939065
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test -13.002572059631348
MSE-test 6.313670651017777
Best params: {'output_shape': 1, 'nn3': 15, 'nn2': 70, 'nn1': 100, 'nl3': 1, 'nl2': 2, 'nl1': 2, 'lr': 0.0001, 'l2': 0, 'l1': 0.003, 'input_shape': 15, 'dropout': 0.1, 'decay': 0, 'act': 'relu'}


['actq3_lab1',
 'actq1_lab1',
 'mean(qmsr$_lab1)',
 'rtr_lab1',
 'cer_lab1',
 'actq3_lab2',
 'actq1_lab2',
 'mean(qavt$_lab2)',
 'avgtime_lab2',
 'rt_lab2',
 'rt_lab3',
 'actq1_lab3',
 'ut_lab3',
 'mean(qact$_lab3)',
 'cer_lab3']

In [None]:
dataset = datalab1[[TARGET] + selected_features_ann_1].join(datalab2[selected_features_ann_2]).join(datalab3[selected_features_ann_3])
run_process(dataset,rand_cv)

Fitting 5 folds for each of 10 candidates, totalling 50 fits
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test-fit: -5.9349567343215535
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test -6.186581611633301
MSE-test 6.159387666480008
Best params: {'output_shape': 1, 'nn3': 30, 'nn2': 10, 'nn1': 50, 'nl3': 2, 'nl2': 2, 'nl1': 0, 'lr': 0.0001, 'l2': 0, 'l1': 0.0001, 'input_shape': 15, 'dropout': 0, 'decay': 0, 'act': 'relu'}


['actq3_lab1',
 'actq1_lab1',
 'mean(qmsr$_lab1)',
 'rtr_lab1',
 'cer_lab1',
 'actq3_lab2',
 'actq1_lab2',
 'mean(qavt$_lab2)',
 'avgtime_lab2',
 'rt_lab2',
 'rt_lab3',
 'actq1_lab3',
 'ut_lab3',
 'mean(qact$_lab3)',
 'cer_lab3']

In [None]:
dataset = datalab1[[TARGET] + selected_features_ann_1].join(datalab2[selected_features_ann_2]).join(datalab3[selected_features_ann_3])
run_process(dataset,rand_cv)

Fitting 5 folds for each of 10 candidates, totalling 50 fits
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test-fit: -5.921971885267638
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test -7.0976433753967285
MSE-test 6.017182556573594
Best params: {'output_shape': 1, 'nn3': 30, 'nn2': 10, 'nn1': 20, 'nl3': 3, 'nl2': 2, 'nl1': 1, 'lr': 0.001, 'l2': 0.01, 'l1': 0, 'input_shape': 15, 'dropout': 0, 'decay': 1e-06, 'act': 'relu'}


['actq3_lab1',
 'actq1_lab1',
 'mean(qmsr$_lab1)',
 'rtr_lab1',
 'cer_lab1',
 'actq3_lab2',
 'actq1_lab2',
 'mean(qavt$_lab2)',
 'avgtime_lab2',
 'rt_lab2',
 'rt_lab3',
 'actq1_lab3',
 'ut_lab3',
 'mean(qact$_lab3)',
 'cer_lab3']

In [None]:
dataset = datalab1[[TARGET] + selected_features_ann_1].join(datalab2[selected_features_ann_2]).join(datalab3[selected_features_ann_3])
run_process(dataset,rand_cv)

Fitting 5 folds for each of 10 candidates, totalling 50 fits
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test-fit: -5.912984736600876
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test -5.092894554138184
MSE-test 5.092894642076721
Best params: {'output_shape': 1, 'nn3': 5, 'nn2': 10, 'nn1': 50, 'nl3': 0, 'nl2': 2, 'nl1': 3, 'lr': 0.001, 'l2': 0, 'l1': 0, 'input_shape': 15, 'dropout': 0, 'decay': 1e-09, 'act': 'relu'}


['actq3_lab1',
 'actq1_lab1',
 'mean(qmsr$_lab1)',
 'rtr_lab1',
 'cer_lab1',
 'actq3_lab2',
 'actq1_lab2',
 'mean(qavt$_lab2)',
 'avgtime_lab2',
 'rt_lab2',
 'rt_lab3',
 'actq1_lab3',
 'ut_lab3',
 'mean(qact$_lab3)',
 'cer_lab3']



---



1_2_3_4

In [None]:
dataset = datalab1[[TARGET] + selected_features_ann_1].join(datalab2[selected_features_ann_2]).join(datalab3[selected_features_ann_3]).join(datalab4[selected_features_ann_4])
run_process(dataset,rand_cv)

Fitting 5 folds for each of 10 candidates, totalling 50 fits
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test-fit: -5.902900277353085
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test -7.173131942749023
MSE-test 6.350189299537313
Best params: {'output_shape': 1, 'nn3': 15, 'nn2': 10, 'nn1': 50, 'nl3': 3, 'nl2': 1, 'nl1': 1, 'lr': 0.001, 'l2': 0.01, 'l1': 0, 'input_shape': 20, 'dropout': 0.1, 'decay': 1e-06, 'act': 'relu'}


['actq3_lab1',
 'actq1_lab1',
 'mean(qmsr$_lab1)',
 'rtr_lab1',
 'cer_lab1',
 'actq3_lab2',
 'actq1_lab2',
 'mean(qavt$_lab2)',
 'avgtime_lab2',
 'rt_lab2',
 'rt_lab3',
 'actq1_lab3',
 'ut_lab3',
 'mean(qact$_lab3)',
 'cer_lab3',
 'rt_lab4',
 'cer_lab4',
 'err_lab4',
 'actq1_lab4',
 'mean(qc$_lab4)']

In [None]:
dataset = datalab1[[TARGET] + selected_features_ann_1].join(datalab2[selected_features_ann_2]).join(datalab3[selected_features_ann_3]).join(datalab4[selected_features_ann_4])
run_process(dataset,rand_cv)

Fitting 5 folds for each of 10 candidates, totalling 50 fits
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test-fit: -5.902254612422867
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test -6.727807998657227
MSE-test 6.70688847098273
Best params: {'output_shape': 1, 'nn3': 30, 'nn2': 70, 'nn1': 20, 'nl3': 3, 'nl2': 2, 'nl1': 0, 'lr': 0.001, 'l2': 0.0001, 'l1': 0, 'input_shape': 20, 'dropout': 0.3, 'decay': 1e-09, 'act': 'relu'}


['actq3_lab1',
 'actq1_lab1',
 'mean(qmsr$_lab1)',
 'rtr_lab1',
 'cer_lab1',
 'actq3_lab2',
 'actq1_lab2',
 'mean(qavt$_lab2)',
 'avgtime_lab2',
 'rt_lab2',
 'rt_lab3',
 'actq1_lab3',
 'ut_lab3',
 'mean(qact$_lab3)',
 'cer_lab3',
 'rt_lab4',
 'cer_lab4',
 'err_lab4',
 'actq1_lab4',
 'mean(qc$_lab4)']

In [None]:
dataset = datalab1[[TARGET] + selected_features_ann_1].join(datalab2[selected_features_ann_2]).join(datalab3[selected_features_ann_3]).join(datalab4[selected_features_ann_4])
run_process(dataset,rand_cv)

Fitting 5 folds for each of 10 candidates, totalling 50 fits
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test-fit: -5.907100579253426
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test -5.191622257232666
MSE-test 4.8721048063577115
Best params: {'output_shape': 1, 'nn3': 15, 'nn2': 70, 'nn1': 20, 'nl3': 3, 'nl2': 1, 'nl1': 1, 'lr': 0.0001, 'l2': 0.003, 'l1': 0, 'input_shape': 20, 'dropout': 0.3, 'decay': 1e-09, 'act': 'relu'}


['actq3_lab1',
 'actq1_lab1',
 'mean(qmsr$_lab1)',
 'rtr_lab1',
 'cer_lab1',
 'actq3_lab2',
 'actq1_lab2',
 'mean(qavt$_lab2)',
 'avgtime_lab2',
 'rt_lab2',
 'rt_lab3',
 'actq1_lab3',
 'ut_lab3',
 'mean(qact$_lab3)',
 'cer_lab3',
 'rt_lab4',
 'cer_lab4',
 'err_lab4',
 'actq1_lab4',
 'mean(qc$_lab4)']

In [None]:
dataset = datalab1[[TARGET] + selected_features_ann_1].join(datalab2[selected_features_ann_2]).join(datalab3[selected_features_ann_3]).join(datalab4[selected_features_ann_4])
run_process(dataset,rand_cv)

Fitting 5 folds for each of 10 candidates, totalling 50 fits
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test-fit: -5.912414085588108
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test -6.190826416015625
MSE-test 6.065711864422466
Best params: {'output_shape': 1, 'nn3': 5, 'nn2': 70, 'nn1': 100, 'nl3': 2, 'nl2': 3, 'nl1': 0, 'lr': 0.001, 'l2': 0, 'l1': 0.0001, 'input_shape': 20, 'dropout': 0, 'decay': 1e-06, 'act': 'relu'}


['actq3_lab1',
 'actq1_lab1',
 'mean(qmsr$_lab1)',
 'rtr_lab1',
 'cer_lab1',
 'actq3_lab2',
 'actq1_lab2',
 'mean(qavt$_lab2)',
 'avgtime_lab2',
 'rt_lab2',
 'rt_lab3',
 'actq1_lab3',
 'ut_lab3',
 'mean(qact$_lab3)',
 'cer_lab3',
 'rt_lab4',
 'cer_lab4',
 'err_lab4',
 'actq1_lab4',
 'mean(qc$_lab4)']

In [None]:
dataset = datalab1[[TARGET] + selected_features_ann_1].join(datalab2[selected_features_ann_2]).join(datalab3[selected_features_ann_3]).join(datalab4[selected_features_ann_4])
run_process(dataset,rand_cv)

Fitting 5 folds for each of 10 candidates, totalling 50 fits
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test-fit: -5.909600476061483
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test -9.45512866973877
MSE-test 6.630978928418805
Best params: {'output_shape': 1, 'nn3': 15, 'nn2': 70, 'nn1': 100, 'nl3': 2, 'nl2': 0, 'nl1': 3, 'lr': 0.01, 'l2': 0.01, 'l1': 0.0001, 'input_shape': 20, 'dropout': 0.2, 'decay': 0, 'act': 'relu'}


['actq3_lab1',
 'actq1_lab1',
 'mean(qmsr$_lab1)',
 'rtr_lab1',
 'cer_lab1',
 'actq3_lab2',
 'actq1_lab2',
 'mean(qavt$_lab2)',
 'avgtime_lab2',
 'rt_lab2',
 'rt_lab3',
 'actq1_lab3',
 'ut_lab3',
 'mean(qact$_lab3)',
 'cer_lab3',
 'rt_lab4',
 'cer_lab4',
 'err_lab4',
 'actq1_lab4',
 'mean(qc$_lab4)']

In [None]:
dataset = datalab1[[TARGET] + selected_features_ann_1].join(datalab2[selected_features_ann_2]).join(datalab3[selected_features_ann_3]).join(datalab4[selected_features_ann_4])
run_process(dataset,rand_cv)

Fitting 5 folds for each of 10 candidates, totalling 50 fits
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test-fit: -5.912708684488838
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test -6.977842807769775
MSE-test 5.9972424174487236
Best params: {'output_shape': 1, 'nn3': 30, 'nn2': 40, 'nn1': 50, 'nl3': 0, 'nl2': 3, 'nl1': 1, 'lr': 0.01, 'l2': 0.001, 'l1': 0.001, 'input_shape': 20, 'dropout': 0.1, 'decay': 0, 'act': 'relu'}


['actq3_lab1',
 'actq1_lab1',
 'mean(qmsr$_lab1)',
 'rtr_lab1',
 'cer_lab1',
 'actq3_lab2',
 'actq1_lab2',
 'mean(qavt$_lab2)',
 'avgtime_lab2',
 'rt_lab2',
 'rt_lab3',
 'actq1_lab3',
 'ut_lab3',
 'mean(qact$_lab3)',
 'cer_lab3',
 'rt_lab4',
 'cer_lab4',
 'err_lab4',
 'actq1_lab4',
 'mean(qc$_lab4)']

In [None]:
dataset = datalab1[[TARGET] + selected_features_ann_1].join(datalab2[selected_features_ann_2]).join(datalab3[selected_features_ann_3]).join(datalab4[selected_features_ann_4])
run_process(dataset,rand_cv)

Fitting 5 folds for each of 10 candidates, totalling 50 fits
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test-fit: -5.927071087513601
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test -8.773417472839355
MSE-test 5.784366552244696
Best params: {'output_shape': 1, 'nn3': 30, 'nn2': 10, 'nn1': 50, 'nl3': 2, 'nl2': 1, 'nl1': 3, 'lr': 0.001, 'l2': 0, 'l1': 0.003, 'input_shape': 20, 'dropout': 0, 'decay': 0, 'act': 'relu'}


['actq3_lab1',
 'actq1_lab1',
 'mean(qmsr$_lab1)',
 'rtr_lab1',
 'cer_lab1',
 'actq3_lab2',
 'actq1_lab2',
 'mean(qavt$_lab2)',
 'avgtime_lab2',
 'rt_lab2',
 'rt_lab3',
 'actq1_lab3',
 'ut_lab3',
 'mean(qact$_lab3)',
 'cer_lab3',
 'rt_lab4',
 'cer_lab4',
 'err_lab4',
 'actq1_lab4',
 'mean(qc$_lab4)']

In [None]:
dataset = datalab1[[TARGET] + selected_features_ann_1].join(datalab2[selected_features_ann_2]).join(datalab3[selected_features_ann_3]).join(datalab4[selected_features_ann_4])
run_process(dataset,rand_cv)

Fitting 5 folds for each of 10 candidates, totalling 50 fits
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test-fit: -5.914990522504689
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test -6.515824317932129
MSE-test 6.435477203576395
Best params: {'output_shape': 1, 'nn3': 15, 'nn2': 40, 'nn1': 20, 'nl3': 1, 'nl2': 3, 'nl1': 0, 'lr': 0.0001, 'l2': 0.0001, 'l1': 0.0001, 'input_shape': 20, 'dropout': 0, 'decay': 0, 'act': 'relu'}


['actq3_lab1',
 'actq1_lab1',
 'mean(qmsr$_lab1)',
 'rtr_lab1',
 'cer_lab1',
 'actq3_lab2',
 'actq1_lab2',
 'mean(qavt$_lab2)',
 'avgtime_lab2',
 'rt_lab2',
 'rt_lab3',
 'actq1_lab3',
 'ut_lab3',
 'mean(qact$_lab3)',
 'cer_lab3',
 'rt_lab4',
 'cer_lab4',
 'err_lab4',
 'actq1_lab4',
 'mean(qc$_lab4)']

In [None]:
dataset = datalab1[[TARGET] + selected_features_ann_1].join(datalab2[selected_features_ann_2]).join(datalab3[selected_features_ann_3]).join(datalab4[selected_features_ann_4])
run_process(dataset,rand_cv)

Fitting 5 folds for each of 10 candidates, totalling 50 fits
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test-fit: -5.906700291775987
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test -8.382675170898438
MSE-test 5.484680984897574
Best params: {'output_shape': 1, 'nn3': 15, 'nn2': 40, 'nn1': 50, 'nl3': 1, 'nl2': 3, 'nl1': 1, 'lr': 0.001, 'l2': 0.001, 'l1': 0.003, 'input_shape': 20, 'dropout': 0.3, 'decay': 1e-09, 'act': 'relu'}


['actq3_lab1',
 'actq1_lab1',
 'mean(qmsr$_lab1)',
 'rtr_lab1',
 'cer_lab1',
 'actq3_lab2',
 'actq1_lab2',
 'mean(qavt$_lab2)',
 'avgtime_lab2',
 'rt_lab2',
 'rt_lab3',
 'actq1_lab3',
 'ut_lab3',
 'mean(qact$_lab3)',
 'cer_lab3',
 'rt_lab4',
 'cer_lab4',
 'err_lab4',
 'actq1_lab4',
 'mean(qc$_lab4)']

In [None]:
dataset = datalab1[[TARGET] + selected_features_ann_1].join(datalab2[selected_features_ann_2]).join(datalab3[selected_features_ann_3]).join(datalab4[selected_features_ann_4])
run_process(dataset,rand_cv)

Fitting 5 folds for each of 10 candidates, totalling 50 fits
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test-fit: -5.920223681986343
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
R2-test -8.550341606140137
MSE-test 6.233280008722865
Best params: {'output_shape': 1, 'nn3': 5, 'nn2': 70, 'nn1': 50, 'nl3': 0, 'nl2': 3, 'nl1': 1, 'lr': 0.001, 'l2': 0.01, 'l1': 0.0001, 'input_shape': 20, 'dropout': 0.2, 'decay': 0, 'act': 'relu'}


['actq3_lab1',
 'actq1_lab1',
 'mean(qmsr$_lab1)',
 'rtr_lab1',
 'cer_lab1',
 'actq3_lab2',
 'actq1_lab2',
 'mean(qavt$_lab2)',
 'avgtime_lab2',
 'rt_lab2',
 'rt_lab3',
 'actq1_lab3',
 'ut_lab3',
 'mean(qact$_lab3)',
 'cer_lab3',
 'rt_lab4',
 'cer_lab4',
 'err_lab4',
 'actq1_lab4',
 'mean(qc$_lab4)']