In [1]:
import numpy as np
import pandas as pd

from sklearn.impute import (SimpleImputer,KNNImputer)
from sklearn.ensemble import (RandomForestRegressor, IsolationForest)
from sklearn.neighbors import LocalOutlierFactor
from sklearn.model_selection import KFold
from sklearn.model_selection import train_test_split
from sklearn.neural_network import MLPRegressor
from sklearn.ensemble import ExtraTreesRegressor
import lightgbm as lgb

from sklearn.gaussian_process import GaussianProcessRegressor
from sklearn.gaussian_process.kernels import RBF, ConstantKernel as C, DotProduct, WhiteKernel, RationalQuadratic, Matern
from sklearn.metrics import r2_score

import matplotlib.pyplot as plt

%matplotlib inline

In [2]:
def fill_missing_values(X, n_neighbors = 75, method="KNN"): 
    
    # normalization
    X_std = np.nanstd(X,axis=0,keepdims=True)
    X_ave = np.nanmean(X,axis=0,keepdims=True)
    X_norma = (X-X_ave)/X_std
    
    # use KNNImputer
    imputer = KNNImputer(missing_values=np.nan, n_neighbors=n_neighbors, weights = 'distance') if method=="KNN"\
        else SimpleImputer(missing_values=np.nan, strategy='median')
    
    X_norma_fixed = imputer.fit_transform(X_norma)
    
    return X_norma_fixed

def remove_outliers(X, y):
    print("IsolationForest-Traing data shape before removed: {}".format(X.shape))
    Z = np.c_[X, y]
    iforest = IsolationForest(max_samples=200, random_state=1, contamination=0.005)
    iforest.fit(Z)
    iforest_outlier_pred = iforest.predict(Z)
    
    Z = np.c_[X, y]
    local = LocalOutlierFactor(n_neighbors=150, contamination=0.005)
    local.fit(Z)
    local_outlier_pred = local.fit_predict(Z)

    mask = np.logical_and((iforest_outlier_pred!=-1), (local_outlier_pred!=-1))
    X , y = X[mask, :], y[mask]
    print("IsolationForest-Traing data shape after removed: {}".format(X.shape))
    return X, y

def select_features(X, y, X_test, feature_num=50, n_estimators=80):
    rf = RandomForestRegressor(n_jobs=-1, n_estimators=80, random_state=1)
    rf.fit(X, y)
    indices = np.asarray(list(rf.feature_importances_)).argsort()[-feature_num:][::-1]
    
    X = np.take(X, indices, axis = 1)
    X_test = np.take(X_test, indices, axis = 1)
    return X, X_test

In [3]:
X_train_data = pd.read_csv('X_train.csv')
y_train_data = pd.read_csv('y_train.csv')
X_test_data = pd.read_csv('X_test.csv')

indices_test = np.array(X_test_data)[:,0]
X_test = np.array(X_test_data)[:,1:]
y_train = np.array(y_train_data)[:,1]
X_train = np.array(X_train_data)[:,1:]

In [4]:
X_train_missing_indices = X_train[X_train==np]
X_train = fill_missing_values(X_train, n_neighbors=75)
X_test_processed = fill_missing_values(X_test)
print(X_train.shape)
print(X_test_processed.shape)

  
  


(1212, 828)
(776, 828)


In [5]:

X_processed,y_processed = remove_outliers(X_train,y_train)

IsolationForest-Traing data shape before removed: (1212, 828)
IsolationForest-Traing data shape after removed: (1200, 828)


In [6]:
# pearsonr feature selection
from scipy.stats import pearsonr
from sklearn.decomposition import PCA

def pearsonr_feature_selection(X, y, X_test,degree,weights):
    feature_idx =  np.array([i for i in range(0,X.shape[1])])
    correlations = {}
#     print("feature_idx: ", feature_idx.T)
    for idx in feature_idx:
        correlation = 0
        for degree_idx in range(0,len(weights)):
            correlation += abs(weights[degree_idx]*pearsonr(X[:,idx],y**degree[degree_idx])[0])
        correlations[idx] = correlation
    data_correlations = pd.DataFrame(correlations, index=['correlation']).T
    indices_desc = data_correlations['correlation'].abs().sort_values(ascending=False).index
#     print(indices_desc)
    return data_correlations,indices_desc

def pearsonr_feature_selection_correlation(X, X_test,threshold):
    feature_idx =  np.array([i for i in range(0,X.shape[1])])
    correlation_select = np.array([True for i in range(0,X.shape[1])])
    for f_idx in feature_idx:
        if(correlation_select[f_idx]):
            feature_co,indices_desc = pearsonr_feature_selection(X[:,(f_idx+1):], X[:,f_idx], X_test_processed,np.array([1]),np.array([1]))
            reomove_features = feature_co.loc[indices_desc][abs(feature_co['correlation']) >= threshold]
            remove_index = reomove_features.index+(f_idx+1)
            correlation_select[remove_index] = False
    
    return X[:,correlation_select],X_test[:,correlation_select]

In [7]:
def LGB_feature_selection(X_processed,X_test_processed,y_processed):
    data_relation,indices_desc = pearsonr_feature_selection(X_processed, y_processed, X_test_processed,np.array([1,-3,3]),np.array([0.9,0.05,0.05]))
    selected_features = data_relation.loc[indices_desc][abs(data_relation['correlation']) >= 0.025]
    X_selection = X_processed[:,selected_features.index]
    X_test_selection = X_test_processed[:,selected_features.index]
    X_selection_tree, X_test_selection_tree = select_features(X_selection, y_processed, X_test_selection,feature_num = 105)
    X_selection_tree_cor, X_test_selection_tree_cor = pearsonr_feature_selection_correlation(X_selection_tree, X_test_selection_tree,0.93)
    return X_selection_tree_cor,X_test_selection_tree_cor

In [8]:
def GP_feature_selection(X_processed,X_test_processed,y_processed, tree_num = 43):
    data_relation,indices_desc = pearsonr_feature_selection(X_processed, y_processed, X_test_processed,np.array([1,-3,3]),np.array([0.95,0.025,0.025]))
    selected_features = data_relation.loc[indices_desc][abs(data_relation['correlation']) >= 0.001]
    X_selection = X_processed[:,selected_features.index]
    X_test_selection = X_test_processed[:,selected_features.index]
    X_selection_tree, X_test_selection_tree = select_features(X_selection, y_processed, X_test_selection,feature_num = tree_num)
    X_selection_tree_cor, X_test_selection_tree_cor = pearsonr_feature_selection_correlation(X_selection_tree, X_test_selection_tree,0.96)
    return X_selection_tree_cor,X_test_selection_tree_cor

In [11]:
def GP_rbf_feature_selection(X_processed,X_test_processed,y_processed,feature_num):
    data_relation,indices_desc = pearsonr_feature_selection(X_processed, y_processed, X_test_processed,np.array([1,-3,3]),np.array([0.95,0.025,0.025]))
    selected_features = data_relation.loc[indices_desc][abs(data_relation['correlation']) >= 0.001]
    X_selection = X_processed[:,selected_features.index]
    X_test_selection = X_test_processed[:,selected_features.index]
    X_selection_tree, X_test_selection_tree = select_features(X_selection, y_processed, X_test_selection,feature_num)
    X_selection_tree_cor, X_test_selection_tree_cor = pearsonr_feature_selection_correlation(X_selection_tree, X_test_selection_tree,0.96)
    return X_selection_tree_cor,X_test_selection_tree_cor

In [12]:

def Tree_feature_selection(X_processed,X_test_processed,y_processed):
    data_relation,indices_desc = pearsonr_feature_selection(X_processed, y_processed, X_test_processed,np.array([1,-3,3]),np.array([0.95,0.025,0.025]))
    selected_features = data_relation.loc[indices_desc][abs(data_relation['correlation']) >= 0.1]
    X_selection = X_processed[:,selected_features.index]
    X_test_selection = X_test_processed[:,selected_features.index]
    X_selection_tree, X_test_selection_tree = select_features(X_selection, y_processed, X_test_selection,feature_num = 50, n_estimators= 100)
    X_selection_tree_cor, X_test_selection_tree_cor = pearsonr_feature_selection_correlation(X_selection_tree, X_test_selection_tree,0.96)
    return X_selection_tree_cor,X_test_selection_tree_cor

In [13]:

X_lgb,X_test_lgb = LGB_feature_selection(X_processed,X_test_processed,y_processed)
print(X_lgb.shape)
print(X_test_lgb.shape)

  This is separate from the ipykernel package so we can avoid doing imports until


(1200, 98)
(776, 98)


In [14]:
X_gp_quad,X_test_gp_quad = GP_feature_selection(X_processed,X_test_processed,y_processed)
print(X_gp_quad.shape)
print(X_test_gp_quad.shape)

  This is separate from the ipykernel package so we can avoid doing imports until


(1200, 42)
(776, 42)




In [27]:
X_gp_rbf,X_test_gp_rbf = GP_rbf_feature_selection(X_processed,X_test_processed,y_processed,64)
print(X_gp_rbf.shape)

  This is separate from the ipykernel package so we can avoid doing imports until


(1200, 58)


In [74]:
from sklearn.gaussian_process import GaussianProcessRegressor
from sklearn.gaussian_process.kernels import RBF, ConstantKernel as C, DotProduct, WhiteKernel

def custom_r2(prediction, train_data):
    """Regular r2 cost function returned as a tuple to be used with lgb"""
    labels = train_data.get_label()
    return 'r2', r2_score(labels, prediction), True

def fit_model_and_pred(X_train, y_train, X_val, y_val, X_test):
#     kernel = RBF(0.5, (1e-4, 10))
#     gpr = GaussianProcessRegressor(kernel=kernel, random_state=0, n_restarts_optimizer=1, alpha=0.07, normalize_y=True)
#     gpr.fit(X_train, y_train)
#     score = gpr.score(X_val, y_val)   
#     y_pred = gpr.predict(X_test) 
    kernel = RationalQuadratic(length_scale=0.5, alpha=1.0, length_scale_bounds=(1e-4, 10))
    gpr = GaussianProcessRegressor(kernel=kernel, random_state=0, n_restarts_optimizer=1, alpha=1e-6, normalize_y=True)
    gpr.fit(X_train, y_train)
    score = gpr.score(X_val, y_val)
    y_val_pred = gpr.predict(X_val)   
    y_pred = gpr.predict(X_test)
    
    return score, y_pred

def fit_model_and_pred_gp2(X_train, y_train, X_val, y_val, X_test,length,u):
    # kernel = RBF(0.5, (1e-4, 10))
    kernel = Matern(length_scale = length,nu=u)
    gpr = GaussianProcessRegressor(kernel=kernel, random_state=0, n_restarts_optimizer=1, alpha=1e-4, normalize_y=True)
    gpr.fit(X_train, y_train)
    score = gpr.score(X_val, y_val)   
    y_pred = gpr.predict(X_test) 
    
    return score, y_pred

def fit_model_and_pred_tree(X_train, y_train, X_val, y_val, X_test, random_state=0):
    model = ExtraTreesRegressor(n_jobs=1, max_depth=None, n_estimators=190, random_state=random_state, min_samples_split=3, max_features=None)
    model.fit(X_train, y_train)
    
    y_val_pred = model.predict(X_val)
    score = r2_score(y_val, y_val_pred)
    
    y_pred = model.predict(X_test) 
    
    return score, y_pred

def fit_model_and_pred_lgb(X_train, y_train, X_val, y_val, X_test):
   
    params = {
        'task': 'train',
        'boosting_type': 'gbdt',
        'objective': 'regression',
        'num_leaves': 1800,
        'learning_rate': 0.025,
        'max_depth': 11,
        'n_estimators': 1000,
        'min_child_weight': 1,
        'subsample': 0.8,
        'colsample_bytree': 0.8,
        'feature_fraction': 0.5,
        'bagging_fraction': 0.8,
        'bagging_freq': 5,
        'verbose': -1,
        'num_iterations':1000,
    }  
    
    
    lgb_train = lgb.Dataset(X_train, y_train)
    lgb_eval = lgb.Dataset(X_val, y_val, reference=lgb_train)

    gbm = lgb.train(params,
                    lgb_train,
                    num_boost_round=500,
                    feval=custom_r2,
                    valid_sets={lgb_train, lgb_eval},
                    early_stopping_rounds=100,
                    verbose_eval=False
                   )
    
    y_val_pred = gbm.predict(X_val)
    score = r2_score(y_val, y_val_pred)
    y_pred = gbm.predict(X_test) 
    return score, y_pred

def train_k_fold_2GP_LGB(X_lgb,X_test_lgb,X_gp,X_test_gp,X_tree,X_test_tree, y , weight1 = 0.5, weight2 = 0.75, fold_num=10,l = 0.9,u = 2.0):
# weight1 is the ratio of gp_rbf to lgb, weight2 is the combine of previous to gp.quadric
    kf = KFold(n_splits=fold_num, shuffle=True)
    kf.get_n_splits(X_lgb)
    test_score = 0.0
    train_score = 0.0
    y_test_pred = np.zeros((X_test_lgb.shape[0]))
#     print("shape of y_test_pred:", y_test_pred.shape)
    i = 0
    for train_index, test_index in kf.split(X_lgb):
        X_lgb_train, X_lgb_val = X_lgb[train_index], X_lgb[test_index]
        X_gp_train, X_gp_val = X_gp[train_index], X_gp[test_index]
        X_tree_train, X_tree_val = X_tree[train_index], X_tree[test_index]
        y_train, y_val = y[train_index], y[test_index]
        
        _, y_pred1 = fit_model_and_pred(X_gp_train, y_train, X_gp_val, y_val, X_gp_val)
        _, y_pred2 = fit_model_and_pred_lgb(X_lgb_train, y_train, X_lgb_val, y_val, X_lgb_val)
        _, y_pred3 = fit_model_and_pred_gp2(X_tree_train, y_train, X_tree_val, y_val, X_tree_val,l,u)
#         _, y_pred4 = fit_model_and_pred_tree(X_tree_train, y_train, X_tree_val, y_val, X_tree_val)
        y_pred = weight2*(weight1*y_pred3+(1-weight1)*y_pred2) + (1-weight2)*y_pred1

        _, y_test_pred1 = fit_model_and_pred(X_gp_train, y_train, X_gp_val, y_val, X_test_gp)
        _, y_test_pred2 = fit_model_and_pred_lgb(X_lgb_train, y_train, X_lgb_val, y_val, X_test_lgb)
        _, y_test_pred3 = fit_model_and_pred_gp2(X_tree_train, y_train, X_tree_val, y_val, X_test_tree,l,u)
#         _, y_test_pred4 = fit_model_and_pred_tree(X_tree_train, y_train, X_tree_val, y_val, X_test_tree)
        y_test_pred += weight2*(weight1*y_test_pred3+(1-weight1)*y_test_pred2) + (1-weight2)*y_test_pred1
        
        score = r2_score(y_val, y_pred)
        print(i+1, 'th . the obtained validation r2 score is : ',score)
        test_score += score
        i += 1

    return test_score/fold_num,y_test_pred/fold_num

def train_k_fold_predict(X, y, X_test, fold_num=10):
    kf = KFold(n_splits=fold_num)
    kf.get_n_splits(X)
    y_test_predict = np.zeros(X_test.shape[0])
    cnt = 0
    val_score = 0.0
    train_score = 0.0
    for train_index, test_index in kf.split(X):
        X_train, X_val = X[train_index], X[test_index]
        y_train, y_val = y[train_index], y[test_index]

        score, y_pred = fit_model_and_pred(X_train, y_train, X_val, y_val, X_test) 
        val_score += score
        y_test_predict += y_pred
        
        score, _ = fit_model_and_pred(X_train, y_train, X_train, y_train, X_test)
        train_score += score
    return train_score/fold_num, val_score/fold_num, y_test_predict/fold_num

In [55]:

score,prediction = train_k_fold_2GP_LGB(X_lgb,X_test_lgb,X_gp_quad,X_test_gp_quad,X_gp_rbf,X_test_gp_rbf, y_processed , weight1 = 0.578, weight2 = 0.65, fold_num=10,l = 0.75)







1 th . the obtained validation r2 score is :  0.800072992914019








2 th . the obtained validation r2 score is :  0.8070553755541002








3 th . the obtained validation r2 score is :  0.6284994619188715








4 th . the obtained validation r2 score is :  0.7443734183151861








5 th . the obtained validation r2 score is :  0.6776789130038956








6 th . the obtained validation r2 score is :  0.6936794281141399








7 th . the obtained validation r2 score is :  0.6071908575977656








8 th . the obtained validation r2 score is :  0.6539246858622471








9 th . the obtained validation r2 score is :  0.7604872254571488








10 th . the obtained validation r2 score is :  0.6319385336135754


In [56]:
score

0.7004900892350949

In [57]:
prediction

array([67.65319431, 70.01509607, 69.51539781, 70.9811512 , 70.65939111,
       75.53765846, 62.12317666, 60.48444525, 81.04395841, 78.69547651,
       58.72525806, 82.08690913, 71.06894405, 81.51937457, 55.05182346,
       82.0105325 , 70.15466011, 74.61068456, 71.45108654, 69.68515745,
       69.87226425, 65.37889147, 79.79506309, 75.35995375, 61.13514404,
       70.80308044, 55.22519037, 71.72866974, 64.89418503, 73.2879932 ,
       64.19202888, 70.47095104, 57.61501228, 70.46181706, 66.99879078,
       65.17636383, 76.23560815, 56.3154662 , 71.71253169, 69.31845484,
       71.18793549, 74.42565416, 71.62874018, 80.21398862, 73.25547274,
       67.20032589, 69.22230878, 72.78131458, 77.05102053, 70.40157776,
       76.67071353, 66.10462617, 61.15916392, 81.98171761, 77.36012093,
       73.69284787, 63.54207814, 71.56020489, 72.93160486, 60.97846784,
       64.90057113, 74.20053444, 63.79494774, 72.11756236, 72.96248559,
       57.48949682, 69.76591954, 79.0710904 , 63.32922555, 74.64

In [59]:
final_res = np.vstack((indices_test, prediction)).T
df_res = pd.DataFrame(final_res)
df_res.to_csv("our_result_0.7005.csv", header = ["id", "y"], index=False)

In [19]:
feature_trial = [48+2*i for i in range(0,10)]
y_pred_trial = np.zeros((X_test_gp_rbf.shape[0],len(feature_trial)))
score_trial = np.zeros(len(feature_trial))

for i in range(0,len(feature_trial)):
    X_gp_rbf,X_test_gp_rbf = GP_rbf_feature_selection(X_processed,X_test_processed,y_processed,feature_trial[i])
    score_trial[i],y_pred_trial[:,i] = train_k_fold_2GP_LGB(X_lgb,X_test_lgb,X_gp_quad,X_test_gp_quad,X_gp_rbf,X_test_gp_rbf, y_processed , weight1 = 0.578, weight2 = 0.68, fold_num=10)

  This is separate from the ipykernel package so we can avoid doing imports until






1 th . the obtained validation r2 score is :  0.7895256732139873








2 th . the obtained validation r2 score is :  0.8022019300926344








3 th . the obtained validation r2 score is :  0.6200933623680842








4 th . the obtained validation r2 score is :  0.75707989775554








5 th . the obtained validation r2 score is :  0.6750947023669784








6 th . the obtained validation r2 score is :  0.6867342328564862








7 th . the obtained validation r2 score is :  0.6138977132228037








8 th . the obtained validation r2 score is :  0.6526652594299583








9 th . the obtained validation r2 score is :  0.7582602203439389








10 th . the obtained validation r2 score is :  0.6258674546574765


  This is separate from the ipykernel package so we can avoid doing imports until






1 th . the obtained validation r2 score is :  0.7896087525548613








2 th . the obtained validation r2 score is :  0.8018125347296037








3 th . the obtained validation r2 score is :  0.6233080863386606








4 th . the obtained validation r2 score is :  0.7520045678395852








5 th . the obtained validation r2 score is :  0.6779023078410753








6 th . the obtained validation r2 score is :  0.6889122402902987








7 th . the obtained validation r2 score is :  0.6110816811533135








8 th . the obtained validation r2 score is :  0.6512601265544675








9 th . the obtained validation r2 score is :  0.7604636266737196








10 th . the obtained validation r2 score is :  0.6258008072915808


  This is separate from the ipykernel package so we can avoid doing imports until






1 th . the obtained validation r2 score is :  0.7906719180685275








2 th . the obtained validation r2 score is :  0.8006701191795749








3 th . the obtained validation r2 score is :  0.6246024123807092








4 th . the obtained validation r2 score is :  0.7509641365939506








5 th . the obtained validation r2 score is :  0.6757838704234133








6 th . the obtained validation r2 score is :  0.6894891504512846








7 th . the obtained validation r2 score is :  0.6098496209440496








8 th . the obtained validation r2 score is :  0.6512793238648104








9 th . the obtained validation r2 score is :  0.7604928492585691








10 th . the obtained validation r2 score is :  0.6251630759447074


  This is separate from the ipykernel package so we can avoid doing imports until






1 th . the obtained validation r2 score is :  0.7907270218262924








2 th . the obtained validation r2 score is :  0.8033402763350287








3 th . the obtained validation r2 score is :  0.6265472016489267








4 th . the obtained validation r2 score is :  0.7478400594550585








5 th . the obtained validation r2 score is :  0.6775664731443021








6 th . the obtained validation r2 score is :  0.6913990116746457








7 th . the obtained validation r2 score is :  0.6113854913474869








8 th . the obtained validation r2 score is :  0.6515266146139517








9 th . the obtained validation r2 score is :  0.7632023798026937








10 th . the obtained validation r2 score is :  0.6226237572091387


  This is separate from the ipykernel package so we can avoid doing imports until






1 th . the obtained validation r2 score is :  0.7918345104806969








2 th . the obtained validation r2 score is :  0.8021745991240882








3 th . the obtained validation r2 score is :  0.6271360483696846








4 th . the obtained validation r2 score is :  0.7450944620397627








5 th . the obtained validation r2 score is :  0.6777573838127784








6 th . the obtained validation r2 score is :  0.6897264269259225








7 th . the obtained validation r2 score is :  0.6091202515902441








8 th . the obtained validation r2 score is :  0.6552565358331481








9 th . the obtained validation r2 score is :  0.7626657033466647








10 th . the obtained validation r2 score is :  0.6220078613161442


  This is separate from the ipykernel package so we can avoid doing imports until






1 th . the obtained validation r2 score is :  0.7974113489744766








2 th . the obtained validation r2 score is :  0.8045450206912679








3 th . the obtained validation r2 score is :  0.6326857361375255








4 th . the obtained validation r2 score is :  0.7466481186558473








5 th . the obtained validation r2 score is :  0.6736834366820519








6 th . the obtained validation r2 score is :  0.6922131085521089








7 th . the obtained validation r2 score is :  0.6076237930970968








8 th . the obtained validation r2 score is :  0.6526385020487846








9 th . the obtained validation r2 score is :  0.7634494003439068








10 th . the obtained validation r2 score is :  0.6233751875027078


  This is separate from the ipykernel package so we can avoid doing imports until






1 th . the obtained validation r2 score is :  0.7994379621535113








2 th . the obtained validation r2 score is :  0.805400650196155








3 th . the obtained validation r2 score is :  0.6277214853123136








4 th . the obtained validation r2 score is :  0.7464994889455785








5 th . the obtained validation r2 score is :  0.6749616336671005








6 th . the obtained validation r2 score is :  0.6950204456189597








7 th . the obtained validation r2 score is :  0.603907601293079








8 th . the obtained validation r2 score is :  0.6499355210601943








9 th . the obtained validation r2 score is :  0.7637655700065056








10 th . the obtained validation r2 score is :  0.6240359812126235


  This is separate from the ipykernel package so we can avoid doing imports until






1 th . the obtained validation r2 score is :  0.797614434328084








2 th . the obtained validation r2 score is :  0.8052620930684368








3 th . the obtained validation r2 score is :  0.6317403884808493








4 th . the obtained validation r2 score is :  0.7433993139477623








5 th . the obtained validation r2 score is :  0.6765974880593199








6 th . the obtained validation r2 score is :  0.6949808410880114








7 th . the obtained validation r2 score is :  0.6018250363288677








8 th . the obtained validation r2 score is :  0.6508028594767461








9 th . the obtained validation r2 score is :  0.762849280093146








10 th . the obtained validation r2 score is :  0.6260878843182036


  This is separate from the ipykernel package so we can avoid doing imports until






1 th . the obtained validation r2 score is :  0.7993123444958584








2 th . the obtained validation r2 score is :  0.8071335360029194








3 th . the obtained validation r2 score is :  0.6326797769972596








4 th . the obtained validation r2 score is :  0.7432428862891243








5 th . the obtained validation r2 score is :  0.6767290809800501








6 th . the obtained validation r2 score is :  0.6948633918388529








7 th . the obtained validation r2 score is :  0.6052317981183211








8 th . the obtained validation r2 score is :  0.6524831205648354








9 th . the obtained validation r2 score is :  0.7604584044857199








10 th . the obtained validation r2 score is :  0.6303257579563437


  This is separate from the ipykernel package so we can avoid doing imports until






1 th . the obtained validation r2 score is :  0.7984161719141813








2 th . the obtained validation r2 score is :  0.8093414621757706








3 th . the obtained validation r2 score is :  0.6285381371937375








4 th . the obtained validation r2 score is :  0.7432773930956126








5 th . the obtained validation r2 score is :  0.6803767815889823








6 th . the obtained validation r2 score is :  0.696713954920098








7 th . the obtained validation r2 score is :  0.6060111294328351








8 th . the obtained validation r2 score is :  0.6529388219792274








9 th . the obtained validation r2 score is :  0.758751576731316








10 th . the obtained validation r2 score is :  0.6262727202749909


In [25]:
score_trial[8]

0.7002460097729285

In [26]:
final_res = np.vstack((indices_test, y_pred_trial[:,8])).T
df_res = pd.DataFrame(final_res)
df_res.to_csv("our_result_0.7002.csv", header = ["id", "y"], index=False)

In [21]:
feature_trial

[48, 50, 52, 54, 56, 58, 60, 62, 64, 66]

In [23]:
feature_trial2 = [65,67,68]
y_pred_trial2 = np.zeros((X_test_gp_rbf.shape[0],len(feature_trial)))
score_trial2 = np.zeros(len(feature_trial))

for i in range(0,len(feature_trial)):
    X_gp_rbf,X_test_gp_rbf = GP_rbf_feature_selection(X_processed,X_test_processed,y_processed,feature_trial2[i])
    score_trial2[i],y_pred_trial2[:,i] = train_k_fold_2GP_LGB(X_lgb,X_test_lgb,X_gp_quad,X_test_gp_quad,X_gp_rbf,X_test_gp_rbf, y_processed , weight1 = 0.578, weight2 = 0.68, fold_num=10)

  This is separate from the ipykernel package so we can avoid doing imports until


1 th . the obtained validation r2 score is :  0.799946697378753








2 th . the obtained validation r2 score is :  0.8072200262840967








3 th . the obtained validation r2 score is :  0.6303004506424399








4 th . the obtained validation r2 score is :  0.7421803583541908








5 th . the obtained validation r2 score is :  0.6783329535128333








6 th . the obtained validation r2 score is :  0.6960218943610725








7 th . the obtained validation r2 score is :  0.6052494825548528








8 th . the obtained validation r2 score is :  0.6507515309790195








9 th . the obtained validation r2 score is :  0.758335342118937








10 th . the obtained validation r2 score is :  0.6268755984235084


  This is separate from the ipykernel package so we can avoid doing imports until






1 th . the obtained validation r2 score is :  0.7969589947878654








2 th . the obtained validation r2 score is :  0.8073327990209246








3 th . the obtained validation r2 score is :  0.6290250914455021








4 th . the obtained validation r2 score is :  0.7437209504218778








5 th . the obtained validation r2 score is :  0.6791968897494822








6 th . the obtained validation r2 score is :  0.696176138679913








7 th . the obtained validation r2 score is :  0.6065235294698601








8 th . the obtained validation r2 score is :  0.6532824864598377








9 th . the obtained validation r2 score is :  0.7596104312520406








10 th . the obtained validation r2 score is :  0.6270185334776264


  This is separate from the ipykernel package so we can avoid doing imports until






1 th . the obtained validation r2 score is :  0.7963842234247603








2 th . the obtained validation r2 score is :  0.806979497169214








3 th . the obtained validation r2 score is :  0.6287633600285334








4 th . the obtained validation r2 score is :  0.7426268750509347








5 th . the obtained validation r2 score is :  0.678686685653779








6 th . the obtained validation r2 score is :  0.6965768116595245








7 th . the obtained validation r2 score is :  0.607794501200583








8 th . the obtained validation r2 score is :  0.6531043056535387








9 th . the obtained validation r2 score is :  0.7591999795077394








10 th . the obtained validation r2 score is :  0.6261356284555128


IndexError: list index out of range

In [24]:
score_trial2

array([0.69952143, 0.69988458, 0.69962519, 0.        , 0.        ,
       0.        , 0.        , 0.        , 0.        , 0.        ])

In [35]:
weight_trial = [0.63,0.65]
y_pred_trial3 = np.zeros((X_test_lgb.shape[0],len(weight_trial)))
score_trial3 = np.zeros(len(weight_trial))

for i in range(0,len(weight_trial)):
    score_trial3[i],y_pred_trial3[:,i] = train_k_fold_2GP_LGB(X_lgb,X_test_lgb,X_gp_quad,X_test_gp_quad,X_gp_rbf,X_test_gp_rbf, y_processed , weight1 = 0.578, weight2 = weight_trial[i], fold_num=10)







1 th . the obtained validation r2 score is :  0.7993367968067429








2 th . the obtained validation r2 score is :  0.8064344315917776








3 th . the obtained validation r2 score is :  0.630322131841616








4 th . the obtained validation r2 score is :  0.745122505316859








5 th . the obtained validation r2 score is :  0.6772955493974762








6 th . the obtained validation r2 score is :  0.6943690887548992








7 th . the obtained validation r2 score is :  0.6065896446430481








8 th . the obtained validation r2 score is :  0.6536185363777935








9 th . the obtained validation r2 score is :  0.7604790369188428








10 th . the obtained validation r2 score is :  0.6295094555345687








1 th . the obtained validation r2 score is :  0.7993439630739683








2 th . the obtained validation r2 score is :  0.8067333642953023








3 th . the obtained validation r2 score is :  0.6312833270593954








4 th . the obtained validation r2 score is :  0.7443882487450628








5 th . the obtained validation r2 score is :  0.6770900370059957








6 th . the obtained validation r2 score is :  0.694579439736243








7 th . the obtained validation r2 score is :  0.6060680302702346








8 th . the obtained validation r2 score is :  0.6531868250852089








9 th . the obtained validation r2 score is :  0.760486150181964








10 th . the obtained validation r2 score is :  0.629853173750996


In [33]:
score_trial3

array([0.69863581, 0.6990361 , 0.69938173, 0.69967269, 0.69990898,
       0.70009061, 0.70021758, 0.70028988, 0.70030752, 0.7002705 ,
       0.70017881, 0.70003246, 0.69983144, 0.69957576, 0.69926541])

In [34]:
weight_trial

[0.4,
 0.43000000000000005,
 0.46,
 0.49,
 0.52,
 0.55,
 0.5800000000000001,
 0.61,
 0.64,
 0.67,
 0.7,
 0.73,
 0.76,
 0.79,
 0.8200000000000001]

In [36]:
score_trial3

array([0.70030772, 0.70030126])

In [64]:
u_trial = [1.7+0.05*i for i in range(0,25)]
y_pred_trial_u = np.zeros((X_test_processed.shape[0],len(u_trial)))
score_trial_u = np.zeros(len(u_trial))

for i in range(0,len(u_trial)):
    score_trial_u[i],y_pred_trial_u[:,i] = score,prediction = train_k_fold_2GP_LGB(X_lgb,X_test_lgb,X_gp_quad,X_test_gp_quad,X_gp_rbf,X_test_gp_rbf, y_processed , weight1 = 0.578, weight2 = 0.64, fold_num=10,l = 0.75, u = u_trial[i])







1 th . the obtained validation r2 score is :  0.7997054250849926








2 th . the obtained validation r2 score is :  0.8067794436749146








3 th . the obtained validation r2 score is :  0.6296157511893967








4 th . the obtained validation r2 score is :  0.7448232613487062








5 th . the obtained validation r2 score is :  0.6775284840996086








6 th . the obtained validation r2 score is :  0.6941138355479036








7 th . the obtained validation r2 score is :  0.6068395335371197








8 th . the obtained validation r2 score is :  0.6537931621035058








9 th . the obtained validation r2 score is :  0.7605146278659938








10 th . the obtained validation r2 score is :  0.6306912291670028








1 th . the obtained validation r2 score is :  0.799777222264287








2 th . the obtained validation r2 score is :  0.8068112424166369








3 th . the obtained validation r2 score is :  0.6293379524668976








4 th . the obtained validation r2 score is :  0.7448213774022643








5 th . the obtained validation r2 score is :  0.6775869779732412








6 th . the obtained validation r2 score is :  0.6940242277312433








7 th . the obtained validation r2 score is :  0.6069508781675096








8 th . the obtained validation r2 score is :  0.6538659804287221








9 th . the obtained validation r2 score is :  0.7605145599275327








10 th . the obtained validation r2 score is :  0.6308981432671407








1 th . the obtained validation r2 score is :  0.7998430370541418








2 th . the obtained validation r2 score is :  0.806837885702475






ABNORMAL_TERMINATION_IN_LNSRCH.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
  _check_optimize_result("lbfgs", opt_res)




ABNORMAL_TERMINATION_IN_LNSRCH.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
  _check_optimize_result("lbfgs", opt_res)


3 th . the obtained validation r2 score is :  0.6290679518302807








4 th . the obtained validation r2 score is :  0.7448138640743699








5 th . the obtained validation r2 score is :  0.6776376278940983








6 th . the obtained validation r2 score is :  0.6939353394034702






ABNORMAL_TERMINATION_IN_LNSRCH.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
  _check_optimize_result("lbfgs", opt_res)




ABNORMAL_TERMINATION_IN_LNSRCH.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
  _check_optimize_result("lbfgs", opt_res)


7 th . the obtained validation r2 score is :  0.6070569041294998








8 th . the obtained validation r2 score is :  0.6539312042877732








9 th . the obtained validation r2 score is :  0.7605121894708652








10 th . the obtained validation r2 score is :  0.6310901635174125








1 th . the obtained validation r2 score is :  0.7999034809100537








2 th . the obtained validation r2 score is :  0.8068599370587535








3 th . the obtained validation r2 score is :  0.6288056374605082








4 th . the obtained validation r2 score is :  0.7448013719655071








5 th . the obtained validation r2 score is :  0.6776812044404065








6 th . the obtained validation r2 score is :  0.6938472694536211








7 th . the obtained validation r2 score is :  0.6071579608656961








8 th . the obtained validation r2 score is :  0.6539895146497378








9 th . the obtained validation r2 score is :  0.7605077506638875








10 th . the obtained validation r2 score is :  0.6312685198461783








1 th . the obtained validation r2 score is :  0.7999590583556713








2 th . the obtained validation r2 score is :  0.8068778686994944








3 th . the obtained validation r2 score is :  0.6285508674714237








4 th . the obtained validation r2 score is :  0.7447844250094207








5 th . the obtained validation r2 score is :  0.6777184342218288








6 th . the obtained validation r2 score is :  0.6937601146913441








7 th . the obtained validation r2 score is :  0.6072543674815127








8 th . the obtained validation r2 score is :  0.6540415521561593








9 th . the obtained validation r2 score is :  0.7605014934856144








10 th . the obtained validation r2 score is :  0.6314343227715649








1 th . the obtained validation r2 score is :  0.800010260033188








2 th . the obtained validation r2 score is :  0.8068920934991346








3 th . the obtained validation r2 score is :  0.6283035025595183








4 th . the obtained validation r2 score is :  0.7447635966994688








5 th . the obtained validation r2 score is :  0.6777499369705522








6 th . the obtained validation r2 score is :  0.6936739421012063








7 th . the obtained validation r2 score is :  0.6073464174892057








8 th . the obtained validation r2 score is :  0.6540880010127078








9 th . the obtained validation r2 score is :  0.7604935834521729








10 th . the obtained validation r2 score is :  0.6315886307759929








1 th . the obtained validation r2 score is :  0.8000574862205766








2 th . the obtained validation r2 score is :  0.8069030488733316








3 th . the obtained validation r2 score is :  0.6280633221701513








4 th . the obtained validation r2 score is :  0.7447392999258478








5 th . the obtained validation r2 score is :  0.6777762692954352








6 th . the obtained validation r2 score is :  0.6935888104476595








7 th . the obtained validation r2 score is :  0.6074343747709176








8 th . the obtained validation r2 score is :  0.6541293577144891








9 th . the obtained validation r2 score is :  0.7604841592836474








10 th . the obtained validation r2 score is :  0.6317323240971133








1 th . the obtained validation r2 score is :  0.8001011383740222








2 th . the obtained validation r2 score is :  0.8069110253060133








3 th . the obtained validation r2 score is :  0.6278301903683869








4 th . the obtained validation r2 score is :  0.7447119574957634








5 th . the obtained validation r2 score is :  0.677797921509278








6 th . the obtained validation r2 score is :  0.693504764814074








7 th . the obtained validation r2 score is :  0.6075184821240462








8 th . the obtained validation r2 score is :  0.6541660968719243








9 th . the obtained validation r2 score is :  0.7604734493256831








10 th . the obtained validation r2 score is :  0.6318662705613516








1 th . the obtained validation r2 score is :  0.8001415179700551








2 th . the obtained validation r2 score is :  0.8069163404912433








3 th . the obtained validation r2 score is :  0.6276038368033217








4 th . the obtained validation r2 score is :  0.7446819213611517








5 th . the obtained validation r2 score is :  0.6778154261400277








6 th . the obtained validation r2 score is :  0.6934218446610693






ABNORMAL_TERMINATION_IN_LNSRCH.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
  _check_optimize_result("lbfgs", opt_res)




ABNORMAL_TERMINATION_IN_LNSRCH.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
  _check_optimize_result("lbfgs", opt_res)


7 th . the obtained validation r2 score is :  0.6075989622365847








8 th . the obtained validation r2 score is :  0.6541986497796028








9 th . the obtained validation r2 score is :  0.7604615947726375








10 th . the obtained validation r2 score is :  0.6319912590564252








1 th . the obtained validation r2 score is :  0.8001789554433025








2 th . the obtained validation r2 score is :  0.8069193120150633








3 th . the obtained validation r2 score is :  0.6273841496820571








4 th . the obtained validation r2 score is :  0.7446495024607105








5 th . the obtained validation r2 score is :  0.6778291639181594








6 th . the obtained validation r2 score is :  0.6933400666310539








7 th . the obtained validation r2 score is :  0.607676019086785








8 th . the obtained validation r2 score is :  0.6542274540510641








9 th . the obtained validation r2 score is :  0.760448676103576








10 th . the obtained validation r2 score is :  0.6321078718305226








1 th . the obtained validation r2 score is :  0.8002136870943738








2 th . the obtained validation r2 score is :  0.8069201049859742








3 th . the obtained validation r2 score is :  0.6271708489590391








4 th . the obtained validation r2 score is :  0.7446149831076332








5 th . the obtained validation r2 score is :  0.6778393736376737








6 th . the obtained validation r2 score is :  0.6932594605494111








7 th . the obtained validation r2 score is :  0.6077498423244043








8 th . the obtained validation r2 score is :  0.6542527905882991








9 th . the obtained validation r2 score is :  0.760434815087965








10 th . the obtained validation r2 score is :  0.632216828531456








1 th . the obtained validation r2 score is :  0.8002459888418407








2 th . the obtained validation r2 score is :  0.8069190571134834








3 th . the obtained validation r2 score is :  0.6269637612646867








4 th . the obtained validation r2 score is :  0.7445786370402576








5 th . the obtained validation r2 score is :  0.6778465487305747






ABNORMAL_TERMINATION_IN_LNSRCH.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
  _check_optimize_result("lbfgs", opt_res)




ABNORMAL_TERMINATION_IN_LNSRCH.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
  _check_optimize_result("lbfgs", opt_res)


6 th . the obtained validation r2 score is :  0.6931800396726516








7 th . the obtained validation r2 score is :  0.6078206106790631








8 th . the obtained validation r2 score is :  0.654275067386378








9 th . the obtained validation r2 score is :  0.7604201464438534








10 th . the obtained validation r2 score is :  0.6323187181131942








1 th . the obtained validation r2 score is :  0.8002760103667228








2 th . the obtained validation r2 score is :  0.8069162447767197








3 th . the obtained validation r2 score is :  0.6267626892925691








4 th . the obtained validation r2 score is :  0.7445406859852378








5 th . the obtained validation r2 score is :  0.6778509319775401








6 th . the obtained validation r2 score is :  0.6931018042148869








7 th . the obtained validation r2 score is :  0.607888477901563








8 th . the obtained validation r2 score is :  0.6542944711961051








9 th . the obtained validation r2 score is :  0.7604047560091399








10 th . the obtained validation r2 score is :  0.6324140113790582








1 th . the obtained validation r2 score is :  0.8003039557428353








2 th . the obtained validation r2 score is :  0.8069119141329726








3 th . the obtained validation r2 score is :  0.6265674141043767








4 th . the obtained validation r2 score is :  0.7445013200446398








5 th . the obtained validation r2 score is :  0.6778527605126141








6 th . the obtained validation r2 score is :  0.6930247689994746








7 th . the obtained validation r2 score is :  0.6079535999881832








8 th . the obtained validation r2 score is :  0.654311341046321








9 th . the obtained validation r2 score is :  0.7603887014046625








10 th . the obtained validation r2 score is :  0.6325032105836335








1 th . the obtained validation r2 score is :  0.8003300731589738








2 th . the obtained validation r2 score is :  0.8069061996449111








3 th . the obtained validation r2 score is :  0.6263777464590389








4 th . the obtained validation r2 score is :  0.7444607610724612








5 th . the obtained validation r2 score is :  0.6778523492797319








6 th . the obtained validation r2 score is :  0.6929489208847767








7 th . the obtained validation r2 score is :  0.608016114493499








8 th . the obtained validation r2 score is :  0.6543258248156582








9 th . the obtained validation r2 score is :  0.7603720527930469








10 th . the obtained validation r2 score is :  0.6325867796485507








1 th . the obtained validation r2 score is :  0.8003544538224018








2 th . the obtained validation r2 score is :  0.8068992608034574








3 th . the obtained validation r2 score is :  0.6261934945948077








4 th . the obtained validation r2 score is :  0.7444191342927671








5 th . the obtained validation r2 score is :  0.6778498127044555








6 th . the obtained validation r2 score is :  0.6928742734991822








7 th . the obtained validation r2 score is :  0.6080761530026579








8 th . the obtained validation r2 score is :  0.6543381919557468






ABNORMAL_TERMINATION_IN_LNSRCH.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
  _check_optimize_result("lbfgs", opt_res)




ABNORMAL_TERMINATION_IN_LNSRCH.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
  _check_optimize_result("lbfgs", opt_res)


9 th . the obtained validation r2 score is :  0.7603548917572928








10 th . the obtained validation r2 score is :  0.6326651022139864








1 th . the obtained validation r2 score is :  0.8003772346610782








2 th . the obtained validation r2 score is :  0.8068912241050359








3 th . the obtained validation r2 score is :  0.6260144631785529








4 th . the obtained validation r2 score is :  0.7443766179893043








5 th . the obtained validation r2 score is :  0.6778454269334584








6 th . the obtained validation r2 score is :  0.6928008048042675








7 th . the obtained validation r2 score is :  0.608133839845173








8 th . the obtained validation r2 score is :  0.6543486268064024








9 th . the obtained validation r2 score is :  0.7603373053624749








10 th . the obtained validation r2 score is :  0.6327385160929484








1 th . the obtained validation r2 score is :  0.80039857045288








2 th . the obtained validation r2 score is :  0.8068822190816355








3 th . the obtained validation r2 score is :  0.6258404733196666








4 th . the obtained validation r2 score is :  0.7443333277674804








5 th . the obtained validation r2 score is :  0.6778393909890048








6 th . the obtained validation r2 score is :  0.6927285166542961






ABNORMAL_TERMINATION_IN_LNSRCH.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
  _check_optimize_result("lbfgs", opt_res)




ABNORMAL_TERMINATION_IN_LNSRCH.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
  _check_optimize_result("lbfgs", opt_res)


7 th . the obtained validation r2 score is :  0.6081892834830228








8 th . the obtained validation r2 score is :  0.6543572965718454








9 th . the obtained validation r2 score is :  0.7603193036807377








10 th . the obtained validation r2 score is :  0.632807412210924








1 th . the obtained validation r2 score is :  0.800418555601197








2 th . the obtained validation r2 score is :  0.8068723236034547








3 th . the obtained validation r2 score is :  0.6256713299354497








4 th . the obtained validation r2 score is :  0.744289390051257








5 th . the obtained validation r2 score is :  0.677831744699763








6 th . the obtained validation r2 score is :  0.6926573834653771








7 th . the obtained validation r2 score is :  0.6082425959913393








8 th . the obtained validation r2 score is :  0.6543643449154868








9 th . the obtained validation r2 score is :  0.7603009581665608








10 th . the obtained validation r2 score is :  0.6328720669291753








1 th . the obtained validation r2 score is :  0.8004372981016012








2 th . the obtained validation r2 score is :  0.8068616532136448








3 th . the obtained validation r2 score is :  0.6255068782689683








4 th . the obtained validation r2 score is :  0.744244904328366






ABNORMAL_TERMINATION_IN_LNSRCH.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
  _check_optimize_result("lbfgs", opt_res)




ABNORMAL_TERMINATION_IN_LNSRCH.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
  _check_optimize_result("lbfgs", opt_res)


5 th . the obtained validation r2 score is :  0.6778227660391469








6 th . the obtained validation r2 score is :  0.6925874107288776








7 th . the obtained validation r2 score is :  0.6082938753707519








8 th . the obtained validation r2 score is :  0.6543699612491016








9 th . the obtained validation r2 score is :  0.7602823463776591








10 th . the obtained validation r2 score is :  0.6329327916841347








1 th . the obtained validation r2 score is :  0.8004549096486422








2 th . the obtained validation r2 score is :  0.80685026458899








3 th . the obtained validation r2 score is :  0.6253469339410354








4 th . the obtained validation r2 score is :  0.7442000055679232








5 th . the obtained validation r2 score is :  0.6778125790403859








6 th . the obtained validation r2 score is :  0.6925185722202465








7 th . the obtained validation r2 score is :  0.6083432144324479








8 th . the obtained validation r2 score is :  0.6543742210100709








9 th . the obtained validation r2 score is :  0.7602634281310691








10 th . the obtained validation r2 score is :  0.6329898473554467








1 th . the obtained validation r2 score is :  0.8004714677610927








2 th . the obtained validation r2 score is :  0.806838296864772








3 th . the obtained validation r2 score is :  0.6251913537366904








4 th . the obtained validation r2 score is :  0.7441547255029419








5 th . the obtained validation r2 score is :  0.6778012773721491








6 th . the obtained validation r2 score is :  0.6924508610140876








7 th . the obtained validation r2 score is :  0.6083907058238667








8 th . the obtained validation r2 score is :  0.6543772598220402








9 th . the obtained validation r2 score is :  0.7602443215928699








10 th . the obtained validation r2 score is :  0.6330434759463796








1 th . the obtained validation r2 score is :  0.8004870329358305








2 th . the obtained validation r2 score is :  0.8068257267011401








3 th . the obtained validation r2 score is :  0.6250399821606731








4 th . the obtained validation r2 score is :  0.7441091551777725








5 th . the obtained validation r2 score is :  0.6777889241836413








6 th . the obtained validation r2 score is :  0.6923842574115702








7 th . the obtained validation r2 score is :  0.6084364312383368








8 th . the obtained validation r2 score is :  0.6543792017897527








9 th . the obtained validation r2 score is :  0.7602250206588469








10 th . the obtained validation r2 score is :  0.633093902803056








1 th . the obtained validation r2 score is :  0.8005017108534964








2 th . the obtained validation r2 score is :  0.8068127431920468








3 th . the obtained validation r2 score is :  0.6248926378623545








4 th . the obtained validation r2 score is :  0.7440634295041284








5 th . the obtained validation r2 score is :  0.6777756803197879








6 th . the obtained validation r2 score is :  0.6923187309932675








7 th . the obtained validation r2 score is :  0.6084804636501912








8 th . the obtained validation r2 score is :  0.6543801618222038






ABNORMAL_TERMINATION_IN_LNSRCH.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
  _check_optimize_result("lbfgs", opt_res)




ABNORMAL_TERMINATION_IN_LNSRCH.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
  _check_optimize_result("lbfgs", opt_res)


9 th . the obtained validation r2 score is :  0.7602055644333328








10 th . the obtained validation r2 score is :  0.6331413345160739








1 th . the obtained validation r2 score is :  0.8005155398634458








2 th . the obtained validation r2 score is :  0.8067992922922671








3 th . the obtained validation r2 score is :  0.6247492105248867








4 th . the obtained validation r2 score is :  0.7440175214140698








5 th . the obtained validation r2 score is :  0.6777616244328042








6 th . the obtained validation r2 score is :  0.6922543089092305








7 th . the obtained validation r2 score is :  0.6085228823106024








8 th . the obtained validation r2 score is :  0.6543801715192552








9 th . the obtained validation r2 score is :  0.7601859829001082








10 th . the obtained validation r2 score is :  0.6331859983653738


In [66]:
score_trial_u

array([0.70044048, 0.70045886, 0.70047262, 0.70048226, 0.70048825,
       0.700491  , 0.70049085, 0.70048813, 0.70048314, 0.70047612,
       0.70046727, 0.70045686, 0.70044501, 0.7004319 , 0.70041768,
       0.70040248, 0.70038641, 0.70036958, 0.70035207, 0.70033399,
       0.7003154 , 0.70029637, 0.70027696, 0.70025725, 0.70023725])

In [67]:
u_trial

[1.7,
 1.75,
 1.8,
 1.85,
 1.9,
 1.95,
 2.0,
 2.05,
 2.1,
 2.15,
 2.2,
 2.25,
 2.3,
 2.35,
 2.4,
 2.45,
 2.5,
 2.55,
 2.6,
 2.65,
 2.7,
 2.75,
 2.8,
 2.85,
 2.9000000000000004]

In [None]:
score,y_pred = train_k_fold_2GP_LGB(X_lgb,X_test_lgb,X_gp_quad,X_test_gp_quad,X_gp_rbf,X_test_gp_rbf, y_processed , weight1 = 0.578, weight2 = 0.64, fold_num=20,l = 0.9, u = 2.0)







1 th . the obtained validation r2 score is :  0.820858127402781








2 th . the obtained validation r2 score is :  0.7134513840694123








3 th . the obtained validation r2 score is :  0.7303520875922525








4 th . the obtained validation r2 score is :  0.7021591781329879








5 th . the obtained validation r2 score is :  0.6988122115772255








6 th . the obtained validation r2 score is :  0.53739542488767








7 th . the obtained validation r2 score is :  0.6761526590719162








8 th . the obtained validation r2 score is :  0.6078886551282728










In [76]:
score

0.6974230433625703

In [77]:
final_res = np.vstack((indices_test, y_pred)).T
df_res = pd.DataFrame(final_res)
df_res.to_csv("our_result_0.697.csv", header = ["id", "y"], index=False)