## Libraries import

In [1]:
import os
import glob
import random
import numpy as np
import pandas as pd
import lightgbm as lgb
from sklearn.model_selection import KFold, GroupKFold, cross_val_score

In [2]:
SEED = 42
random.seed(SEED)
np.random.seed(SEED)

In [3]:
numFolds = 5

In [4]:
feature_dir = "referencePublicNotebooks/500Features"

In [5]:
# the metric used in this competition
def comp_metric(xhat, yhat, fhat, x, y, f):
    intermediate = np.sqrt(np.power(xhat - x,2) + np.power(yhat-y,2)) + 15 * np.abs(fhat-f)
    return intermediate.sum()/xhat.shape[0]

# get our train and test files
train_files = sorted(glob.glob(os.path.join(feature_dir, 'train/*_train.csv')))
test_files = sorted(glob.glob(os.path.join(feature_dir, 'test/*_test.csv')))
ssubm = pd.read_csv('sample_submission.csv', index_col=0)

In [6]:
len(train_files),len(test_files)

(24, 24)

In [7]:
e = 0
data = pd.read_csv(train_files[0], index_col=0)
test_data = pd.read_csv(test_files[e], index_col=0)
print(data.shape, test_data.shape)

(9296, 1655) (299, 1652)


In [8]:
x_train = data.iloc[:,:-4]
y_trainy = data.iloc[:,-3]
y_trainx = data.iloc[:,-4]
y_trainf = data.iloc[:,-2]

In [9]:
kfold = KFold(n_splits=numFolds, random_state=SEED, shuffle=True)
modely = lgb.LGBMRegressor(n_estimators=125, num_leaves=90)
modelx = lgb.LGBMRegressor(n_estimators=125, num_leaves=90)
modelf = lgb.LGBMClassifier(n_estimators=125, num_leaves=90)

In [10]:
results = cross_val_score(modely, x_train, y_trainy, cv=kfold)
print(f"Cross val score for y coordinate is {results}")

Cross val score for y coordinate is [0.99514769 0.99598623 0.99527829 0.99353552 0.99519227]


In [11]:
results = cross_val_score(modely, x_train, y_trainx, cv=kfold)
print(f"Cross val score for x coordinate is {results}")

Cross val score for x coordinate is [0.99118581 0.99413059 0.99269703 0.9927723  0.99332617]


In [12]:
results = cross_val_score(modely, x_train, y_trainf, cv=kfold)
print(f"Cross val score for floor is {results}")

Cross val score for floor is [0.99663275 0.99815239 0.99717767 0.99790664 0.99739433]
