In [25]:
import numpy as np
import pandas as pd
import matplotlib.pyplot as plt
import seaborn as sns

from sklearn.model_selection import train_test_split
from sklearn.metrics import mean_squared_error, r2_score

In [2]:
df = pd.read_csv('airbnb_listing_train.csv')
df.head()

Unnamed: 0,id,name,host_id,host_name,neighbourhood_group,neighbourhood,latitude,longitude,room_type,minimum_nights,number_of_reviews,last_review,reviews_per_month,calculated_host_listings_count,availability_365,price
0,11602914,Luxury home 100m2+garden in center!,3123809,Marjolein,,De Pijp - Rivierenbuurt,52.35368,4.90177,Entire home/apt,3,13,15-02-2020,0.27,1,0,220
1,13289321,East is where your home is!,10259430,Ana,,Oud-Oost,52.35728,4.92052,Entire home/apt,4,14,19-06-2019,0.29,1,0,110
2,40779315,Amsterdam Central - LUXURY house in BUSY STREET,224969266,Mark,,Centrum-West,52.37582,4.8985,Entire home/apt,2,9,16-03-2020,1.65,1,7,100
3,7820311,great appartment down town,693472,Ayden,,Westerpark,52.37792,4.873,Entire home/apt,3,42,17-02-2020,0.72,1,0,130
4,27346603,Private room with canal view in peaceful area,41888346,Alissa,,Westerpark,52.38051,4.87493,Private room,2,89,26-02-2020,4.02,1,24,90


# About the Data

>The code competition data set can be found below. There are 3 different data sets available:

* **airbnb_listing_train.csv:** this data set can be used to build and test your model. It contains all the variables including the variable that has to be predicted i.e. price. This dataset contains 12901 observations/records divided into 16 columns (including the target column - 'price')
* **airbnb_listing_validate.csv:** this data set should be used to create the submissions. The data set contains all the variables that are also in the train data set except for the 'price'.
* **sample_submission.csv:** this is an example of what your submissions should look like. Note that there are no automatic checks performed on your uploaded file so make sure that your submission file matches this file perfectly. Also, note that the order in which observations are presented in the validation set must be preserved when delivering predictions.

>The data sets have not been cleaned since this is an important step in creating a predictive model. Note also that there are many opportunities to engineer your own features. It is allowed to merge your data with other online data as long as you can make sure that your model also works on the validation data. Note also that the data sets are large so be aware of overfitting your models.
Feature Description


* id: The id of each lodge/home/listing
* name: The name/description of the lodge/home
* host_id: The id of the host
* host_name: Name of the host
* neighbourhood: Name of the neighbourhood place
* neighbourhood_group: Group in the neighbourhood
* latitude: Latitude of the location
* longitude: Longitude of the location
* room_type: Type of the room that consumer booked, for example, private room or an entire home, etc.
* minimum_nights: The minimum number of nights customer will stay
* number_of_reviews: Number of reviews given to the lodge/home
* last_review: The date of the last review given to the lodge/home
* reviews_per_month: Average reviews per month
* calculated_host_listings_count: The count of the listing that each host has
* availability_365: The number of days (out of 365 days) for which lodge/home is available
* price: Price for the lodging/homestays in USD - the target variable

In [3]:
df.info()

<class 'pandas.core.frame.DataFrame'>
RangeIndex: 12901 entries, 0 to 12900
Data columns (total 16 columns):
 #   Column                          Non-Null Count  Dtype  
---  ------                          --------------  -----  
 0   id                              12901 non-null  int64  
 1   name                            12879 non-null  object 
 2   host_id                         12901 non-null  int64  
 3   host_name                       12893 non-null  object 
 4   neighbourhood_group             0 non-null      float64
 5   neighbourhood                   12901 non-null  object 
 6   latitude                        12901 non-null  float64
 7   longitude                       12901 non-null  float64
 8   room_type                       12901 non-null  object 
 9   minimum_nights                  12901 non-null  int64  
 10  number_of_reviews               12901 non-null  int64  
 11  last_review                     11305 non-null  object 
 12  reviews_per_month               

In [9]:
df.describe()

Unnamed: 0,id,host_id,neighbourhood_group,latitude,longitude,minimum_nights,number_of_reviews,reviews_per_month,calculated_host_listings_count,availability_365,price
count,12901.0,12901.0,0.0,12901.0,12901.0,12901.0,12901.0,11305.0,12901.0,12901.0,12901.0
mean,19849230.0,63217000.0,,52.365313,4.889744,3.542516,24.803194,0.748501,2.136501,61.392295,166.959538
std,12162410.0,80108140.0,,0.016418,0.036016,15.154077,53.406134,1.260791,6.001838,107.988329,234.79463
min,20168.0,3592.0,,52.28927,4.75572,1.0,0.0,0.01,1.0,0.0,6.0
25%,9869642.0,8948269.0,,52.35519,4.86395,2.0,2.0,0.18,1.0,0.0,99.0
50%,18749390.0,27116010.0,,52.36457,4.88713,2.0,9.0,0.38,1.0,0.0,135.0
75%,29142320.0,83376860.0,,52.37511,4.90931,3.0,24.0,0.77,1.0,87.0,190.0
max,43709000.0,349017500.0,,52.42509,5.0184,1001.0,843.0,50.0,78.0,365.0,9000.0


In [None]:
df2 = df.drop(['id', 'name', 'host_id', 'host_name', 'neighbourhood_group', 'last_review'], axis = 1)
df2.head()

In [10]:
df2.info()

<class 'pandas.core.frame.DataFrame'>
RangeIndex: 12901 entries, 0 to 12900
Data columns (total 10 columns):
 #   Column                          Non-Null Count  Dtype  
---  ------                          --------------  -----  
 0   neighbourhood                   12901 non-null  object 
 1   latitude                        12901 non-null  float64
 2   longitude                       12901 non-null  float64
 3   room_type                       12901 non-null  object 
 4   minimum_nights                  12901 non-null  int64  
 5   number_of_reviews               12901 non-null  int64  
 6   reviews_per_month               11305 non-null  float64
 7   calculated_host_listings_count  12901 non-null  int64  
 8   availability_365                12901 non-null  int64  
 9   price                           12901 non-null  int64  
dtypes: float64(3), int64(5), object(2)
memory usage: 1008.0+ KB


In [11]:
df3 = df2.copy()
df3.reviews_per_month.fillna(df3['reviews_per_month'].mean(), inplace=True)

In [None]:
print(df2.neighbourhood.value_counts())
print('\n')
print(df2.room_type.value_counts())
print('\n')
print(df2.calculated_host_listings_count.value_counts())

In [None]:
df[(df['last_review'].isnull()) & (df['reviews_per_month'].isnull())]

In [21]:
df4 = pd.get_dummies(data = df3, columns = ['neighbourhood', 'room_type'])
df4.head()

Unnamed: 0,latitude,longitude,minimum_nights,number_of_reviews,reviews_per_month,calculated_host_listings_count,availability_365,price,neighbourhood_Bijlmer-Centrum,neighbourhood_Bijlmer-Oost,...,neighbourhood_Oud-Noord,neighbourhood_Oud-Oost,neighbourhood_Slotervaart,neighbourhood_Watergraafsmeer,neighbourhood_Westerpark,neighbourhood_Zuid,room_type_Entire home/apt,room_type_Hotel room,room_type_Private room,room_type_Shared room
0,52.35368,4.90177,3,13,0.27,1,0,220,0,0,...,0,0,0,0,0,0,1,0,0,0
1,52.35728,4.92052,4,14,0.29,1,0,110,0,0,...,0,1,0,0,0,0,1,0,0,0
2,52.37582,4.8985,2,9,1.65,1,7,100,0,0,...,0,0,0,0,0,0,1,0,0,0
3,52.37792,4.873,3,42,0.72,1,0,130,0,0,...,0,0,0,0,1,0,1,0,0,0
4,52.38051,4.87493,2,89,4.02,1,24,90,0,0,...,0,0,0,0,1,0,0,0,1,0


In [None]:
df4.info()

In [23]:
X = df4.drop(columns = ['price'])
y = df4.price

In [70]:
from sklearn import preprocessing

x = X.values #returns a numpy array
min_max_scaler = preprocessing.MinMaxScaler()
x_scaled = min_max_scaler.fit_transform(x)
df5 = pd.DataFrame(x_scaled)

In [74]:
#df5.head()

Unnamed: 0,0,1,2,3,4,5,6,7,8,9,...,23,24,25,26,27,28,29,30,31,32
0,0.474231,0.556,0.002,0.015421,0.005201,0.0,0.0,0.0,0.0,0.0,...,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0
1,0.500736,0.627379,0.003,0.016607,0.005601,0.0,0.0,0.0,0.0,0.0,...,0.0,1.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0
2,0.63724,0.543551,0.001,0.010676,0.032807,0.0,0.019178,0.0,0.0,0.0,...,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0
3,0.652702,0.446475,0.002,0.049822,0.014203,0.0,0.0,0.0,0.0,0.0,...,0.0,0.0,0.0,0.0,1.0,0.0,1.0,0.0,0.0,0.0
4,0.671771,0.453822,0.001,0.105575,0.080216,0.0,0.065753,0.0,0.0,0.0,...,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,1.0,0.0


In [223]:
X_train,X_test,y_train,y_test = train_test_split(X,y,test_size = 0.2, random_state = 42)

In [27]:
from sklearn.linear_model import LinearRegression

In [31]:
lr = LinearRegression()
lr.fit(X_train, y_train)

lr_pred = lr.predict(X_test)

mse_lr = mean_squared_error(y_test, lr_pred)
r2_lr = r2_score(y_test, lr_pred)
#mae_lr = mean_absolute_error(y_test, lr_pred)
rmse_lr = (np.sqrt(mean_squared_error(y_test, lr_pred)))
#print("MAE of the LR model is: {}".format(mae_lr))
print("MSE of the LR model is: {}".format(mse_lr))
print("R2 score of the LR model is: {}".format(r2_lr))
print("RMSE of the LR model is: {}".format(rmse_lr))

MSE of the LR model is: 42504.106397464835
R2 score of the LR model is: 0.04742644013588537
RMSE of the LR model is: 206.16524051707853


In [41]:
from sklearn.tree import DecisionTreeRegressor
dtr = DecisionTreeRegressor(max_depth=6, max_features='auto', random_state=53)
dtr.fit(X_train, y_train)

dtr_pred = dtr.predict(X_test)

#mae_dtr = mean_absolute_error(y_test, dtr_pred)
mse_dtr = mean_squared_error(y_test, dtr_pred)
r2_dtr = r2_score(y_test, dtr_pred)
rmse_dtr = (np.sqrt(mean_squared_error(y_test, dtr_pred)))
#print("MAE of the DTR model is: {}".format(mae_lr))
print("MSE of the DTR model is: {}".format(mse_dtr))
print("R2 score of the DTR model is: {}".format(r2_dtr))
print("RMSE of the DTR model is: {}".format(rmse_dtr))

MSE of the DTR model is: 36287.567376814775
R2 score of the DTR model is: 0.1867473483220179
RMSE of the DTR model is: 190.49295886413958


In [42]:
from sklearn.ensemble import RandomForestRegressor

In [108]:
rfr = RandomForestRegressor(max_depth=8, random_state=42) #(max_depth=6, max_features='auto', random_state=42)
rfr.fit(X_train, y_train)

RandomForestRegressor(bootstrap=True, ccp_alpha=0.0, criterion='mse',
                      max_depth=8, max_features='auto', max_leaf_nodes=None,
                      max_samples=None, min_impurity_decrease=0.0,
                      min_impurity_split=None, min_samples_leaf=1,
                      min_samples_split=2, min_weight_fraction_leaf=0.0,
                      n_estimators=100, n_jobs=None, oob_score=False,
                      random_state=42, verbose=0, warm_start=False)

In [109]:
rfr_pred = rfr.predict(X_test)

#mae_rfr = mean_absolute_error(y_test, rfr_pred)
mse_rfr = mean_squared_error(y_test, rfr_pred)
r2_rfr = r2_score(y_test, rfr_pred)
rmse_rfr = (np.sqrt(mean_squared_error(y_test, rfr_pred)))
#print("MAE of the RFR model is: {}".format(mae_rfr))
print("MSE of the RFR model is: {}".format(mse_rfr))
print("R2 score of the RFR model is: {}".format(r2_rfr))
print("RMSE of the RFR model is: {}".format(rmse_rfr))

MSE of the RFR model is: 34968.145877285686
R2 score of the RFR model is: 0.2884468113085118
RMSE of the RFR model is: 186.99771623548156


In [None]:
!pip install optuna

In [None]:
import optuna

# def objective(trial):
#     rf_max_depth = trial.suggest_int('rf_max_depth', 2, 12)
#     regressor_obj = RandomForestRegressor(max_depth=rf_max_depth)

#     regressor_obj.fit(X_train, y_train)
#     y_pred = regressor_obj.predict(X_test)

#     error = (np.sqrt(mean_squared_error(y_test, y_pred)))

#     return error

# study = optuna.create_study()
# study.optimize(objective, n_trials=20)
# print(study.best_trial)

In [234]:
from xgboost import XGBRegressor

xgb_model = XGBRegressor(max_depth=6, learning_rate = 0.355) #0.2777) #0.34410) #0.264145) #0.26122) #0.35125) 
xgb_model.fit(X_train, y_train)

XGBRegressor(base_score=0.5, booster='gbtree', colsample_bylevel=1,
             colsample_bynode=1, colsample_bytree=1, gamma=0, gpu_id=-1,
             importance_type='gain', interaction_constraints='',
             learning_rate=0.355, max_delta_step=0, max_depth=6,
             min_child_weight=1, missing=nan, monotone_constraints='()',
             n_estimators=100, n_jobs=0, num_parallel_tree=1,
             objective='reg:squarederror', random_state=0, reg_alpha=0,
             reg_lambda=1, scale_pos_weight=1, subsample=1, tree_method='exact',
             validate_parameters=1, verbosity=None)

In [235]:
xgb_pred = xgb_model.predict(X_test)

#mae_xgb = mean_absolute_error(y_test, xgb_pred)
mse_xgb = mean_squared_error(y_test, xgb_pred)
r2_xgb = r2_score(y_test, xgb_pred)
rmse_xgb = (np.sqrt(mean_squared_error(y_test, xgb_pred)))
#print("MAE of the XGB model is: {}".format(mae_xgb))
print("MSE of the XGB model is: {}".format(mse_xgb))
print("R2 score of the XGB model is: {}".format(r2_xgb))
print("RMSE of the XGB model is: {}".format(rmse_xgb))

MSE of the XGB model is: 31849.245250920692
R2 score of the XGB model is: 0.23709355886305938
RMSE of the XGB model is: 178.463568413614


In [229]:
import xgboost as xgb

def objective(trial):
    
    dtrain = xgb.DMatrix(X_train, label=y_train)
    dvalid = xgb.DMatrix(X_test, label=y_test)
    
    param = {
        "max_depth" : trial.suggest_int("max_depth", 4, 6),
        "lr_rate" : trial.suggest_float("lr_rate", 0.2, 0.4)
    }

    bst = xgb.train(param, dtrain)
    preds = bst.predict(dvalid)
    predics = np.rint(preds)
    
    error = (np.sqrt(mean_squared_error(y_test, predics)))

    return error

study = optuna.create_study()
study.optimize(objective, n_trials=100)
print(study.best_trial)

Parameters: { lr_rate } might not be used.

  This may not be accurate due to some parameters are only used in language bindings but
  passed down to XGBoost core.  Or some parameters are not used but slip through this
  verification. Please open an issue if you find above cases.




[I 2020-07-29 23:08:08,987] Trial 0 finished with value: 186.79683773149054 and parameters: {'max_depth': 4, 'lr_rate': 0.21750561465896734}. Best is trial 0 with value: 186.79683773149054.


Parameters: { lr_rate } might not be used.

  This may not be accurate due to some parameters are only used in language bindings but
  passed down to XGBoost core.  Or some parameters are not used but slip through this
  verification. Please open an issue if you find above cases.




[I 2020-07-29 23:08:09,159] Trial 1 finished with value: 182.5297324377773 and parameters: {'max_depth': 6, 'lr_rate': 0.22780901154216637}. Best is trial 1 with value: 182.5297324377773.


Parameters: { lr_rate } might not be used.

  This may not be accurate due to some parameters are only used in language bindings but
  passed down to XGBoost core.  Or some parameters are not used but slip through this
  verification. Please open an issue if you find above cases.




[I 2020-07-29 23:08:09,315] Trial 2 finished with value: 182.5297324377773 and parameters: {'max_depth': 6, 'lr_rate': 0.2048424024666599}. Best is trial 1 with value: 182.5297324377773.


Parameters: { lr_rate } might not be used.

  This may not be accurate due to some parameters are only used in language bindings but
  passed down to XGBoost core.  Or some parameters are not used but slip through this
  verification. Please open an issue if you find above cases.




[I 2020-07-29 23:08:09,471] Trial 3 finished with value: 178.34816740261462 and parameters: {'max_depth': 5, 'lr_rate': 0.25383180265157096}. Best is trial 3 with value: 178.34816740261462.


Parameters: { lr_rate } might not be used.

  This may not be accurate due to some parameters are only used in language bindings but
  passed down to XGBoost core.  Or some parameters are not used but slip through this
  verification. Please open an issue if you find above cases.




[I 2020-07-29 23:08:09,612] Trial 4 finished with value: 186.79683773149054 and parameters: {'max_depth': 4, 'lr_rate': 0.2360955536290711}. Best is trial 3 with value: 178.34816740261462.


Parameters: { lr_rate } might not be used.

  This may not be accurate due to some parameters are only used in language bindings but
  passed down to XGBoost core.  Or some parameters are not used but slip through this
  verification. Please open an issue if you find above cases.




[I 2020-07-29 23:08:09,762] Trial 5 finished with value: 178.34816740261462 and parameters: {'max_depth': 5, 'lr_rate': 0.38254726523222754}. Best is trial 3 with value: 178.34816740261462.


Parameters: { lr_rate } might not be used.

  This may not be accurate due to some parameters are only used in language bindings but
  passed down to XGBoost core.  Or some parameters are not used but slip through this
  verification. Please open an issue if you find above cases.




[I 2020-07-29 23:08:09,902] Trial 6 finished with value: 186.79683773149054 and parameters: {'max_depth': 4, 'lr_rate': 0.22788906946689313}. Best is trial 3 with value: 178.34816740261462.


Parameters: { lr_rate } might not be used.

  This may not be accurate due to some parameters are only used in language bindings but
  passed down to XGBoost core.  Or some parameters are not used but slip through this
  verification. Please open an issue if you find above cases.




[I 2020-07-29 23:08:10,052] Trial 7 finished with value: 178.34816740261462 and parameters: {'max_depth': 5, 'lr_rate': 0.2391490642183435}. Best is trial 3 with value: 178.34816740261462.


Parameters: { lr_rate } might not be used.

  This may not be accurate due to some parameters are only used in language bindings but
  passed down to XGBoost core.  Or some parameters are not used but slip through this
  verification. Please open an issue if you find above cases.




[I 2020-07-29 23:08:10,207] Trial 8 finished with value: 178.34816740261462 and parameters: {'max_depth': 5, 'lr_rate': 0.33042858107330075}. Best is trial 3 with value: 178.34816740261462.


Parameters: { lr_rate } might not be used.

  This may not be accurate due to some parameters are only used in language bindings but
  passed down to XGBoost core.  Or some parameters are not used but slip through this
  verification. Please open an issue if you find above cases.




[I 2020-07-29 23:08:10,376] Trial 9 finished with value: 182.5297324377773 and parameters: {'max_depth': 6, 'lr_rate': 0.3570635344742513}. Best is trial 3 with value: 178.34816740261462.


Parameters: { lr_rate } might not be used.

  This may not be accurate due to some parameters are only used in language bindings but
  passed down to XGBoost core.  Or some parameters are not used but slip through this
  verification. Please open an issue if you find above cases.




[I 2020-07-29 23:08:10,537] Trial 10 finished with value: 178.34816740261462 and parameters: {'max_depth': 5, 'lr_rate': 0.2818696639608368}. Best is trial 3 with value: 178.34816740261462.


Parameters: { lr_rate } might not be used.

  This may not be accurate due to some parameters are only used in language bindings but
  passed down to XGBoost core.  Or some parameters are not used but slip through this
  verification. Please open an issue if you find above cases.




[I 2020-07-29 23:08:10,692] Trial 11 finished with value: 178.34816740261462 and parameters: {'max_depth': 5, 'lr_rate': 0.3956640286662092}. Best is trial 3 with value: 178.34816740261462.


Parameters: { lr_rate } might not be used.

  This may not be accurate due to some parameters are only used in language bindings but
  passed down to XGBoost core.  Or some parameters are not used but slip through this
  verification. Please open an issue if you find above cases.




[I 2020-07-29 23:08:10,842] Trial 12 finished with value: 178.34816740261462 and parameters: {'max_depth': 5, 'lr_rate': 0.27886702436024846}. Best is trial 3 with value: 178.34816740261462.


Parameters: { lr_rate } might not be used.

  This may not be accurate due to some parameters are only used in language bindings but
  passed down to XGBoost core.  Or some parameters are not used but slip through this
  verification. Please open an issue if you find above cases.




[I 2020-07-29 23:08:10,993] Trial 13 finished with value: 178.34816740261462 and parameters: {'max_depth': 5, 'lr_rate': 0.3863645131597803}. Best is trial 3 with value: 178.34816740261462.


Parameters: { lr_rate } might not be used.

  This may not be accurate due to some parameters are only used in language bindings but
  passed down to XGBoost core.  Or some parameters are not used but slip through this
  verification. Please open an issue if you find above cases.




[I 2020-07-29 23:08:11,164] Trial 14 finished with value: 182.5297324377773 and parameters: {'max_depth': 6, 'lr_rate': 0.3143160463218653}. Best is trial 3 with value: 178.34816740261462.


Parameters: { lr_rate } might not be used.

  This may not be accurate due to some parameters are only used in language bindings but
  passed down to XGBoost core.  Or some parameters are not used but slip through this
  verification. Please open an issue if you find above cases.




[I 2020-07-29 23:08:11,304] Trial 15 finished with value: 186.79683773149054 and parameters: {'max_depth': 4, 'lr_rate': 0.2585063332263387}. Best is trial 3 with value: 178.34816740261462.


Parameters: { lr_rate } might not be used.

  This may not be accurate due to some parameters are only used in language bindings but
  passed down to XGBoost core.  Or some parameters are not used but slip through this
  verification. Please open an issue if you find above cases.




[I 2020-07-29 23:08:11,470] Trial 16 finished with value: 178.34816740261462 and parameters: {'max_depth': 5, 'lr_rate': 0.35502762363917406}. Best is trial 3 with value: 178.34816740261462.


Parameters: { lr_rate } might not be used.

  This may not be accurate due to some parameters are only used in language bindings but
  passed down to XGBoost core.  Or some parameters are not used but slip through this
  verification. Please open an issue if you find above cases.




[I 2020-07-29 23:08:11,626] Trial 17 finished with value: 178.34816740261462 and parameters: {'max_depth': 5, 'lr_rate': 0.32676992619232065}. Best is trial 3 with value: 178.34816740261462.


Parameters: { lr_rate } might not be used.

  This may not be accurate due to some parameters are only used in language bindings but
  passed down to XGBoost core.  Or some parameters are not used but slip through this
  verification. Please open an issue if you find above cases.




[I 2020-07-29 23:08:11,772] Trial 18 finished with value: 186.79683773149054 and parameters: {'max_depth': 4, 'lr_rate': 0.3464891134500066}. Best is trial 3 with value: 178.34816740261462.


Parameters: { lr_rate } might not be used.

  This may not be accurate due to some parameters are only used in language bindings but
  passed down to XGBoost core.  Or some parameters are not used but slip through this
  verification. Please open an issue if you find above cases.




[I 2020-07-29 23:08:11,947] Trial 19 finished with value: 182.5297324377773 and parameters: {'max_depth': 6, 'lr_rate': 0.2925971762158308}. Best is trial 3 with value: 178.34816740261462.


Parameters: { lr_rate } might not be used.

  This may not be accurate due to some parameters are only used in language bindings but
  passed down to XGBoost core.  Or some parameters are not used but slip through this
  verification. Please open an issue if you find above cases.




[I 2020-07-29 23:08:12,106] Trial 20 finished with value: 178.34816740261462 and parameters: {'max_depth': 5, 'lr_rate': 0.3666546072103447}. Best is trial 3 with value: 178.34816740261462.


Parameters: { lr_rate } might not be used.

  This may not be accurate due to some parameters are only used in language bindings but
  passed down to XGBoost core.  Or some parameters are not used but slip through this
  verification. Please open an issue if you find above cases.




[I 2020-07-29 23:08:12,297] Trial 21 finished with value: 178.34816740261462 and parameters: {'max_depth': 5, 'lr_rate': 0.3156854815512815}. Best is trial 3 with value: 178.34816740261462.


Parameters: { lr_rate } might not be used.

  This may not be accurate due to some parameters are only used in language bindings but
  passed down to XGBoost core.  Or some parameters are not used but slip through this
  verification. Please open an issue if you find above cases.




[I 2020-07-29 23:08:12,492] Trial 22 finished with value: 178.34816740261462 and parameters: {'max_depth': 5, 'lr_rate': 0.28900971748570653}. Best is trial 3 with value: 178.34816740261462.


Parameters: { lr_rate } might not be used.

  This may not be accurate due to some parameters are only used in language bindings but
  passed down to XGBoost core.  Or some parameters are not used but slip through this
  verification. Please open an issue if you find above cases.




[I 2020-07-29 23:08:12,658] Trial 23 finished with value: 178.34816740261462 and parameters: {'max_depth': 5, 'lr_rate': 0.3956788219489109}. Best is trial 3 with value: 178.34816740261462.


Parameters: { lr_rate } might not be used.

  This may not be accurate due to some parameters are only used in language bindings but
  passed down to XGBoost core.  Or some parameters are not used but slip through this
  verification. Please open an issue if you find above cases.




[I 2020-07-29 23:08:12,820] Trial 24 finished with value: 178.34816740261462 and parameters: {'max_depth': 5, 'lr_rate': 0.37543967000342765}. Best is trial 3 with value: 178.34816740261462.


Parameters: { lr_rate } might not be used.

  This may not be accurate due to some parameters are only used in language bindings but
  passed down to XGBoost core.  Or some parameters are not used but slip through this
  verification. Please open an issue if you find above cases.




[I 2020-07-29 23:08:13,019] Trial 25 finished with value: 178.34816740261462 and parameters: {'max_depth': 5, 'lr_rate': 0.26795660603802457}. Best is trial 3 with value: 178.34816740261462.


Parameters: { lr_rate } might not be used.

  This may not be accurate due to some parameters are only used in language bindings but
  passed down to XGBoost core.  Or some parameters are not used but slip through this
  verification. Please open an issue if you find above cases.




[I 2020-07-29 23:08:13,165] Trial 26 finished with value: 186.79683773149054 and parameters: {'max_depth': 4, 'lr_rate': 0.28152173116891743}. Best is trial 3 with value: 178.34816740261462.


Parameters: { lr_rate } might not be used.

  This may not be accurate due to some parameters are only used in language bindings but
  passed down to XGBoost core.  Or some parameters are not used but slip through this
  verification. Please open an issue if you find above cases.




[I 2020-07-29 23:08:13,333] Trial 27 finished with value: 182.5297324377773 and parameters: {'max_depth': 6, 'lr_rate': 0.3115433325375395}. Best is trial 3 with value: 178.34816740261462.


Parameters: { lr_rate } might not be used.

  This may not be accurate due to some parameters are only used in language bindings but
  passed down to XGBoost core.  Or some parameters are not used but slip through this
  verification. Please open an issue if you find above cases.




[I 2020-07-29 23:08:13,493] Trial 28 finished with value: 178.34816740261462 and parameters: {'max_depth': 5, 'lr_rate': 0.373494326766628}. Best is trial 3 with value: 178.34816740261462.


Parameters: { lr_rate } might not be used.

  This may not be accurate due to some parameters are only used in language bindings but
  passed down to XGBoost core.  Or some parameters are not used but slip through this
  verification. Please open an issue if you find above cases.




[I 2020-07-29 23:08:13,627] Trial 29 finished with value: 186.79683773149054 and parameters: {'max_depth': 4, 'lr_rate': 0.3693765132288415}. Best is trial 3 with value: 178.34816740261462.


Parameters: { lr_rate } might not be used.

  This may not be accurate due to some parameters are only used in language bindings but
  passed down to XGBoost core.  Or some parameters are not used but slip through this
  verification. Please open an issue if you find above cases.




[I 2020-07-29 23:08:13,780] Trial 30 finished with value: 178.34816740261462 and parameters: {'max_depth': 5, 'lr_rate': 0.39998685720324445}. Best is trial 3 with value: 178.34816740261462.


Parameters: { lr_rate } might not be used.

  This may not be accurate due to some parameters are only used in language bindings but
  passed down to XGBoost core.  Or some parameters are not used but slip through this
  verification. Please open an issue if you find above cases.




[I 2020-07-29 23:08:13,951] Trial 31 finished with value: 178.34816740261462 and parameters: {'max_depth': 5, 'lr_rate': 0.30236281471276893}. Best is trial 3 with value: 178.34816740261462.


Parameters: { lr_rate } might not be used.

  This may not be accurate due to some parameters are only used in language bindings but
  passed down to XGBoost core.  Or some parameters are not used but slip through this
  verification. Please open an issue if you find above cases.




[I 2020-07-29 23:08:14,101] Trial 32 finished with value: 178.34816740261462 and parameters: {'max_depth': 5, 'lr_rate': 0.29900023414156385}. Best is trial 3 with value: 178.34816740261462.


Parameters: { lr_rate } might not be used.

  This may not be accurate due to some parameters are only used in language bindings but
  passed down to XGBoost core.  Or some parameters are not used but slip through this
  verification. Please open an issue if you find above cases.




[I 2020-07-29 23:08:14,244] Trial 33 finished with value: 178.34816740261462 and parameters: {'max_depth': 5, 'lr_rate': 0.35275390606077267}. Best is trial 3 with value: 178.34816740261462.


Parameters: { lr_rate } might not be used.

  This may not be accurate due to some parameters are only used in language bindings but
  passed down to XGBoost core.  Or some parameters are not used but slip through this
  verification. Please open an issue if you find above cases.




[I 2020-07-29 23:08:14,404] Trial 34 finished with value: 178.34816740261462 and parameters: {'max_depth': 5, 'lr_rate': 0.39762065399389845}. Best is trial 3 with value: 178.34816740261462.


Parameters: { lr_rate } might not be used.

  This may not be accurate due to some parameters are only used in language bindings but
  passed down to XGBoost core.  Or some parameters are not used but slip through this
  verification. Please open an issue if you find above cases.




[I 2020-07-29 23:08:14,565] Trial 35 finished with value: 182.5297324377773 and parameters: {'max_depth': 6, 'lr_rate': 0.3322246663490961}. Best is trial 3 with value: 178.34816740261462.


Parameters: { lr_rate } might not be used.

  This may not be accurate due to some parameters are only used in language bindings but
  passed down to XGBoost core.  Or some parameters are not used but slip through this
  verification. Please open an issue if you find above cases.




[I 2020-07-29 23:08:14,715] Trial 36 finished with value: 178.34816740261462 and parameters: {'max_depth': 5, 'lr_rate': 0.3681155165435116}. Best is trial 3 with value: 178.34816740261462.


Parameters: { lr_rate } might not be used.

  This may not be accurate due to some parameters are only used in language bindings but
  passed down to XGBoost core.  Or some parameters are not used but slip through this
  verification. Please open an issue if you find above cases.




[I 2020-07-29 23:08:14,865] Trial 37 finished with value: 178.34816740261462 and parameters: {'max_depth': 5, 'lr_rate': 0.2649024246301075}. Best is trial 3 with value: 178.34816740261462.


Parameters: { lr_rate } might not be used.

  This may not be accurate due to some parameters are only used in language bindings but
  passed down to XGBoost core.  Or some parameters are not used but slip through this
  verification. Please open an issue if you find above cases.




[I 2020-07-29 23:08:15,024] Trial 38 finished with value: 178.34816740261462 and parameters: {'max_depth': 5, 'lr_rate': 0.261374684366856}. Best is trial 3 with value: 178.34816740261462.


Parameters: { lr_rate } might not be used.

  This may not be accurate due to some parameters are only used in language bindings but
  passed down to XGBoost core.  Or some parameters are not used but slip through this
  verification. Please open an issue if you find above cases.




[I 2020-07-29 23:08:15,175] Trial 39 finished with value: 178.34816740261462 and parameters: {'max_depth': 5, 'lr_rate': 0.24348612987584842}. Best is trial 3 with value: 178.34816740261462.


Parameters: { lr_rate } might not be used.

  This may not be accurate due to some parameters are only used in language bindings but
  passed down to XGBoost core.  Or some parameters are not used but slip through this
  verification. Please open an issue if you find above cases.




[I 2020-07-29 23:08:15,337] Trial 40 finished with value: 182.5297324377773 and parameters: {'max_depth': 6, 'lr_rate': 0.24894896620597606}. Best is trial 3 with value: 178.34816740261462.


Parameters: { lr_rate } might not be used.

  This may not be accurate due to some parameters are only used in language bindings but
  passed down to XGBoost core.  Or some parameters are not used but slip through this
  verification. Please open an issue if you find above cases.




[I 2020-07-29 23:08:15,488] Trial 41 finished with value: 178.34816740261462 and parameters: {'max_depth': 5, 'lr_rate': 0.38768311686149887}. Best is trial 3 with value: 178.34816740261462.


Parameters: { lr_rate } might not be used.

  This may not be accurate due to some parameters are only used in language bindings but
  passed down to XGBoost core.  Or some parameters are not used but slip through this
  verification. Please open an issue if you find above cases.




[I 2020-07-29 23:08:15,646] Trial 42 finished with value: 178.34816740261462 and parameters: {'max_depth': 5, 'lr_rate': 0.3781679620165868}. Best is trial 3 with value: 178.34816740261462.


Parameters: { lr_rate } might not be used.

  This may not be accurate due to some parameters are only used in language bindings but
  passed down to XGBoost core.  Or some parameters are not used but slip through this
  verification. Please open an issue if you find above cases.




[I 2020-07-29 23:08:15,800] Trial 43 finished with value: 178.34816740261462 and parameters: {'max_depth': 5, 'lr_rate': 0.27738736439869177}. Best is trial 3 with value: 178.34816740261462.


Parameters: { lr_rate } might not be used.

  This may not be accurate due to some parameters are only used in language bindings but
  passed down to XGBoost core.  Or some parameters are not used but slip through this
  verification. Please open an issue if you find above cases.




[I 2020-07-29 23:08:15,951] Trial 44 finished with value: 178.34816740261462 and parameters: {'max_depth': 5, 'lr_rate': 0.2121701933957269}. Best is trial 3 with value: 178.34816740261462.


Parameters: { lr_rate } might not be used.

  This may not be accurate due to some parameters are only used in language bindings but
  passed down to XGBoost core.  Or some parameters are not used but slip through this
  verification. Please open an issue if you find above cases.




[I 2020-07-29 23:08:16,105] Trial 45 finished with value: 178.34816740261462 and parameters: {'max_depth': 5, 'lr_rate': 0.26995070918540165}. Best is trial 3 with value: 178.34816740261462.


Parameters: { lr_rate } might not be used.

  This may not be accurate due to some parameters are only used in language bindings but
  passed down to XGBoost core.  Or some parameters are not used but slip through this
  verification. Please open an issue if you find above cases.




[I 2020-07-29 23:08:16,240] Trial 46 finished with value: 186.79683773149054 and parameters: {'max_depth': 4, 'lr_rate': 0.2179941772659948}. Best is trial 3 with value: 178.34816740261462.


Parameters: { lr_rate } might not be used.

  This may not be accurate due to some parameters are only used in language bindings but
  passed down to XGBoost core.  Or some parameters are not used but slip through this
  verification. Please open an issue if you find above cases.




[I 2020-07-29 23:08:16,390] Trial 47 finished with value: 178.34816740261462 and parameters: {'max_depth': 5, 'lr_rate': 0.29121916875428067}. Best is trial 3 with value: 178.34816740261462.


Parameters: { lr_rate } might not be used.

  This may not be accurate due to some parameters are only used in language bindings but
  passed down to XGBoost core.  Or some parameters are not used but slip through this
  verification. Please open an issue if you find above cases.




[I 2020-07-29 23:08:16,550] Trial 48 finished with value: 178.34816740261462 and parameters: {'max_depth': 5, 'lr_rate': 0.39641186236860393}. Best is trial 3 with value: 178.34816740261462.


Parameters: { lr_rate } might not be used.

  This may not be accurate due to some parameters are only used in language bindings but
  passed down to XGBoost core.  Or some parameters are not used but slip through this
  verification. Please open an issue if you find above cases.




[I 2020-07-29 23:08:16,700] Trial 49 finished with value: 178.34816740261462 and parameters: {'max_depth': 5, 'lr_rate': 0.34345949082188487}. Best is trial 3 with value: 178.34816740261462.


Parameters: { lr_rate } might not be used.

  This may not be accurate due to some parameters are only used in language bindings but
  passed down to XGBoost core.  Or some parameters are not used but slip through this
  verification. Please open an issue if you find above cases.




[I 2020-07-29 23:08:16,851] Trial 50 finished with value: 178.34816740261462 and parameters: {'max_depth': 5, 'lr_rate': 0.3787289771598885}. Best is trial 3 with value: 178.34816740261462.


Parameters: { lr_rate } might not be used.

  This may not be accurate due to some parameters are only used in language bindings but
  passed down to XGBoost core.  Or some parameters are not used but slip through this
  verification. Please open an issue if you find above cases.




[I 2020-07-29 23:08:17,011] Trial 51 finished with value: 178.34816740261462 and parameters: {'max_depth': 5, 'lr_rate': 0.3611707258804173}. Best is trial 3 with value: 178.34816740261462.


Parameters: { lr_rate } might not be used.

  This may not be accurate due to some parameters are only used in language bindings but
  passed down to XGBoost core.  Or some parameters are not used but slip through this
  verification. Please open an issue if you find above cases.




[I 2020-07-29 23:08:17,161] Trial 52 finished with value: 178.34816740261462 and parameters: {'max_depth': 5, 'lr_rate': 0.30292238141773586}. Best is trial 3 with value: 178.34816740261462.


Parameters: { lr_rate } might not be used.

  This may not be accurate due to some parameters are only used in language bindings but
  passed down to XGBoost core.  Or some parameters are not used but slip through this
  verification. Please open an issue if you find above cases.




[I 2020-07-29 23:08:17,322] Trial 53 finished with value: 178.34816740261462 and parameters: {'max_depth': 5, 'lr_rate': 0.3884760024493892}. Best is trial 3 with value: 178.34816740261462.


Parameters: { lr_rate } might not be used.

  This may not be accurate due to some parameters are only used in language bindings but
  passed down to XGBoost core.  Or some parameters are not used but slip through this
  verification. Please open an issue if you find above cases.




[I 2020-07-29 23:08:17,485] Trial 54 finished with value: 178.34816740261462 and parameters: {'max_depth': 5, 'lr_rate': 0.3861448529180686}. Best is trial 3 with value: 178.34816740261462.


Parameters: { lr_rate } might not be used.

  This may not be accurate due to some parameters are only used in language bindings but
  passed down to XGBoost core.  Or some parameters are not used but slip through this
  verification. Please open an issue if you find above cases.




[I 2020-07-29 23:08:17,649] Trial 55 finished with value: 178.34816740261462 and parameters: {'max_depth': 5, 'lr_rate': 0.31910174571703703}. Best is trial 3 with value: 178.34816740261462.


Parameters: { lr_rate } might not be used.

  This may not be accurate due to some parameters are only used in language bindings but
  passed down to XGBoost core.  Or some parameters are not used but slip through this
  verification. Please open an issue if you find above cases.




[I 2020-07-29 23:08:17,800] Trial 56 finished with value: 178.34816740261462 and parameters: {'max_depth': 5, 'lr_rate': 0.27104746506835153}. Best is trial 3 with value: 178.34816740261462.


Parameters: { lr_rate } might not be used.

  This may not be accurate due to some parameters are only used in language bindings but
  passed down to XGBoost core.  Or some parameters are not used but slip through this
  verification. Please open an issue if you find above cases.




[I 2020-07-29 23:08:17,952] Trial 57 finished with value: 178.34816740261462 and parameters: {'max_depth': 5, 'lr_rate': 0.30266590754319506}. Best is trial 3 with value: 178.34816740261462.


Parameters: { lr_rate } might not be used.

  This may not be accurate due to some parameters are only used in language bindings but
  passed down to XGBoost core.  Or some parameters are not used but slip through this
  verification. Please open an issue if you find above cases.




[I 2020-07-29 23:08:18,104] Trial 58 finished with value: 178.34816740261462 and parameters: {'max_depth': 5, 'lr_rate': 0.3456765712754726}. Best is trial 3 with value: 178.34816740261462.


Parameters: { lr_rate } might not be used.

  This may not be accurate due to some parameters are only used in language bindings but
  passed down to XGBoost core.  Or some parameters are not used but slip through this
  verification. Please open an issue if you find above cases.




[I 2020-07-29 23:08:18,254] Trial 59 finished with value: 178.34816740261462 and parameters: {'max_depth': 5, 'lr_rate': 0.3055070202997147}. Best is trial 3 with value: 178.34816740261462.


Parameters: { lr_rate } might not be used.

  This may not be accurate due to some parameters are only used in language bindings but
  passed down to XGBoost core.  Or some parameters are not used but slip through this
  verification. Please open an issue if you find above cases.




[I 2020-07-29 23:08:18,412] Trial 60 finished with value: 178.34816740261462 and parameters: {'max_depth': 5, 'lr_rate': 0.38801816370548975}. Best is trial 3 with value: 178.34816740261462.


Parameters: { lr_rate } might not be used.

  This may not be accurate due to some parameters are only used in language bindings but
  passed down to XGBoost core.  Or some parameters are not used but slip through this
  verification. Please open an issue if you find above cases.




[I 2020-07-29 23:08:18,564] Trial 61 finished with value: 178.34816740261462 and parameters: {'max_depth': 5, 'lr_rate': 0.3996815413573171}. Best is trial 3 with value: 178.34816740261462.


Parameters: { lr_rate } might not be used.

  This may not be accurate due to some parameters are only used in language bindings but
  passed down to XGBoost core.  Or some parameters are not used but slip through this
  verification. Please open an issue if you find above cases.




[I 2020-07-29 23:08:18,725] Trial 62 finished with value: 178.34816740261462 and parameters: {'max_depth': 5, 'lr_rate': 0.2562288773997523}. Best is trial 3 with value: 178.34816740261462.


Parameters: { lr_rate } might not be used.

  This may not be accurate due to some parameters are only used in language bindings but
  passed down to XGBoost core.  Or some parameters are not used but slip through this
  verification. Please open an issue if you find above cases.




[I 2020-07-29 23:08:18,875] Trial 63 finished with value: 178.34816740261462 and parameters: {'max_depth': 5, 'lr_rate': 0.3374640651758068}. Best is trial 3 with value: 178.34816740261462.


Parameters: { lr_rate } might not be used.

  This may not be accurate due to some parameters are only used in language bindings but
  passed down to XGBoost core.  Or some parameters are not used but slip through this
  verification. Please open an issue if you find above cases.




[I 2020-07-29 23:08:19,043] Trial 64 finished with value: 178.34816740261462 and parameters: {'max_depth': 5, 'lr_rate': 0.26168052996720725}. Best is trial 3 with value: 178.34816740261462.


Parameters: { lr_rate } might not be used.

  This may not be accurate due to some parameters are only used in language bindings but
  passed down to XGBoost core.  Or some parameters are not used but slip through this
  verification. Please open an issue if you find above cases.




[I 2020-07-29 23:08:19,193] Trial 65 finished with value: 178.34816740261462 and parameters: {'max_depth': 5, 'lr_rate': 0.238950388167775}. Best is trial 3 with value: 178.34816740261462.


Parameters: { lr_rate } might not be used.

  This may not be accurate due to some parameters are only used in language bindings but
  passed down to XGBoost core.  Or some parameters are not used but slip through this
  verification. Please open an issue if you find above cases.




[I 2020-07-29 23:08:19,346] Trial 66 finished with value: 178.34816740261462 and parameters: {'max_depth': 5, 'lr_rate': 0.24499500903920696}. Best is trial 3 with value: 178.34816740261462.


Parameters: { lr_rate } might not be used.

  This may not be accurate due to some parameters are only used in language bindings but
  passed down to XGBoost core.  Or some parameters are not used but slip through this
  verification. Please open an issue if you find above cases.




[I 2020-07-29 23:08:19,496] Trial 67 finished with value: 178.34816740261462 and parameters: {'max_depth': 5, 'lr_rate': 0.2280763187879299}. Best is trial 3 with value: 178.34816740261462.


Parameters: { lr_rate } might not be used.

  This may not be accurate due to some parameters are only used in language bindings but
  passed down to XGBoost core.  Or some parameters are not used but slip through this
  verification. Please open an issue if you find above cases.




[I 2020-07-29 23:08:19,647] Trial 68 finished with value: 178.34816740261462 and parameters: {'max_depth': 5, 'lr_rate': 0.35693720735136064}. Best is trial 3 with value: 178.34816740261462.


Parameters: { lr_rate } might not be used.

  This may not be accurate due to some parameters are only used in language bindings but
  passed down to XGBoost core.  Or some parameters are not used but slip through this
  verification. Please open an issue if you find above cases.




[I 2020-07-29 23:08:19,797] Trial 69 finished with value: 178.34816740261462 and parameters: {'max_depth': 5, 'lr_rate': 0.23060267333530615}. Best is trial 3 with value: 178.34816740261462.


Parameters: { lr_rate } might not be used.

  This may not be accurate due to some parameters are only used in language bindings but
  passed down to XGBoost core.  Or some parameters are not used but slip through this
  verification. Please open an issue if you find above cases.




[I 2020-07-29 23:08:19,946] Trial 70 finished with value: 178.34816740261462 and parameters: {'max_depth': 5, 'lr_rate': 0.24837751225370872}. Best is trial 3 with value: 178.34816740261462.


Parameters: { lr_rate } might not be used.

  This may not be accurate due to some parameters are only used in language bindings but
  passed down to XGBoost core.  Or some parameters are not used but slip through this
  verification. Please open an issue if you find above cases.




[I 2020-07-29 23:08:20,097] Trial 71 finished with value: 178.34816740261462 and parameters: {'max_depth': 5, 'lr_rate': 0.2976419127568985}. Best is trial 3 with value: 178.34816740261462.


Parameters: { lr_rate } might not be used.

  This may not be accurate due to some parameters are only used in language bindings but
  passed down to XGBoost core.  Or some parameters are not used but slip through this
  verification. Please open an issue if you find above cases.




[I 2020-07-29 23:08:20,256] Trial 72 finished with value: 178.34816740261462 and parameters: {'max_depth': 5, 'lr_rate': 0.297270710241598}. Best is trial 3 with value: 178.34816740261462.


Parameters: { lr_rate } might not be used.

  This may not be accurate due to some parameters are only used in language bindings but
  passed down to XGBoost core.  Or some parameters are not used but slip through this
  verification. Please open an issue if you find above cases.




[I 2020-07-29 23:08:20,408] Trial 73 finished with value: 178.34816740261462 and parameters: {'max_depth': 5, 'lr_rate': 0.20267521407036157}. Best is trial 3 with value: 178.34816740261462.


Parameters: { lr_rate } might not be used.

  This may not be accurate due to some parameters are only used in language bindings but
  passed down to XGBoost core.  Or some parameters are not used but slip through this
  verification. Please open an issue if you find above cases.




[I 2020-07-29 23:08:20,558] Trial 74 finished with value: 178.34816740261462 and parameters: {'max_depth': 5, 'lr_rate': 0.3665677648754198}. Best is trial 3 with value: 178.34816740261462.


Parameters: { lr_rate } might not be used.

  This may not be accurate due to some parameters are only used in language bindings but
  passed down to XGBoost core.  Or some parameters are not used but slip through this
  verification. Please open an issue if you find above cases.




[I 2020-07-29 23:08:20,718] Trial 75 finished with value: 178.34816740261462 and parameters: {'max_depth': 5, 'lr_rate': 0.39097055281611276}. Best is trial 3 with value: 178.34816740261462.


Parameters: { lr_rate } might not be used.

  This may not be accurate due to some parameters are only used in language bindings but
  passed down to XGBoost core.  Or some parameters are not used but slip through this
  verification. Please open an issue if you find above cases.




[I 2020-07-29 23:08:20,878] Trial 76 finished with value: 178.34816740261462 and parameters: {'max_depth': 5, 'lr_rate': 0.38118417189638226}. Best is trial 3 with value: 178.34816740261462.


Parameters: { lr_rate } might not be used.

  This may not be accurate due to some parameters are only used in language bindings but
  passed down to XGBoost core.  Or some parameters are not used but slip through this
  verification. Please open an issue if you find above cases.




[I 2020-07-29 23:08:21,028] Trial 77 finished with value: 178.34816740261462 and parameters: {'max_depth': 5, 'lr_rate': 0.361191611358784}. Best is trial 3 with value: 178.34816740261462.


Parameters: { lr_rate } might not be used.

  This may not be accurate due to some parameters are only used in language bindings but
  passed down to XGBoost core.  Or some parameters are not used but slip through this
  verification. Please open an issue if you find above cases.




[I 2020-07-29 23:08:21,186] Trial 78 finished with value: 178.34816740261462 and parameters: {'max_depth': 5, 'lr_rate': 0.32254347595209165}. Best is trial 3 with value: 178.34816740261462.


Parameters: { lr_rate } might not be used.

  This may not be accurate due to some parameters are only used in language bindings but
  passed down to XGBoost core.  Or some parameters are not used but slip through this
  verification. Please open an issue if you find above cases.




[I 2020-07-29 23:08:21,348] Trial 79 finished with value: 178.34816740261462 and parameters: {'max_depth': 5, 'lr_rate': 0.3178127400585408}. Best is trial 3 with value: 178.34816740261462.


Parameters: { lr_rate } might not be used.

  This may not be accurate due to some parameters are only used in language bindings but
  passed down to XGBoost core.  Or some parameters are not used but slip through this
  verification. Please open an issue if you find above cases.




[I 2020-07-29 23:08:21,499] Trial 80 finished with value: 178.34816740261462 and parameters: {'max_depth': 5, 'lr_rate': 0.3112536790428716}. Best is trial 3 with value: 178.34816740261462.


Parameters: { lr_rate } might not be used.

  This may not be accurate due to some parameters are only used in language bindings but
  passed down to XGBoost core.  Or some parameters are not used but slip through this
  verification. Please open an issue if you find above cases.




[I 2020-07-29 23:08:21,657] Trial 81 finished with value: 178.34816740261462 and parameters: {'max_depth': 5, 'lr_rate': 0.2459402870418222}. Best is trial 3 with value: 178.34816740261462.


Parameters: { lr_rate } might not be used.

  This may not be accurate due to some parameters are only used in language bindings but
  passed down to XGBoost core.  Or some parameters are not used but slip through this
  verification. Please open an issue if you find above cases.




[I 2020-07-29 23:08:21,809] Trial 82 finished with value: 178.34816740261462 and parameters: {'max_depth': 5, 'lr_rate': 0.219773821993792}. Best is trial 3 with value: 178.34816740261462.


Parameters: { lr_rate } might not be used.

  This may not be accurate due to some parameters are only used in language bindings but
  passed down to XGBoost core.  Or some parameters are not used but slip through this
  verification. Please open an issue if you find above cases.




[I 2020-07-29 23:08:21,958] Trial 83 finished with value: 178.34816740261462 and parameters: {'max_depth': 5, 'lr_rate': 0.38855292662956226}. Best is trial 3 with value: 178.34816740261462.


Parameters: { lr_rate } might not be used.

  This may not be accurate due to some parameters are only used in language bindings but
  passed down to XGBoost core.  Or some parameters are not used but slip through this
  verification. Please open an issue if you find above cases.




[I 2020-07-29 23:08:22,110] Trial 84 finished with value: 178.34816740261462 and parameters: {'max_depth': 5, 'lr_rate': 0.3842860816747922}. Best is trial 3 with value: 178.34816740261462.


Parameters: { lr_rate } might not be used.

  This may not be accurate due to some parameters are only used in language bindings but
  passed down to XGBoost core.  Or some parameters are not used but slip through this
  verification. Please open an issue if you find above cases.




[I 2020-07-29 23:08:22,260] Trial 85 finished with value: 178.34816740261462 and parameters: {'max_depth': 5, 'lr_rate': 0.3218450924117304}. Best is trial 3 with value: 178.34816740261462.


Parameters: { lr_rate } might not be used.

  This may not be accurate due to some parameters are only used in language bindings but
  passed down to XGBoost core.  Or some parameters are not used but slip through this
  verification. Please open an issue if you find above cases.




[I 2020-07-29 23:08:22,420] Trial 86 finished with value: 178.34816740261462 and parameters: {'max_depth': 5, 'lr_rate': 0.3052932224550648}. Best is trial 3 with value: 178.34816740261462.


Parameters: { lr_rate } might not be used.

  This may not be accurate due to some parameters are only used in language bindings but
  passed down to XGBoost core.  Or some parameters are not used but slip through this
  verification. Please open an issue if you find above cases.




[I 2020-07-29 23:08:22,570] Trial 87 finished with value: 178.34816740261462 and parameters: {'max_depth': 5, 'lr_rate': 0.275446319763522}. Best is trial 3 with value: 178.34816740261462.


Parameters: { lr_rate } might not be used.

  This may not be accurate due to some parameters are only used in language bindings but
  passed down to XGBoost core.  Or some parameters are not used but slip through this
  verification. Please open an issue if you find above cases.




[I 2020-07-29 23:08:22,721] Trial 88 finished with value: 178.34816740261462 and parameters: {'max_depth': 5, 'lr_rate': 0.2855135139955882}. Best is trial 3 with value: 178.34816740261462.


Parameters: { lr_rate } might not be used.

  This may not be accurate due to some parameters are only used in language bindings but
  passed down to XGBoost core.  Or some parameters are not used but slip through this
  verification. Please open an issue if you find above cases.




[I 2020-07-29 23:08:22,871] Trial 89 finished with value: 178.34816740261462 and parameters: {'max_depth': 5, 'lr_rate': 0.3343132899624938}. Best is trial 3 with value: 178.34816740261462.


Parameters: { lr_rate } might not be used.

  This may not be accurate due to some parameters are only used in language bindings but
  passed down to XGBoost core.  Or some parameters are not used but slip through this
  verification. Please open an issue if you find above cases.




[I 2020-07-29 23:08:23,033] Trial 90 finished with value: 178.34816740261462 and parameters: {'max_depth': 5, 'lr_rate': 0.21154467965419974}. Best is trial 3 with value: 178.34816740261462.


Parameters: { lr_rate } might not be used.

  This may not be accurate due to some parameters are only used in language bindings but
  passed down to XGBoost core.  Or some parameters are not used but slip through this
  verification. Please open an issue if you find above cases.




[I 2020-07-29 23:08:23,181] Trial 91 finished with value: 178.34816740261462 and parameters: {'max_depth': 5, 'lr_rate': 0.2560857585713546}. Best is trial 3 with value: 178.34816740261462.


Parameters: { lr_rate } might not be used.

  This may not be accurate due to some parameters are only used in language bindings but
  passed down to XGBoost core.  Or some parameters are not used but slip through this
  verification. Please open an issue if you find above cases.




[I 2020-07-29 23:08:23,332] Trial 92 finished with value: 178.34816740261462 and parameters: {'max_depth': 5, 'lr_rate': 0.2344733743432349}. Best is trial 3 with value: 178.34816740261462.


Parameters: { lr_rate } might not be used.

  This may not be accurate due to some parameters are only used in language bindings but
  passed down to XGBoost core.  Or some parameters are not used but slip through this
  verification. Please open an issue if you find above cases.




[I 2020-07-29 23:08:23,492] Trial 93 finished with value: 178.34816740261462 and parameters: {'max_depth': 5, 'lr_rate': 0.31139945806067504}. Best is trial 3 with value: 178.34816740261462.


Parameters: { lr_rate } might not be used.

  This may not be accurate due to some parameters are only used in language bindings but
  passed down to XGBoost core.  Or some parameters are not used but slip through this
  verification. Please open an issue if you find above cases.




[I 2020-07-29 23:08:23,630] Trial 94 finished with value: 178.34816740261462 and parameters: {'max_depth': 5, 'lr_rate': 0.31039040830589554}. Best is trial 3 with value: 178.34816740261462.


Parameters: { lr_rate } might not be used.

  This may not be accurate due to some parameters are only used in language bindings but
  passed down to XGBoost core.  Or some parameters are not used but slip through this
  verification. Please open an issue if you find above cases.




[I 2020-07-29 23:08:23,793] Trial 95 finished with value: 178.34816740261462 and parameters: {'max_depth': 5, 'lr_rate': 0.2410918729419539}. Best is trial 3 with value: 178.34816740261462.


Parameters: { lr_rate } might not be used.

  This may not be accurate due to some parameters are only used in language bindings but
  passed down to XGBoost core.  Or some parameters are not used but slip through this
  verification. Please open an issue if you find above cases.




[I 2020-07-29 23:08:23,943] Trial 96 finished with value: 178.34816740261462 and parameters: {'max_depth': 5, 'lr_rate': 0.2335490690721948}. Best is trial 3 with value: 178.34816740261462.


Parameters: { lr_rate } might not be used.

  This may not be accurate due to some parameters are only used in language bindings but
  passed down to XGBoost core.  Or some parameters are not used but slip through this
  verification. Please open an issue if you find above cases.




[I 2020-07-29 23:08:24,093] Trial 97 finished with value: 178.34816740261462 and parameters: {'max_depth': 5, 'lr_rate': 0.22520121499215937}. Best is trial 3 with value: 178.34816740261462.


Parameters: { lr_rate } might not be used.

  This may not be accurate due to some parameters are only used in language bindings but
  passed down to XGBoost core.  Or some parameters are not used but slip through this
  verification. Please open an issue if you find above cases.




[I 2020-07-29 23:08:24,254] Trial 98 finished with value: 178.34816740261462 and parameters: {'max_depth': 5, 'lr_rate': 0.2506397070987822}. Best is trial 3 with value: 178.34816740261462.


Parameters: { lr_rate } might not be used.

  This may not be accurate due to some parameters are only used in language bindings but
  passed down to XGBoost core.  Or some parameters are not used but slip through this
  verification. Please open an issue if you find above cases.




[I 2020-07-29 23:08:24,404] Trial 99 finished with value: 178.34816740261462 and parameters: {'max_depth': 5, 'lr_rate': 0.22954546376229876}. Best is trial 3 with value: 178.34816740261462.


FrozenTrial(number=3, value=178.34816740261462, datetime_start=datetime.datetime(2020, 7, 29, 23, 8, 9, 330798), datetime_complete=datetime.datetime(2020, 7, 29, 23, 8, 9, 471107), params={'max_depth': 5, 'lr_rate': 0.25383180265157096}, distributions={'max_depth': IntUniformDistribution(high=6, low=4, step=1), 'lr_rate': UniformDistribution(high=0.4, low=0.2)}, user_attrs={}, system_attrs={}, intermediate_values={}, trial_id=3, state=TrialState.COMPLETE)


In [49]:
test = pd.read_csv('airbnb_listing_validate.csv')

In [50]:
test.info()

<class 'pandas.core.frame.DataFrame'>
RangeIndex: 6451 entries, 0 to 6450
Data columns (total 15 columns):
 #   Column                          Non-Null Count  Dtype  
---  ------                          --------------  -----  
 0   id                              6451 non-null   int64  
 1   name                            6440 non-null   object 
 2   host_id                         6451 non-null   int64  
 3   host_name                       6448 non-null   object 
 4   neighbourhood_group             0 non-null      float64
 5   neighbourhood                   6451 non-null   object 
 6   latitude                        6451 non-null   float64
 7   longitude                       6451 non-null   float64
 8   room_type                       6451 non-null   object 
 9   minimum_nights                  6451 non-null   int64  
 10  number_of_reviews               6451 non-null   int64  
 11  last_review                     5655 non-null   object 
 12  reviews_per_month               56

In [51]:
test2 = test.drop(['name', 'host_id', 'host_name', 'neighbourhood_group', 'last_review'], axis = 1)

In [53]:
test3 = test2.copy()
test3.reviews_per_month.fillna(test3['reviews_per_month'].mean(), inplace=True)

In [54]:
test4 = pd.get_dummies(data = test3, columns = ['neighbourhood', 'room_type'])
test4.head()

Unnamed: 0,id,latitude,longitude,minimum_nights,number_of_reviews,reviews_per_month,calculated_host_listings_count,availability_365,neighbourhood_Bijlmer-Centrum,neighbourhood_Bijlmer-Oost,...,neighbourhood_Oud-Noord,neighbourhood_Oud-Oost,neighbourhood_Slotervaart,neighbourhood_Watergraafsmeer,neighbourhood_Westerpark,neighbourhood_Zuid,room_type_Entire home/apt,room_type_Hotel room,room_type_Private room,room_type_Shared room
0,12297872,52.37326,4.86213,2,49,0.99,1,267,0,0,...,0,0,0,0,0,0,1,0,0,0
1,3920205,52.35076,4.88866,3,34,0.49,38,0,0,0,...,0,0,0,0,0,0,1,0,0,0
2,26614345,52.3898,4.90881,4,3,0.13,1,0,0,0,...,1,0,0,0,0,0,1,0,0,0
3,7433172,52.34292,4.85962,4,0,0.737602,1,0,0,0,...,0,0,0,0,0,1,1,0,0,0
4,17019744,52.37321,4.87238,2,9,0.23,1,0,0,0,...,0,0,0,0,1,0,1,0,0,0


In [55]:
test_this = test4.drop(columns = ['id'])
indx_col = test4.id

In [110]:
rfr_predictions = rfr.predict(test_this)

In [111]:
res = pd.DataFrame(rfr_predictions) 
res.index = indx_col #indexing with id column
res.columns = ["price"]
res.to_csv("prediction_results_rfr_airbnb.csv")

In [58]:
dtr_predictions = dtr.predict(test_this)

In [59]:
res2 = pd.DataFrame(dtr_predictions) 
res2.index = indx_col #indexing with id column
res2.columns = ["price"]
res2.to_csv("prediction_results_dtr_airbnb.csv")

In [227]:
xgb_predictions = xgb_model.predict(test_this)

In [228]:
res3 = pd.DataFrame(xgb_predictions) 
res3.index = indx_col #indexing with id column
res3.columns = ["price"]
res3.to_csv("prediction_results_xgb_airbnb.csv")