In [1]:
import numpy as np
import pandas as pd
import matplotlib.pyplot as plt
import seaborn as sns
%matplotlib inline
pd.set_option('display.max_columns', 500)

In [2]:
# Read the train and test tables from CSV files in the working directory.
# The two reads are independent of each other.
train, test = (
    pd.read_csv(csv_path)
    for csv_path in ('./final_train.csv', './final_test.csv')
)

In [3]:
from sklearn.metrics import mean_squared_error
def rmse(y_true, y_pred):
    """Return the root-mean-squared error between targets and predictions.

    Parameters
    ----------
    y_true : array-like
        Reference values, forwarded unchanged to ``mean_squared_error``.
    y_pred : array-like
        Predicted values, forwarded unchanged to ``mean_squared_error``.

    Returns
    -------
    The square root (``np.sqrt``) of the mean squared error.
    """
    mse = mean_squared_error(y_true, y_pred)
    return np.sqrt(mse)

In [4]:
import xgboost as xgb



In [8]:
# Split the training table into target and predictors. 'Unnamed: 0' is removed
# along with the target so it is not used as a feature
# (presumably a saved row index -- TODO confirm).
prep_y = train['SalePrice']
prep_X = train.drop(labels=['Unnamed: 0', 'SalePrice'], axis=1)

In [9]:
# Apply the same column drop to the test table as was applied to the training
# table. With pandas' default errors='raise', this requires the test table to
# contain both 'Unnamed: 0' and 'SalePrice'.
prep_test = test.drop(labels=['Unnamed: 0', 'SalePrice'], axis=1)

In [10]:
# sklearn.cross_validation was deprecated in scikit-learn 0.18 and removed in
# 0.20; cross_val_score is provided by sklearn.model_selection (available since
# 0.18, the same release that introduced the 'neg_mean_squared_error' scorer
# used in this notebook).
from sklearn.model_selection import cross_val_score

In [62]:
def xgBoostCV(max_depth, gamma, reg_alpha, reg_lambda, min_child_weight):
    """Cross-validated score of an XGBoost regressor for one hyperparameter point.

    Used as the objective handed to ``BayesianOptimization``. The training data
    is read from the notebook-level ``prep_X`` / ``prep_y``.

    Parameters
    ----------
    max_depth : number
        Tree depth; converted with ``int()`` (fractional part discarded).
    gamma, reg_alpha, reg_lambda, min_child_weight : number
        Each converted with ``float()`` and forwarded to ``xgb.XGBRegressor``.

    Returns
    -------
    Mean over 4 folds of the 'neg_mean_squared_error' score, so values are
    <= 0 and larger (closer to zero) is better.
    """
    # Settings held constant across the whole search.
    fixed = dict(
        learning_rate=0.05,
        n_estimators=400,
        subsample=0.5,
        colsample_bytree=0.7,
    )
    # Settings proposed by the optimizer, coerced to the types XGBoost expects.
    searched = dict(
        max_depth=int(max_depth),
        gamma=float(gamma),
        reg_alpha=float(reg_alpha),
        reg_lambda=float(reg_lambda),
        min_child_weight=float(min_child_weight),
    )
    model = xgb.XGBRegressor(**fixed, **searched)

    fold_scores = cross_val_score(
        model,
        prep_X,
        prep_y,
        scoring='neg_mean_squared_error',
        cv=4,
        n_jobs=-1,
    )
    return fold_scores.mean()

In [63]:
# Search bounds, one (low, high) pair per argument of xgBoostCV.
# NOTE(review): the recorded optimisation log below contains max_depth values
# up to ~24.9, outside the (5, 15) range given here -- this cell appears to
# have been edited after the logged run.
baye_par = dict(
    max_depth=(5, 15),
    gamma=(0.1, 10),
    reg_alpha=(0.001, 1),
    reg_lambda=(0.001, 1),
    min_child_weight=(0.1, 40),
)

In [64]:
from bayes_opt import BayesianOptimization

In [65]:
# Optimizer that will maximise xgBoostCV over the box defined by baye_par.
xgbo = BayesianOptimization(f=xgBoostCV, pbounds=baye_par)

In [66]:
# Run the search; every evaluated point is printed in the table below.
# NOTE(review): the recorded log below runs through step 105, which does not
# match n_iter=20 -- the argument was presumably changed after the last run.
xgbo.maximize(n_iter=20)

[31mInitialization[0m
[94m---------------------------------------------------------------------------------------------------------[0m
 Step |   Time |      Value |     gamma |   max_depth |   min_child_weight |   reg_alpha |   reg_lambda | 
    1 | 00m05s | [35m  -0.04988[0m | [32m   6.2237[0m | [32m     9.2419[0m | [32m            1.4667[0m | [32m     0.4075[0m | [32m      0.7976[0m | 
    2 | 00m06s | [35m  -0.03900[0m | [32m   3.9188[0m | [32m    19.1540[0m | [32m            3.2317[0m | [32m     0.4145[0m | [32m      0.9156[0m | 
    3 | 00m04s | [35m  -0.02563[0m | [32m   1.3738[0m | [32m     9.2667[0m | [32m           20.1476[0m | [32m     0.6310[0m | [32m      0.8501[0m | 
    4 | 00m04s |   -0.04970 |    6.0954 |      8.4454 |            28.6072 |      0.4838 |       0.7796 | 
    5 | 00m03s |   -0.03966 |    3.8878 |      7.3910 |            37.1508 |      0.6159 |       0.2346 | 
[31mBayesian Optimization[0m
[94m---------------------



    9 | 00m16s | [35m  -0.01563[0m | [32m   0.1047[0m | [32m    24.9153[0m | [32m           35.2657[0m | [32m     0.0236[0m | [32m      0.6778[0m | 




   10 | 00m15s | [35m  -0.01479[0m | [32m   0.1332[0m | [32m     5.4777[0m | [32m            1.5470[0m | [32m     0.1260[0m | [32m      0.2618[0m | 




   11 | 00m15s |   -0.01572 |    0.1077 |      5.1459 |             0.7607 |      0.5065 |       0.5998 | 


  " state: %s" % convergence_dict)


   12 | 00m14s | [35m  -0.01460[0m | [32m   0.1228[0m | [32m     5.0368[0m | [32m            1.5482[0m | [32m     0.0612[0m | [32m      0.2162[0m | 




   13 | 00m17s |   -0.01482 |    0.1088 |     10.0625 |             0.1957 |      0.1068 |       0.4654 | 


  " state: %s" % convergence_dict)


   14 | 00m16s |   -0.01555 |    0.1571 |      8.2222 |             0.3635 |      0.2913 |       0.0059 | 


  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)


   15 | 00m18s | [35m  -0.01418[0m | [32m   0.1043[0m | [32m    24.1923[0m | [32m           15.5323[0m | [32m     0.0305[0m | [32m      0.4902[0m | 




   16 | 00m20s |   -0.01526 |    0.1534 |     24.3075 |             5.8248 |      0.0269 |       0.0495 | 


  " state: %s" % convergence_dict)


   17 | 00m17s |   -0.01465 |    0.1138 |     10.4046 |             5.2087 |      0.1100 |       0.6508 | 


  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)


   18 | 00m16s |   -0.01447 |    0.1056 |      6.2956 |             3.8098 |      0.0773 |       0.6746 | 




   19 | 00m20s |   -0.01491 |    0.1000 |      9.4832 |             2.1563 |      0.0010 |       0.0010 | 




   20 | 00m17s |   -0.01552 |    0.1038 |     15.2175 |            36.8758 |      0.0357 |       0.8992 | 


  " state: %s" % convergence_dict)


   21 | 00m22s |   -0.01498 |    0.1143 |     24.1505 |             0.5913 |      0.1321 |       0.7415 | 




   22 | 00m20s |   -0.01564 |    0.1735 |     23.9471 |            10.0262 |      0.1537 |       0.9904 | 


  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)


   23 | 00m19s | [35m  -0.01417[0m | [32m   0.1033[0m | [32m    15.6892[0m | [32m           13.5356[0m | [32m     0.0031[0m | [32m      0.9385[0m | 


  " state: %s" % convergence_dict)


   24 | 00m16s |   -0.01628 |    0.1262 |     18.9402 |            39.7499 |      0.1900 |       0.9668 | 


  " state: %s" % convergence_dict)


   25 | 00m15s |   -0.01594 |    0.1274 |      6.5083 |            36.7535 |      0.0645 |       0.8298 | 


  " state: %s" % convergence_dict)


   26 | 00m17s |   -0.01570 |    0.1739 |     22.1054 |            24.0680 |      0.0369 |       0.9733 | 


  " state: %s" % convergence_dict)


   27 | 00m17s |   -0.01502 |    0.1125 |     24.8582 |            19.4828 |      0.1124 |       0.6947 | 


  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)


   28 | 00m15s |   -0.01548 |    0.1095 |      5.9500 |            29.5188 |      0.0400 |       0.4524 | 




   29 | 00m17s |   -0.01475 |    0.1255 |      7.7694 |            11.0978 |      0.0726 |       0.6919 | 


  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)


   30 | 00m18s |   -0.01455 |    0.1000 |      8.4076 |             0.2878 |      0.0010 |       1.0000 | 


  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)


   31 | 00m20s |   -0.01513 |    0.1151 |     18.9777 |             0.3434 |      0.2730 |       0.2359 | 


  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)


   32 | 00m18s |   -0.01470 |    0.1123 |     16.6430 |             9.3850 |      0.1992 |       0.1042 | 


  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)


   33 | 00m18s |   -0.01469 |    0.1217 |     11.5502 |             8.4968 |      0.0026 |       0.7573 | 


  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)


   34 | 00m17s |   -0.01474 |    0.1163 |     20.5062 |            17.9019 |      0.0645 |       0.9410 | 




   35 | 00m17s |   -0.01599 |    0.1521 |     12.3615 |            28.5102 |      0.0111 |       0.9407 | 


  " state: %s" % convergence_dict)


   36 | 00m19s |   -0.01608 |    0.1001 |     23.9297 |             3.1550 |      0.9968 |       0.0509 | 


  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)


   37 | 00m16s |   -0.01556 |    0.1617 |      5.2838 |            18.5936 |      0.0395 |       0.1853 | 


  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)


   38 | 00m17s |   -0.01445 |    0.1004 |     23.2432 |            13.3691 |      0.2996 |       0.0570 | 




   39 | 00m16s |   -0.01488 |    0.1191 |      5.0165 |            18.4637 |      0.0035 |       0.8035 | 


  " state: %s" % convergence_dict)


   40 | 00m16s |   -0.01440 |    0.1212 |      5.2671 |             8.4020 |      0.0240 |       0.9571 | 


  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)


   41 | 00m18s |   -0.01433 |    0.1096 |     21.1532 |            13.4588 |      0.0826 |       0.3299 | 


  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)


   42 | 00m17s |   -0.01633 |    0.1323 |     24.1804 |            39.7726 |      0.0452 |       0.6845 | 


  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)


   43 | 00m16s |   -0.01692 |    0.1864 |      5.0012 |            39.9764 |      0.0293 |       0.3818 | 


  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)


   44 | 00m20s |   -0.01508 |    0.1142 |     14.4965 |             2.1093 |      0.2114 |       0.9948 | 


  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)


   45 | 00m19s |   -0.01465 |    0.1144 |     21.8320 |            15.4301 |      0.0637 |       0.1470 | 


  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)


   46 | 00m21s |   -0.01461 |    0.1035 |     18.2095 |             6.6520 |      0.0075 |       0.6514 | 


  " state: %s" % convergence_dict)


   47 | 00m20s |   -0.01444 |    0.1080 |     23.2475 |            11.2439 |      0.0448 |       0.1529 | 




   48 | 00m16s |   -0.01598 |    0.1517 |     20.8590 |            33.1533 |      0.0489 |       0.8800 | 




   49 | 00m19s |   -0.01439 |    0.1004 |     16.0097 |            13.3889 |      0.0606 |       0.8278 | 


  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)


   50 | 00m20s |   -0.01449 |    0.1211 |     20.6026 |            13.7079 |      0.0527 |       0.9181 | 


  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)


   51 | 00m21s |   -0.01529 |    0.1628 |     15.5381 |            18.2864 |      0.0569 |       0.9577 | 


  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)


   52 | 00m20s |   -0.01471 |    0.1132 |     24.2280 |            14.0558 |      0.2327 |       0.9753 | 


  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)


   53 | 00m20s |   -0.01454 |    0.1084 |     19.9182 |            10.2892 |      0.0264 |       0.1725 | 


  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)


   54 | 00m20s |   -0.01452 |    0.1154 |     19.7518 |            12.6582 |      0.0125 |       0.7864 | 


  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)


   55 | 00m20s |   -0.01465 |    0.1229 |     12.1469 |            14.5788 |      0.0186 |       0.5749 | 


  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)


   56 | 00m18s |   -0.01615 |    0.1126 |     10.7342 |            39.9921 |      0.1578 |       0.4333 | 


  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)


   57 | 00m20s |   -0.01477 |    0.1130 |     20.3784 |            10.5630 |      0.2055 |       0.3239 | 




   58 | 00m22s |   -0.01553 |    0.1599 |     23.8727 |            13.6491 |      0.2703 |       0.3988 | 


  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)


   59 | 00m22s |   -0.01712 |    0.1092 |      8.5156 |            34.8287 |      0.9828 |       0.0913 | 
   60 | 00m18s |   -0.01619 |    0.1356 |      5.1478 |            24.5931 |      0.6400 |       0.8110 | 
   61 | 00m18s |   -0.01499 |    0.1182 |     11.3192 |            21.6797 |      0.0687 |       0.9844 | 


  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)


   62 | 00m20s |   -0.01576 |    0.1029 |     24.2158 |            30.2784 |      0.3310 |       0.0461 | 


  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)


   63 | 00m17s |   -0.01572 |    0.1045 |      5.9663 |            15.0291 |      0.7935 |       0.9552 | 


  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)


   64 | 00m29s |   -0.01485 |    0.1232 |     21.8156 |             1.6051 |      0.0494 |       0.7185 | 


  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)


   65 | 00m24s |   -0.01517 |    0.1041 |     17.3018 |            23.2513 |      0.1118 |       0.1781 | 


  " state: %s" % convergence_dict)


   66 | 00m28s |   -0.01652 |    0.1087 |     18.1025 |            27.2081 |      0.7740 |       0.9004 | 




   67 | 00m24s |   -0.01445 |    0.1000 |     21.3793 |            17.2573 |      0.1082 |       1.0000 | 


  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)


   68 | 00m23s |   -0.01454 |    0.1077 |      6.0590 |            11.4940 |      0.0600 |       0.6826 | 


  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)


   69 | 00m26s |   -0.01499 |    0.1317 |     22.6306 |             3.8260 |      0.1308 |       0.8404 | 


  " state: %s" % convergence_dict)


   70 | 00m28s |   -0.01456 |    0.1144 |     19.2780 |             3.5160 |      0.0052 |       0.9908 | 


  " state: %s" % convergence_dict)


   71 | 00m22s |   -0.01532 |    0.1078 |      7.0760 |            21.9854 |      0.0046 |       0.5254 | 




   72 | 00m26s |   -0.01467 |    0.1381 |     20.3244 |             5.9258 |      0.0233 |       0.7807 | 


  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)


   73 | 00m23s |   -0.01762 |    0.1299 |      5.5635 |            39.2355 |      0.8963 |       0.9278 | 


  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)


   74 | 00m26s |   -0.01436 |    0.1138 |     20.8185 |            11.8269 |      0.0121 |       0.1045 | 


  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)


   75 | 00m24s |   -0.01452 |    0.1021 |     10.8682 |             6.0984 |      0.0341 |       0.8196 | 


  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)


   76 | 00m25s |   -0.01446 |    0.1018 |      9.3908 |             6.5868 |      0.0954 |       0.9487 | 




   77 | 00m24s |   -0.01578 |    0.1054 |     10.2641 |            35.9026 |      0.0292 |       0.7328 | 
   78 | 00m27s |   -0.01473 |    0.1332 |     21.2843 |             5.5116 |      0.1131 |       0.4149 | 


  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)


   79 | 00m23s |   -0.01448 |    0.1140 |      7.3261 |             3.1165 |      0.1525 |       0.8313 | 


  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)


   80 | 00m24s |   -0.01508 |    0.1021 |     20.4661 |            22.2418 |      0.0578 |       0.5592 | 


  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)


   81 | 00m24s |   -0.01476 |    0.1002 |     17.3358 |             8.5673 |      0.3363 |       0.9521 | 


  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)


   82 | 00m29s |   -0.01526 |    0.1065 |     11.5951 |            12.0989 |      0.5254 |       0.6686 | 


  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)


   83 | 00m25s |   -0.01458 |    0.1167 |      9.1352 |            13.3415 |      0.0794 |       0.8425 | 


  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)


   84 | 00m26s |   -0.01500 |    0.1251 |      9.6766 |             3.4716 |      0.2033 |       0.8010 | 


  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)


   85 | 00m26s |   -0.01438 |    0.1160 |     21.9791 |            13.4262 |      0.1015 |       0.2972 | 


  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)


   86 | 00m25s |   -0.01490 |    0.1485 |      9.0889 |             4.3529 |      0.0391 |       0.8111 | 


  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)


   87 | 00m29s |   -0.01507 |    0.1096 |     12.6988 |             0.1460 |      0.0380 |       0.9835 | 


  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)


   88 | 00m32s |   -0.01458 |    0.1061 |     13.6735 |             6.0741 |      0.0636 |       0.0704 | 


  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)


   89 | 00m29s |   -0.01443 |    0.1017 |     10.3745 |             4.7903 |      0.0246 |       0.6651 | 


  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)


   90 | 00m26s |   -0.01520 |    0.1234 |     20.0824 |             6.6994 |      0.3241 |       0.0504 | 


  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)


   91 | 00m29s |   -0.01455 |    0.1067 |     22.3004 |            10.0062 |      0.0029 |       0.1963 | 




   92 | 00m32s |   -0.01463 |    0.1058 |     22.7642 |            10.5902 |      0.1902 |       0.8947 | 


  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)


   93 | 00m27s |   -0.01454 |    0.1240 |      6.9281 |            16.8218 |      0.0223 |       0.9999 | 


  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)


   94 | 00m26s |   -0.01428 |    0.1120 |      5.3113 |            11.0042 |      0.0550 |       0.8690 | 




   95 | 00m30s |   -0.01465 |    0.1083 |     15.4728 |            10.9182 |      0.0174 |       0.6217 | 




   96 | 00m34s |   -0.01510 |    0.1141 |     19.1409 |            12.0366 |      0.2706 |       0.7612 | 


  " state: %s" % convergence_dict)


   97 | 00m28s |   -0.01493 |    0.1007 |     24.8217 |            10.5765 |      0.3644 |       0.6775 | 


  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)


   98 | 00m30s |   -0.01478 |    0.1099 |      9.3576 |             8.4503 |      0.2115 |       0.4197 | 




   99 | 00m30s |   -0.01480 |    0.1059 |      9.5954 |            11.2917 |      0.2315 |       0.7130 | 


  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)


  100 | 00m31s |   -0.01453 |    0.1259 |     14.3794 |             3.4028 |      0.1419 |       0.1936 | 




  101 | 00m33s |   -0.01490 |    0.1228 |     10.5174 |            19.3270 |      0.0363 |       0.7927 | 


  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)


  102 | 00m29s |   -0.01476 |    0.1035 |     21.2173 |            14.6602 |      0.1934 |       0.2108 | 




  103 | 00m29s |   -0.01565 |    0.1372 |      5.4434 |            14.5352 |      0.3490 |       0.4144 | 


  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)


  104 | 00m30s |   -0.01444 |    0.1112 |      9.8806 |            18.8312 |      0.1105 |       0.2050 | 


  " state: %s" % convergence_dict)


  105 | 00m28s |   -0.01451 |    0.1070 |      7.0888 |             8.7062 |      0.0636 |       0.9782 | 


In [70]:
# Display the hyperparameters of the best-scoring point found by the optimizer.
xgbo.res['max']['max_params']

{'gamma': 0.1032848197606477,
 'max_depth': 15.689162485552721,
 'min_child_weight': 13.535592976846267,
 'reg_alpha': 0.0031451110228144256,
 'reg_lambda': 0.9385264559396721}

In [68]:
# Refit on the full training set at the optimizer's best point.
# learning_rate / n_estimators here (0.01 / 10000) differ from the values used
# inside xgBoostCV while searching (0.05 / 400).
new_regr = xgb.XGBRegressor(
    # -- taken from the Bayesian optimisation result --
    max_depth=int(xgbo.res['max']['max_params']['max_depth']),  # fractional part discarded
    gamma=xgbo.res['max']['max_params']['gamma'],
    min_child_weight=xgbo.res['max']['max_params']['min_child_weight'],
    reg_alpha=xgbo.res['max']['max_params']['reg_alpha'],
    reg_lambda=xgbo.res['max']['max_params']['reg_lambda'],
    # -- fixed settings --
    learning_rate=0.01,
    n_estimators=10000,
    subsample=.5,
    colsample_bytree=.7,
    seed=1313,
    silent=False,
)

new_regr.fit(prep_X, prep_y)

XGBRegressor(base_score=0.5, colsample_bylevel=1, colsample_bytree=0.7,
       gamma=0.1032848197606477, learning_rate=0.01, max_delta_step=0,
       max_depth=15, min_child_weight=13.535592976846267, missing=None,
       n_estimators=10000, nthread=-1, objective='reg:linear',
       reg_alpha=0.0031451110228144256, reg_lambda=0.9385264559396721,
       scale_pos_weight=1, seed=1313, silent=False, subsample=0.5)

In [69]:
# In-sample check: predictions are made on the same rows the model was fit on,
# so this is a training error, not a validation error.
y_pred = new_regr.predict(prep_X)

print("RMSE on training set: ", rmse(y_true=prep_y, y_pred=y_pred))

RMSE on training set:  0.0774962893007


In [81]:
# Scratch check: the best max_depth truncated to int and wrapped in a list,
# i.e. the form a parameter-grid entry takes.
[int(xgbo.res['max']['max_params']['max_depth'])]

[15]

In [94]:
# Grid for a follow-up search around the Bayesian optimum: only reg_alpha and
# reg_lambda vary (20 values each, 400 combinations); every other entry is a
# single fixed value.
parameters = {
    # Derived from the optimizer result (truncated to int, exactly as when
    # new_regr is built) instead of a hard-coded copy, so it stays in sync with
    # gamma / min_child_weight below when the search is re-run.
    'max_depth': [int(xgbo.res['max']['max_params']['max_depth'])],
    'learning_rate': [.01],
    'n_estimators': [400],
    'gamma': [xgbo.res['max']['max_params']['gamma']],
    'reg_alpha': np.linspace(start=0, stop=0.1, num=20),
    'reg_lambda': np.linspace(start=0.9, stop=.999, num=20),
    'subsample': [.5],
    'colsample_bytree': [.7],
    'min_child_weight': [xgbo.res['max']['max_params']['min_child_weight']]
    }

In [95]:
# sklearn.grid_search was deprecated in scikit-learn 0.18 and removed in 0.20;
# GridSearchCV is provided by sklearn.model_selection.
from sklearn.model_selection import GridSearchCV

In [96]:
# Exhaustive 3-fold search over the `parameters` grid, using new_regr as the
# base estimator and negative MSE as the score (larger is better).
tuning = GridSearchCV(
    estimator=new_regr,
    param_grid=parameters,
    scoring='neg_mean_squared_error',
    cv=3,
    n_jobs=-1,
    verbose=1,
)
tuning.fit(prep_X, prep_y)
# Last expression of the cell: show the winning parameter combination.
tuning.best_params_

Fitting 3 folds for each of 400 candidates, totalling 1200 fits


[Parallel(n_jobs=-1)]: Done  42 tasks      | elapsed:   39.7s
[Parallel(n_jobs=-1)]: Done 192 tasks      | elapsed:  3.0min
[Parallel(n_jobs=-1)]: Done 442 tasks      | elapsed:  6.8min
[Parallel(n_jobs=-1)]: Done 792 tasks      | elapsed: 13.0min
[Parallel(n_jobs=-1)]: Done 1200 out of 1200 | elapsed: 19.8min finished


{'colsample_bytree': 0.7,
 'gamma': 0.1032848197606477,
 'learning_rate': 0.01,
 'max_depth': 15,
 'min_child_weight': 13.535592976846267,
 'n_estimators': 400,
 'reg_alpha': 0.0,
 'reg_lambda': 0.90000000000000002,
 'subsample': 0.5}

In [97]:
# Final model: tree parameters from the Bayesian optimisation plus the
# regularisation terms selected by the grid search, refit on all training rows.
# NOTE(review): the recorded repr below shows n_estimators=10000, not 1000 --
# this cell appears to have been edited after its last run.
new_regr = xgb.XGBRegressor(
                 colsample_bytree=.7,
                 gamma=xgbo.res['max']['max_params']['gamma'],
                 learning_rate=0.01,
                 max_depth=int(xgbo.res['max']['max_params']['max_depth']),
                 min_child_weight=xgbo.res['max']['max_params']['min_child_weight'],
                 n_estimators=1000,
                 # Read from the fitted grid search rather than hard-coded copies
                 # of its output (0 / 0.9), so the values cannot go stale when
                 # the searches are re-run.
                 reg_alpha=tuning.best_params_['reg_alpha'],
                 reg_lambda=tuning.best_params_['reg_lambda'],
                 subsample=.5,
                 seed=1313,
                 silent=False)

new_regr.fit(prep_X, prep_y)

XGBRegressor(base_score=0.5, colsample_bylevel=1, colsample_bytree=0.7,
       gamma=0.1032848197606477, learning_rate=0.01, max_delta_step=0,
       max_depth=15, min_child_weight=13.535592976846267, missing=None,
       n_estimators=10000, nthread=-1, objective='reg:linear', reg_alpha=0,
       reg_lambda=0.9, scale_pos_weight=1, seed=1313, silent=False,
       subsample=0.5)

In [98]:
# In-sample check for the refit model: predictions are made on the same rows
# it was trained on, so this is a training error, not a validation error.
y_pred = new_regr.predict(prep_X)

print("RMSE on training set: ", rmse(y_true=prep_y, y_pred=y_pred))

RMSE on training set:  0.0774970096088


In [99]:
# Predict on the prepared test features with the refit model.
test_pred = new_regr.predict(prep_test)

In [100]:
# Row identifiers for the output file. The CSV is read without a header row and
# its two columns are named here.
ids = pd.read_csv('./test_id.csv', header=None)
ids.columns = ['num', 'Id']

# Back-transform the predictions with exp (presumably the model was fit on
# log(SalePrice) -- TODO confirm), round to 3 decimals and label the column.
results = np.exp(pd.DataFrame(test_pred)).round(3)
results.columns = ['SalePrice']

# Use the Id column as the index.
# NOTE(review): assumes ids has one row per prediction, in the same order.
results = results.set_index(ids.Id)

In [101]:
# Write the predictions to CSV in the working directory; the frame's index is
# written as the first column (pandas default index=True).
results.to_csv('new_bayes2.csv')