# Setup

Make sure this notebook works well in both python 2 and 3, import a few common modules, ensure MatplotLib plots figures inline

In [2]:
# To support both python 2 and python 3
from __future__ import division, print_function, unicode_literals

# Common imports
import numpy as np
import os

# to make this notebook's output stable across runs
np.random.seed(42)

# To plot pretty figures
%matplotlib inline
%config InlineBackend.figure_format = 'retina' # for retina screens
import matplotlib
import matplotlib.pyplot as plt
plt.rcParams['axes.labelsize'] = 14
plt.rcParams['xtick.labelsize'] = 12
plt.rcParams['ytick.labelsize'] = 12

Configure notebook to display all results in cell

In [3]:
from IPython.core.interactiveshell import InteractiveShell
InteractiveShell.ast_node_interactivity = "all"

# Revert to the last line of output only
# InteractiveShell.ast_node_interactivity = "last_expr"

# Load Data

In [4]:
import pandas as pd

houses_train = pd.read_csv('../Data/encoded.houses.train.csv')
houses_test = pd.read_csv('../Data/encoded.houses.test.csv')

In [5]:
print("houses_train dimensions: {}".format(houses_train.shape))
print("houses_test dimensions: {}".format(houses_test.shape))

houses_train dimensions: (1460, 328)
houses_test dimensions: (1459, 328)


In [6]:
pd.set_option("display.max_columns", 328)
houses_train.head(3)

Unnamed: 0.1,Unnamed: 0,MSSubClass_lev_x.120,MSSubClass_lev_x.160,MSSubClass_lev_x.180,MSSubClass_lev_x.190,MSSubClass_lev_x.20,MSSubClass_lev_x.30,MSSubClass_lev_x.40,MSSubClass_lev_x.45,MSSubClass_lev_x.50,MSSubClass_lev_x.60,MSSubClass_lev_x.70,MSSubClass_lev_x.75,MSSubClass_lev_x.80,MSSubClass_lev_x.85,MSSubClass_lev_x.90,MSZoning_lev_x.C..all.,MSZoning_lev_x.FV,MSZoning_lev_x.RH,MSZoning_lev_x.RL,MSZoning_lev_x.RM,LotFrontage_clean,LotArea_clean,Street_lev_x.Grvl,Street_lev_x.Pave,Alley_lev_x.Grvl,Alley_lev_x.NA,Alley_lev_x.Pave,LotShape_lev_x.IR1,LotShape_lev_x.IR2,LotShape_lev_x.IR3,LotShape_lev_x.Reg,LandContour_lev_x.Bnk,LandContour_lev_x.HLS,LandContour_lev_x.Low,LandContour_lev_x.Lvl,Utilities_lev_x.AllPub,Utilities_lev_x.NoSeWa,LotConfig_lev_x.Corner,LotConfig_lev_x.CulDSac,LotConfig_lev_x.FR2,LotConfig_lev_x.FR3,LotConfig_lev_x.Inside,LandSlope_lev_x.Gtl,LandSlope_lev_x.Mod,LandSlope_lev_x.Sev,Neighborhood_lev_x.Blmngtn,Neighborhood_lev_x.Blueste,Neighborhood_lev_x.BrDale,Neighborhood_lev_x.BrkSide,Neighborhood_lev_x.ClearCr,Neighborhood_lev_x.CollgCr,Neighborhood_lev_x.Crawfor,Neighborhood_lev_x.Edwards,Neighborhood_lev_x.Gilbert,Neighborhood_lev_x.IDOTRR,Neighborhood_lev_x.MeadowV,Neighborhood_lev_x.Mitchel,Neighborhood_lev_x.NAmes,Neighborhood_lev_x.NoRidge,Neighborhood_lev_x.NPkVill,Neighborhood_lev_x.NridgHt,Neighborhood_lev_x.NWAmes,Neighborhood_lev_x.OldTown,Neighborhood_lev_x.Sawyer,Neighborhood_lev_x.SawyerW,Neighborhood_lev_x.Somerst,Neighborhood_lev_x.StoneBr,Neighborhood_lev_x.SWISU,Neighborhood_lev_x.Timber,Neighborhood_lev_x.Veenker,Condition1_lev_x.Artery,Condition1_lev_x.Feedr,Condition1_lev_x.Norm,Condition1_lev_x.PosA,Condition1_lev_x.PosN,Condition1_lev_x.RRAe,Condition1_lev_x.RRAn,Condition1_lev_x.RRNe,Condition1_lev_x.RRNn,Condition2_lev_x.Artery,Condition2_lev_x.Feedr,Condition2_lev_x.Norm,Condition2_lev_x.PosA,Condition2_lev_x.PosN,Condition2_lev_x.RRAe,Condition2_lev_x.RRAn,Condition2_lev_x.RRNn,BldgType_lev_x.1Fam,BldgType_lev_x.2fmCon,BldgType_lev_x.Duplex,BldgType_lev_x.Twnhs,BldgType_lev_x.TwnhsE,HouseStyle_lev_x.1.5Fin,HouseStyle_lev_x.1.5Unf,HouseStyle_lev_x.1Story,HouseStyle_lev_x.2.5Fin,HouseStyle_lev_x.2.5Unf,HouseStyle_lev_x.2Story,HouseStyle_lev_x.SFoyer,HouseStyle_lev_x.SLvl,OverallQual_lev_x.1,OverallQual_lev_x.10,OverallQual_lev_x.2,OverallQual_lev_x.3,OverallQual_lev_x.4,OverallQual_lev_x.5,OverallQual_lev_x.6,OverallQual_lev_x.7,OverallQual_lev_x.8,OverallQual_lev_x.9,OverallCond_lev_x.1,OverallCond_lev_x.2,OverallCond_lev_x.3,OverallCond_lev_x.4,OverallCond_lev_x.5,OverallCond_lev_x.6,OverallCond_lev_x.7,OverallCond_lev_x.8,OverallCond_lev_x.9,YearBuilt_clean,YearRemodAdd_clean,RoofStyle_lev_x.Flat,RoofStyle_lev_x.Gable,RoofStyle_lev_x.Gambrel,RoofStyle_lev_x.Hip,RoofStyle_lev_x.Mansard,RoofStyle_lev_x.Shed,RoofMatl_lev_x.ClyTile,RoofMatl_lev_x.CompShg,RoofMatl_lev_x.Membran,RoofMatl_lev_x.Metal,RoofMatl_lev_x.Roll,RoofMatl_lev_x.Tar.Grv,RoofMatl_lev_x.WdShake,RoofMatl_lev_x.WdShngl,Exterior1st_lev_x.AsbShng,Exterior1st_lev_x.AsphShn,Exterior1st_lev_x.BrkComm,Exterior1st_lev_x.BrkFace,Exterior1st_lev_x.CBlock,Exterior1st_lev_x.CemntBd,Exterior1st_lev_x.HdBoard,Exterior1st_lev_x.ImStucc,Exterior1st_lev_x.MetalSd,Exterior1st_lev_x.Plywood,Exterior1st_lev_x.Stone,Exterior1st_lev_x.Stucco,Exterior1st_lev_x.VinylSd,Exterior1st_lev_x.Wd.Sdng,Exterior1st_lev_x.WdShing,Exterior2nd_lev_x.AsbShng,Exterior2nd_lev_x.AsphShn,Exterior2nd_lev_x.Brk.Cmn,Exterior2nd_lev_x.BrkFace,Exterior2nd_lev_x.CBlock,Exterior2nd_lev_x.CmentBd,Exterior2nd_lev_x.HdBoard,Exterior2nd_lev_x.ImStucc,Exterior2nd_lev_x.MetalSd,Exterior2nd_lev_x.Other,Exterior2nd_lev_x.Plywood,Exterior2nd_lev_x.Stone,Exterior2nd_lev_x.Stucco,Exterior2nd_lev_x.VinylSd,Exterior2nd_lev_x.Wd.Sdng,Exterior2nd_lev_x.Wd.Shng,MasVnrType_lev_x.BrkCmn,MasVnrType_lev_x.BrkFace,MasVnrType_lev_x.None,MasVnrType_lev_x.Stone,MasVnrArea_clean,ExterQual_lev_x.Ex,ExterQual_lev_x.Fa,ExterQual_lev_x.Gd,ExterQual_lev_x.TA,ExterCond_lev_x.Ex,ExterCond_lev_x.Fa,ExterCond_lev_x.Gd,ExterCond_lev_x.Po,ExterCond_lev_x.TA,Foundation_lev_x.BrkTil,Foundation_lev_x.CBlock,Foundation_lev_x.PConc,Foundation_lev_x.Slab,Foundation_lev_x.Stone,Foundation_lev_x.Wood,BsmtQual_lev_x.Ex,BsmtQual_lev_x.Fa,BsmtQual_lev_x.Gd,BsmtQual_lev_x.NA,BsmtQual_lev_x.TA,BsmtCond_lev_x.Fa,BsmtCond_lev_x.Gd,BsmtCond_lev_x.NA,BsmtCond_lev_x.Po,BsmtCond_lev_x.TA,BsmtExposure_lev_x.Av,BsmtExposure_lev_x.Gd,BsmtExposure_lev_x.Mn,BsmtExposure_lev_x.NA,BsmtExposure_lev_x.No,BsmtFinType1_lev_x.ALQ,BsmtFinType1_lev_x.BLQ,BsmtFinType1_lev_x.GLQ,BsmtFinType1_lev_x.LwQ,BsmtFinType1_lev_x.NA,BsmtFinType1_lev_x.Rec,BsmtFinType1_lev_x.Unf,BsmtFinSF1_clean,BsmtFinType2_lev_x.ALQ,BsmtFinType2_lev_x.BLQ,BsmtFinType2_lev_x.GLQ,BsmtFinType2_lev_x.LwQ,BsmtFinType2_lev_x.NA,BsmtFinType2_lev_x.Rec,BsmtFinType2_lev_x.Unf,BsmtFinSF2_clean,BsmtUnfSF_clean,TotalBsmtSF_clean,Heating_lev_x.Floor,Heating_lev_x.GasA,Heating_lev_x.GasW,Heating_lev_x.Grav,Heating_lev_x.OthW,Heating_lev_x.Wall,HeatingQC_lev_x.Ex,HeatingQC_lev_x.Fa,HeatingQC_lev_x.Gd,HeatingQC_lev_x.Po,HeatingQC_lev_x.TA,CentralAir_lev_x.N,CentralAir_lev_x.Y,X2ndFlrSF_clean,LowQualFinSF_clean,GrLivArea_clean,BsmtFullBath_clean,BsmtHalfBath_clean,FullBath_clean,HalfBath_clean,BedroomAbvGr_clean,KitchenAbvGr_clean,KitchenQual_lev_x.Ex,KitchenQual_lev_x.Fa,KitchenQual_lev_x.Gd,KitchenQual_lev_x.TA,TotRmsAbvGrd_clean,Functional_lev_x.Maj1,Functional_lev_x.Maj2,Functional_lev_x.Min1,Functional_lev_x.Min2,Functional_lev_x.Mod,Functional_lev_x.Sev,Functional_lev_x.Typ,Fireplaces_clean,FireplaceQu_lev_x.Ex,FireplaceQu_lev_x.Fa,FireplaceQu_lev_x.Gd,FireplaceQu_lev_x.NA,FireplaceQu_lev_x.Po,FireplaceQu_lev_x.TA,GarageType_lev_x.2Types,GarageType_lev_x.Attchd,GarageType_lev_x.Basment,GarageType_lev_x.BuiltIn,GarageType_lev_x.CarPort,GarageType_lev_x.Detchd,GarageType_lev_x.NA,GarageYrBlt_clean,GarageFinish_lev_x.Fin,GarageFinish_lev_x.NA,GarageFinish_lev_x.RFn,GarageFinish_lev_x.Unf,GarageCars_clean,GarageArea_clean,GarageQual_lev_x.Ex,GarageQual_lev_x.Fa,GarageQual_lev_x.Gd,GarageQual_lev_x.NA,GarageQual_lev_x.Po,GarageQual_lev_x.TA,GarageCond_lev_x.Ex,GarageCond_lev_x.Fa,GarageCond_lev_x.Gd,GarageCond_lev_x.NA,GarageCond_lev_x.Po,GarageCond_lev_x.TA,PavedDrive_lev_x.N,PavedDrive_lev_x.P,PavedDrive_lev_x.Y,WoodDeckSF_clean,OpenPorchSF_clean,X3SsnPorch_clean,ScreenPorch_clean,PoolArea_clean,PoolQC_lev_x.Ex,PoolQC_lev_x.Fa,PoolQC_lev_x.Gd,PoolQC_lev_x.NA,Fence_lev_x.GdPrv,Fence_lev_x.GdWo,Fence_lev_x.MnPrv,Fence_lev_x.MnWw,Fence_lev_x.NA,MiscFeature_lev_x.Gar2,MiscFeature_lev_x.NA,MiscFeature_lev_x.Othr,MiscFeature_lev_x.Shed,MiscFeature_lev_x.TenC,MiscVal_clean,MoSold_clean,YrSold_clean,SaleType_lev_x.COD,SaleType_lev_x.Con,SaleType_lev_x.ConLD,SaleType_lev_x.ConLI,SaleType_lev_x.ConLw,SaleType_lev_x.CWD,SaleType_lev_x.New,SaleType_lev_x.Oth,SaleType_lev_x.WD,SaleCondition_lev_x.Abnorml,SaleCondition_lev_x.AdjLand,SaleCondition_lev_x.Alloca,SaleCondition_lev_x.Family,SaleCondition_lev_x.Normal,SaleCondition_lev_x.Partial,SalePrice
0,1,-0.251638,-0.212287,-0.083017,-0.144792,-0.761373,-0.222645,-0.052396,-0.091003,-0.330677,1.969844,-0.206949,-0.105227,-0.203325,-0.117811,-0.192111,-0.083017,-0.215785,-0.105227,0.517956,-0.418812,-0.24015,-0.207071,-0.064216,0.064216,-0.188246,0.257733,-0.169923,-0.703962,-0.169923,-0.083017,0.760251,-0.212287,-0.188246,-0.158945,0.33701,0.026171,-0.026171,-0.468578,-0.262234,-0.182318,-0.052396,0.622549,0.23749,-0.215785,-0.094752,-0.108503,-0.037024,-0.105227,-0.203325,-0.139784,2.954209,-0.190187,-0.27107,-0.239094,-0.161194,-0.108503,-0.186288,-0.426687,-0.169923,-0.07873,-0.235877,-0.229337,-0.289539,-0.230986,-0.205144,-0.250096,-0.131946,-0.131946,-0.163415,-0.087099,-0.184312,-0.242277,0.398273,-0.074202,-0.114788,-0.087099,-0.134606,-0.037024,-0.058601,-0.037024,-0.064216,0.10185,-0.026171,-0.037024,-0.026171,-0.026171,-0.037024,0.443381,-0.147237,-0.192111,-0.174141,-0.290925,-0.343273,-0.098363,-0.994195,-0.074202,-0.087099,1.509747,-0.161194,-0.215785,-0.037024,-0.111688,-0.045361,-0.117811,-0.293684,-0.610914,-0.586641,1.890596,-0.360475,-0.174141,-0.026171,-0.058601,-0.131946,-0.201493,0.881922,-0.456581,-0.404023,-0.227679,-0.123647,1.050634,0.878367,-0.094752,0.528571,-0.087099,-0.493401,-0.069385,-0.037024,-0.026171,0.134606,-0.026171,-0.026171,-0.026171,-0.087099,-0.058601,-0.064216,-0.117811,-0.026171,-0.037024,-0.188246,-0.026171,-0.208741,-0.423319,-0.026171,-0.421067,-0.282537,-0.037024,-0.131946,1.35414,-0.405169,-0.134606,-0.117811,-0.045361,-0.069385,-0.131946,-0.026171,-0.206949,-0.406313,-0.083017,-0.414285,-0.026171,-0.328124,-0.058601,-0.134606,1.376781,-0.394805,-0.163415,-0.10185,1.509747,-1.217365,-0.309888,0.513928,-0.192111,-0.098363,1.410829,-1.278381,-0.045361,-0.139784,-0.333219,-0.026171,0.372492,-0.333219,-0.875802,1.120584,-0.129235,-0.064216,-0.045361,-0.300506,-0.156667,1.166845,-0.161194,-0.894259,-0.17827,-0.215785,-0.161194,-0.037024,0.33701,-0.422194,-0.317784,-0.290925,-0.163415,0.729136,-0.421067,-0.335749,1.578327,-0.230986,-0.161194,-0.316477,-0.645902,0.575228,-0.114788,-0.152018,-0.098363,-0.180304,-0.163415,-0.195909,0.402876,-0.288554,-0.944267,-0.459145,-0.026171,0.149645,-0.111688,-0.069385,-0.037024,-0.052396,0.984706,-0.186288,-0.444486,-0.026171,-0.643774,-0.263722,0.263722,1.161454,-0.120201,0.370207,1.107431,-0.240978,0.78947,1.227165,0.163723,-0.211381,-0.27107,-0.16561,1.220838,-1.006528,0.911897,-0.098363,-0.058601,-0.147237,-0.154359,-0.10185,-0.026171,0.27107,-0.950901,-0.129235,-0.152018,-0.592968,1.05602,-0.117811,-0.522206,-0.064216,0.823223,-0.114788,-0.253172,-0.07873,-0.600353,-0.242277,1.00706,-0.563446,-0.242277,1.567811,-0.840903,0.311618,0.35088,-0.045361,-0.184312,-0.098363,-0.242277,-0.045361,0.33701,-0.037024,-0.156667,-0.07873,-0.242277,-0.069385,0.317784,-0.25622,-0.144792,0.29915,-0.751918,0.216429,-0.116299,-0.270116,-0.068668,-0.037024,-0.037024,-0.045361,0.069385,-0.205144,-0.195909,-0.346999,-0.087099,0.488031,-0.037024,0.195909,-0.037024,-0.186288,-0.026171,-0.087658,-1.598563,0.13873,-0.174141,-0.037024,-0.07873,-0.058601,-0.058601,-0.052396,-0.301858,-0.045361,0.390159,-0.272522,-0.052396,-0.091003,-0.117811,0.467491,-0.30589,208500.0
1,2,-0.251638,-0.212287,-0.083017,-0.144792,1.312517,-0.222645,-0.052396,-0.091003,-0.330677,-0.507307,-0.206949,-0.105227,-0.203325,-0.117811,-0.192111,-0.083017,-0.215785,-0.105227,0.517956,-0.418812,0.340726,-0.091855,-0.064216,0.064216,-0.188246,0.257733,-0.169923,-0.703962,-0.169923,-0.083017,0.760251,-0.212287,-0.188246,-0.158945,0.33701,0.026171,-0.026171,-0.468578,-0.262234,5.481171,-0.052396,-1.605199,0.23749,-0.215785,-0.094752,-0.108503,-0.037024,-0.105227,-0.203325,-0.139784,-0.338268,-0.190187,-0.27107,-0.239094,-0.161194,-0.108503,-0.186288,-0.426687,-0.169923,-0.07873,-0.235877,-0.229337,-0.289539,-0.230986,-0.205144,-0.250096,-0.131946,-0.131946,-0.163415,11.473319,-0.184312,4.124686,-2.50912,-0.074202,-0.114788,-0.087099,-0.134606,-0.037024,-0.058601,-0.037024,-0.064216,0.10185,-0.026171,-0.037024,-0.026171,-0.026171,-0.037024,0.443381,-0.147237,-0.192111,-0.174141,-0.290925,-0.343273,-0.098363,1.00515,-0.074202,-0.087099,-0.661909,-0.161194,-0.215785,-0.037024,-0.111688,-0.045361,-0.117811,-0.293684,-0.610914,1.703454,-0.528571,-0.360475,-0.174141,-0.026171,-0.058601,-0.131946,-0.201493,-1.133111,-0.456581,-0.404023,4.389143,-0.123647,0.15668,-0.42943,-0.094752,0.528571,-0.087099,-0.493401,-0.069385,-0.037024,-0.026171,0.134606,-0.026171,-0.026171,-0.026171,-0.087099,-0.058601,-0.064216,-0.117811,-0.026171,-0.037024,-0.188246,-0.026171,-0.208741,-0.423319,-0.026171,2.37329,-0.282537,-0.037024,-0.131946,-0.73797,-0.405169,-0.134606,-0.117811,-0.045361,-0.069385,-0.131946,-0.026171,-0.206949,-0.406313,-0.083017,2.412145,-0.026171,-0.328124,-0.058601,-0.134606,-0.725834,-0.394805,-0.163415,-0.10185,-0.661909,0.820884,-0.309888,-0.570555,-0.192111,-0.098363,-0.708318,0.781703,-0.045361,-0.139784,-0.333219,-0.026171,0.372492,-0.333219,1.141029,-0.891781,-0.129235,-0.064216,-0.045361,-0.300506,-0.156667,1.166845,-0.161194,-0.894259,-0.17827,-0.215785,-0.161194,-0.037024,0.33701,-0.422194,3.144637,-0.290925,-0.163415,-1.370546,2.37329,-0.335749,-0.633148,-0.230986,-0.161194,-0.316477,-0.645902,1.171591,-0.114788,-0.152018,-0.098363,-0.180304,-0.163415,-0.195909,0.402876,-0.288554,-0.641008,0.466305,-0.026171,0.149645,-0.111688,-0.069385,-0.037024,-0.052396,0.984706,-0.186288,-0.444486,-0.026171,-0.643774,-0.263722,0.263722,-0.794891,-0.120201,-0.482347,-0.819684,3.947457,0.78947,-0.76136,0.163723,-0.211381,-0.27107,-0.16561,-0.818548,0.992834,-0.318574,-0.098363,-0.058601,-0.147237,-0.154359,-0.10185,-0.026171,0.27107,0.600289,-0.129235,-0.152018,-0.592968,-0.946303,-0.117811,1.913642,-0.064216,0.823223,-0.114788,-0.253172,-0.07873,-0.600353,-0.242277,-0.019293,-0.563446,-0.242277,1.567811,-0.840903,0.311618,-0.06071,-0.045361,-0.184312,-0.098363,-0.242277,-0.045361,0.33701,-0.037024,-0.156667,-0.07873,-0.242277,-0.069385,0.317784,-0.25622,-0.144792,0.29915,1.625638,-0.704242,-0.116299,-0.270116,-0.068668,-0.037024,-0.037024,-0.045361,0.069385,-0.205144,-0.195909,-0.346999,-0.087099,0.488031,-0.037024,0.195909,-0.037024,-0.186288,-0.026171,-0.087658,-0.488943,-0.614228,-0.174141,-0.037024,-0.07873,-0.058601,-0.058601,-0.052396,-0.301858,-0.045361,0.390159,-0.272522,-0.052396,-0.091003,-0.117811,0.467491,-0.30589,181500.0
2,3,-0.251638,-0.212287,-0.083017,-0.144792,-0.761373,-0.222645,-0.052396,-0.091003,-0.330677,1.969844,-0.206949,-0.105227,-0.203325,-0.117811,-0.192111,-0.083017,-0.215785,-0.105227,0.517956,-0.418812,-0.123975,0.073455,-0.064216,0.064216,-0.188246,0.257733,-0.169923,1.419559,-0.169923,-0.083017,-1.314453,-0.212287,-0.188246,-0.158945,0.33701,0.026171,-0.026171,-0.468578,-0.262234,-0.182318,-0.052396,0.622549,0.23749,-0.215785,-0.094752,-0.108503,-0.037024,-0.105227,-0.203325,-0.139784,2.954209,-0.190187,-0.27107,-0.239094,-0.161194,-0.108503,-0.186288,-0.426687,-0.169923,-0.07873,-0.235877,-0.229337,-0.289539,-0.230986,-0.205144,-0.250096,-0.131946,-0.131946,-0.163415,-0.087099,-0.184312,-0.242277,0.398273,-0.074202,-0.114788,-0.087099,-0.134606,-0.037024,-0.058601,-0.037024,-0.064216,0.10185,-0.026171,-0.037024,-0.026171,-0.026171,-0.037024,0.443381,-0.147237,-0.192111,-0.174141,-0.290925,-0.343273,-0.098363,-0.994195,-0.074202,-0.087099,1.509747,-0.161194,-0.215785,-0.037024,-0.111688,-0.045361,-0.117811,-0.293684,-0.610914,-0.586641,1.890596,-0.360475,-0.174141,-0.026171,-0.058601,-0.131946,-0.201493,0.881922,-0.456581,-0.404023,-0.227679,-0.123647,0.984415,0.82993,-0.094752,0.528571,-0.087099,-0.493401,-0.069385,-0.037024,-0.026171,0.134606,-0.026171,-0.026171,-0.026171,-0.087099,-0.058601,-0.064216,-0.117811,-0.026171,-0.037024,-0.188246,-0.026171,-0.208741,-0.423319,-0.026171,-0.421067,-0.282537,-0.037024,-0.131946,1.35414,-0.405169,-0.134606,-0.117811,-0.045361,-0.069385,-0.131946,-0.026171,-0.206949,-0.406313,-0.083017,-0.414285,-0.026171,-0.328124,-0.058601,-0.134606,1.376781,-0.394805,-0.163415,-0.10185,1.509747,-1.217365,-0.309888,0.325803,-0.192111,-0.098363,1.410829,-1.278381,-0.045361,-0.139784,-0.333219,-0.026171,0.372492,-0.333219,-0.875802,1.120584,-0.129235,-0.064216,-0.045361,-0.300506,-0.156667,1.166845,-0.161194,-0.894259,-0.17827,-0.215785,-0.161194,-0.037024,0.33701,-0.422194,-0.317784,3.434957,-0.163415,-1.370546,-0.421067,-0.335749,1.578327,-0.230986,-0.161194,-0.316477,-0.645902,0.092875,-0.114788,-0.152018,-0.098363,-0.180304,-0.163415,-0.195909,0.402876,-0.288554,-0.30154,-0.313261,-0.026171,0.149645,-0.111688,-0.069385,-0.037024,-0.052396,0.984706,-0.186288,-0.444486,-0.026171,-0.643774,-0.263722,0.263722,1.188943,-0.120201,0.514836,1.107431,-0.240978,0.78947,1.227165,0.163723,-0.211381,-0.27107,-0.16561,1.220838,-1.006528,-0.318574,-0.098363,-0.058601,-0.147237,-0.154359,-0.10185,-0.026171,0.27107,0.600289,-0.129235,-0.152018,-0.592968,-0.946303,-0.117811,1.913642,-0.064216,0.823223,-0.114788,-0.253172,-0.07873,-0.600353,-0.242277,0.931034,-0.563446,-0.242277,1.567811,-0.840903,0.311618,0.63151,-0.045361,-0.184312,-0.098363,-0.242277,-0.045361,0.33701,-0.037024,-0.156667,-0.07873,-0.242277,-0.069385,0.317784,-0.25622,-0.144792,0.29915,-0.751918,-0.070337,-0.116299,-0.270116,-0.068668,-0.037024,-0.037024,-0.045361,0.069385,-0.205144,-0.195909,-0.346999,-0.087099,0.488031,-0.037024,0.195909,-0.037024,-0.186288,-0.026171,-0.087658,0.990552,0.13873,-0.174141,-0.037024,-0.07873,-0.058601,-0.058601,-0.052396,-0.301858,-0.045361,0.390159,-0.272522,-0.052396,-0.091003,-0.117811,0.467491,-0.30589,223500.0


In [7]:
houses_train.info()
houses_test.info()

<class 'pandas.core.frame.DataFrame'>
RangeIndex: 1460 entries, 0 to 1459
Columns: 328 entries, Unnamed: 0 to SalePrice
dtypes: float64(327), int64(1)
memory usage: 3.7 MB
<class 'pandas.core.frame.DataFrame'>
RangeIndex: 1459 entries, 0 to 1458
Columns: 328 entries, Unnamed: 0 to SalePrice
dtypes: float64(308), int64(20)
memory usage: 3.7 MB


Delete first column

In [8]:
houses_train.drop('Unnamed: 0', axis=1, inplace=True, errors='raise')
houses_test.drop('Unnamed: 0', axis=1, inplace=True, errors='raise')

# Run xgboost

### Create private training & test set

In [9]:
from sklearn.model_selection import train_test_split

seed = 10
test_ratio = 0.2

X = houses_train.loc[:, houses_train.columns != "SalePrice"]
y = houses_train.loc[:, houses_train.columns == "SalePrice"]

# Take log of SalePrice
y = log(y + 1)


In [None]:
X_pr_train, X_pr_test, y_pr_train, y_pr_test = train_test_split(X, y, test_size=test_ratio, random_state=seed)

In [11]:
y_pr_train.shape
y_pr_train.ravel().shape

(1168, 1)

### Fit Model

In [None]:
from xgboost import XGBClassifier

model = XGBClassifier()
model.fit(X_pr_train, y_pr_train)

  y = column_or_1d(y, warn=True)
  y = column_or_1d(y, warn=True)


In [None]:
from xgboost import XGBClassifier

# run with log of y

model = XGBClassifier()
model.fit(X_pr_train, y_pr_train.ravel())

In [None]:
# make predictions for test data
y_pr_pred = model.predict(X_pr_test)
predictions = [round(value) for value in y_pr_pred]

Evaluate predictions

In [None]:
from sklearn.metrics import mean_squared_error

mse = mean_squared_error(y_pr_test, predictions)
rmse = np.sqrt(final_mse)
