# Feature Selection Advanced House Price Prediction

## The main aim of this project is to predict house prices from a variety of features, which are discussed as we go along
## The dataset can be downloaded from the link below
#### https://www.kaggle.com/c/house-prices-advanced-regression-techniques/data

In [176]:
import pandas as pd
import numpy as np

import matplotlib.pyplot as plt
%matplotlib inline

## for feature selection

from sklearn.linear_model import Lasso
from sklearn.feature_selection import SelectFromModel

# Show all the columns when a DataFrame is displayed (None removes the limit).
# Uses the public pd.set_option entry point; `pd.pandas` is merely a
# self-reference to the package and not part of the documented API.
pd.set_option('display.max_columns', None)

In [177]:
# Load the prepared training table from the CSV file in the working directory.
dataset = pd.read_csv(filepath_or_buffer='X_train.csv')
# Shape of a five-row preview; the second entry is the number of columns.
dataset.head(5).shape

(5, 381)

In [178]:
## Capture the dependent feature (the target passed to the selector's fit).
# The double brackets keep y_train as a one-column DataFrame, not a Series.
y_train=dataset[['SalePrice']]


In [179]:
## Build the feature matrix: everything except the row identifier and the
## dependent feature.
X_train = dataset.drop(labels=['Id', 'SalePrice'], axis='columns')
# Shape of a five-row preview; the second entry is the number of features.
X_train.head(5).shape

(5, 379)

In [180]:
### Apply Feature Selection
# A Lasso regression serves as the selection estimator. Its alpha is the
# penalty strength: the larger the alpha, the fewer features get selected.
#
# SelectFromModel wraps that estimator and keeps the features whose fitted
# coefficients are non-zero (see its `threshold` documentation for the exact
# cut-off applied when no threshold is given).

# random_state is pinned so the seed is fixed for this step.
feature_sel_model = SelectFromModel(
    estimator=Lasso(alpha=0.005, random_state=0),
)
feature_sel_model.fit(X_train, y_train)



SelectFromModel(estimator=Lasso(alpha=0.005, copy_X=True, fit_intercept=True, max_iter=1000,
   normalize=False, positive=False, precompute=False, random_state=0,
   selection='cyclic', tol=0.0001, warm_start=False),
        norm_order=1, prefit=False, threshold=None)

In [181]:
# Boolean mask from the fitted selector, one entry per column of X_train;
# True marks a feature that was kept.
feature_sel_model.get_support()

array([ True,  True,  True,  True,  True,  True,  True,  True,  True,
        True,  True,  True,  True,  True,  True,  True,  True,  True,
        True,  True,  True,  True,  True,  True,  True,  True,  True,
        True,  True,  True,  True,  True,  True,  True,  True,  True,
        True,  True,  True,  True,  True,  True,  True,  True,  True,
        True,  True,  True,  True,  True,  True,  True,  True,  True,
        True,  True,  True,  True,  True,  True,  True,  True,  True,
        True,  True,  True,  True,  True,  True,  True,  True,  True,
        True,  True,  True,  True,  True,  True,  True,  True,  True,
        True,  True,  True,  True,  True,  True,  True,  True,  True,
        True,  True,  True,  True,  True,  True,  True,  True,  True,
        True,  True,  True,  True,  True,  True,  True,  True,  True,
        True,  True,  True,  True,  True,  True,  True,  True,  True,
        True,  True,  True,  True,  True,  True,  True,  True,  True,
        True,  True,

In [182]:
# Report how many features there are in total and how many were selected.

# Labels of the X_train columns flagged True by the selector's support mask.
selected_feat = X_train.columns[feature_sel_model.get_support()]

# Summary counts: all features, kept features, and coefficients that the
# fitted estimator set exactly to zero.
print('total features: {}'.format(X_train.shape[1]))
print('selected features: {}'.format(selected_feat.size))
print('features with coefficients shrank to zero: {}'.format(
    (feature_sel_model.estimator_.coef_ == 0).sum()))

total features: 379
selected features: 378
features with coefficients shrank to zero: 1


In [183]:
# Display the column labels that passed the selection step.
selected_feat

Index(['MSSubClass', 'LotFrontage', 'LotArea', 'OverallQual', 'OverallCond',
       'YearBuilt', 'YearRemodAdd', 'MasVnrArea', 'BsmtFinSF1', 'BsmtFinSF2',
       ...
       'Fence_missing.1', 'MiscFeature_Shed.1', 'MiscFeature_missing.1',
       'SaleType_New.1', 'SaleType_Rare_var.1', 'SaleType_WD.1',
       'SaleCondition_Family.1', 'SaleCondition_Normal.1',
       'SaleCondition_Partial.1', 'SaleCondition_Rare_var.1'],
      dtype='object', length=378)

In [184]:
# Restrict the training table to the columns kept by the selector.
X_train_data=X_train[selected_feat]

In [185]:

# Preview the first rows of the selected-feature table.
X_train_data.head()

Unnamed: 0,MSSubClass,LotFrontage,LotArea,OverallQual,OverallCond,YearBuilt,YearRemodAdd,MasVnrArea,BsmtFinSF1,BsmtFinSF2,BsmtUnfSF,TotalBsmtSF,1stFlrSF,2ndFlrSF,LowQualFinSF,GrLivArea,BsmtFullBath,BsmtHalfBath,FullBath,HalfBath,BedroomAbvGr,KitchenAbvGr,TotRmsAbvGrd,Fireplaces,GarageYrBlt,GarageCars,GarageArea,WoodDeckSF,OpenPorchSF,EnclosedPorch,3SsnPorch,ScreenPorch,PoolArea,MiscVal,MoSold,YrSold,LotFrontage_nan,MasVnrArea_nan,GarageYrBlt_nan,MSZoning_RH,MSZoning_RL,MSZoning_RM,MSZoning_Rare_var,Street_Rare_var,Alley_Pave,Alley_missing,LotShape_IR2,LotShape_Rare_var,LotShape_Reg,LandContour_HLS,LandContour_Low,LandContour_Lvl,Utilities_Rare_var,LotConfig_CulDSac,LotConfig_FR2,LotConfig_Inside,LotConfig_Rare_var,LandSlope_Mod,LandSlope_Rare_var,Neighborhood_BrDale,Neighborhood_BrkSide,Neighborhood_ClearCr,Neighborhood_CollgCr,Neighborhood_Crawfor,Neighborhood_Edwards,Neighborhood_Gilbert,Neighborhood_IDOTRR,Neighborhood_MeadowV,Neighborhood_Mitchel,Neighborhood_NAmes,Neighborhood_NWAmes,Neighborhood_NoRidge,Neighborhood_NridgHt,Neighborhood_OldTown,Neighborhood_Rare_var,Neighborhood_SWISU,Neighborhood_Sawyer,Neighborhood_SawyerW,Neighborhood_Somerst,Neighborhood_StoneBr,Neighborhood_Timber,Condition1_Feedr,Condition1_Norm,Condition1_PosN,Condition1_RRAn,Condition1_Rare_var,Condition2_Rare_var,BldgType_2fmCon,BldgType_Duplex,BldgType_Twnhs,BldgType_TwnhsE,HouseStyle_1Story,HouseStyle_2Story,HouseStyle_Rare_var,HouseStyle_SFoyer,HouseStyle_SLvl,RoofStyle_Hip,RoofStyle_Rare_var,RoofMatl_Rare_var,Exterior1st_BrkFace,Exterior1st_CemntBd,Exterior1st_HdBoard,Exterior1st_MetalSd,Exterior1st_Plywood,Exterior1st_Rare_var,Exterior1st_Stucco,Exterior1st_VinylSd,Exterior1st_Wd Sdng,Exterior1st_WdShing,Exterior2nd_BrkFace,Exterior2nd_CmentBd,Exterior2nd_HdBoard,Exterior2nd_MetalSd,Exterior2nd_Plywood,Exterior2nd_Rare_var,Exterior2nd_Stucco,Exterior2nd_VinylSd,Exterior2nd_Wd Sdng,Exterior2nd_Wd 
Shng,MasVnrType_BrkFace,MasVnrType_None,MasVnrType_Rare_var,MasVnrType_Stone,ExterQual_Gd,ExterQual_Rare_var,ExterQual_TA,ExterCond_Gd,ExterCond_Rare_var,ExterCond_TA,Foundation_CBlock,Foundation_PConc,Foundation_Rare_var,Foundation_Slab,BsmtQual_Fa,BsmtQual_Gd,BsmtQual_TA,BsmtQual_missing,BsmtCond_Gd,BsmtCond_Rare_var,BsmtCond_TA,BsmtCond_missing,BsmtExposure_Gd,BsmtExposure_Mn,BsmtExposure_No,BsmtExposure_missing,BsmtFinType1_BLQ,BsmtFinType1_GLQ,BsmtFinType1_LwQ,BsmtFinType1_Rec,BsmtFinType1_Unf,BsmtFinType1_missing,BsmtFinType2_BLQ,BsmtFinType2_LwQ,BsmtFinType2_Rare_var,BsmtFinType2_Rec,BsmtFinType2_Unf,BsmtFinType2_missing,Heating_GasW,Heating_Rare_var,HeatingQC_Fa,HeatingQC_Gd,HeatingQC_Rare_var,HeatingQC_TA,CentralAir_Y,Electrical_FuseF,Electrical_Rare_var,Electrical_SBrkr,KitchenQual_Fa,KitchenQual_Gd,KitchenQual_TA,Functional_Min2,Functional_Mod,Functional_Rare_var,Functional_Typ,FireplaceQu_Fa,FireplaceQu_Gd,FireplaceQu_Po,FireplaceQu_TA,FireplaceQu_missing,GarageType_Basment,GarageType_BuiltIn,GarageType_Detchd,GarageType_Rare_var,GarageType_missing,GarageFinish_RFn,GarageFinish_Unf,GarageFinish_missing,GarageQual_Rare_var,GarageQual_TA,GarageQual_missing,GarageCond_Rare_var,GarageCond_TA,GarageCond_missing,PavedDrive_P,PavedDrive_Y,PoolQC_missing,Fence_GdWo,Fence_MnPrv,Fence_Rare_var,Fence_missing,MiscFeature_Shed,MiscFeature_missing,SaleType_New,SaleType_Rare_var,SaleType_WD,SaleCondition_Family,SaleCondition_Normal,SaleCondition_Partial,SaleCondition_Rare_var,MSZoning_RH.1,MSZoning_RL.1,MSZoning_RM.1,MSZoning_Rare_var.1,Street_Rare_var.1,Alley_Pave.1,Alley_missing.1,LotShape_IR2.1,LotShape_Rare_var.1,LotShape_Reg.1,LandContour_HLS.1,LandContour_Low.1,LandContour_Lvl.1,Utilities_Rare_var.1,LotConfig_CulDSac.1,LotConfig_FR2.1,LotConfig_Inside.1,LotConfig_Rare_var.1,LandSlope_Mod.1,LandSlope_Rare_var.1,Neighborhood_BrDale.1,Neighborhood_BrkSide.1,Neighborhood_ClearCr.1,Neighborhood_CollgCr.1,Neighborhood_Crawfor.1,Neighborhood_Edwards.1,Neighborhood_Gilbe
rt.1,Neighborhood_IDOTRR.1,Neighborhood_MeadowV.1,Neighborhood_Mitchel.1,Neighborhood_NAmes.1,Neighborhood_NWAmes.1,Neighborhood_NoRidge.1,Neighborhood_NridgHt.1,Neighborhood_OldTown.1,Neighborhood_Rare_var.1,Neighborhood_SWISU.1,Neighborhood_Sawyer.1,Neighborhood_SawyerW.1,Neighborhood_Somerst.1,Neighborhood_StoneBr.1,Neighborhood_Timber.1,Condition1_Feedr.1,Condition1_Norm.1,Condition1_PosN.1,Condition1_RRAn.1,Condition1_Rare_var.1,Condition2_Rare_var.1,BldgType_2fmCon.1,BldgType_Duplex.1,BldgType_Twnhs.1,BldgType_TwnhsE.1,HouseStyle_1Story.1,HouseStyle_2Story.1,HouseStyle_Rare_var.1,HouseStyle_SFoyer.1,HouseStyle_SLvl.1,RoofStyle_Hip.1,RoofStyle_Rare_var.1,RoofMatl_Rare_var.1,Exterior1st_BrkFace.1,Exterior1st_CemntBd.1,Exterior1st_HdBoard.1,Exterior1st_MetalSd.1,Exterior1st_Plywood.1,Exterior1st_Rare_var.1,Exterior1st_Stucco.1,Exterior1st_VinylSd.1,Exterior1st_Wd Sdng.1,Exterior1st_WdShing.1,Exterior2nd_BrkFace.1,Exterior2nd_CmentBd.1,Exterior2nd_HdBoard.1,Exterior2nd_MetalSd.1,Exterior2nd_Plywood.1,Exterior2nd_Rare_var.1,Exterior2nd_Stucco.1,Exterior2nd_VinylSd.1,Exterior2nd_Wd Sdng.1,Exterior2nd_Wd 
Shng.1,MasVnrType_BrkFace.1,MasVnrType_None.1,MasVnrType_Stone.1,ExterQual_Gd.1,ExterQual_Rare_var.1,ExterQual_TA.1,ExterCond_Gd.1,ExterCond_Rare_var.1,ExterCond_TA.1,Foundation_CBlock.1,Foundation_PConc.1,Foundation_Rare_var.1,Foundation_Slab.1,BsmtQual_Fa.1,BsmtQual_Gd.1,BsmtQual_TA.1,BsmtQual_missing.1,BsmtCond_Gd.1,BsmtCond_Rare_var.1,BsmtCond_TA.1,BsmtCond_missing.1,BsmtExposure_Gd.1,BsmtExposure_Mn.1,BsmtExposure_No.1,BsmtExposure_missing.1,BsmtFinType1_BLQ.1,BsmtFinType1_GLQ.1,BsmtFinType1_LwQ.1,BsmtFinType1_Rec.1,BsmtFinType1_Unf.1,BsmtFinType1_missing.1,BsmtFinType2_BLQ.1,BsmtFinType2_LwQ.1,BsmtFinType2_Rare_var.1,BsmtFinType2_Rec.1,BsmtFinType2_Unf.1,BsmtFinType2_missing.1,Heating_GasW.1,Heating_Rare_var.1,HeatingQC_Fa.1,HeatingQC_Gd.1,HeatingQC_Rare_var.1,HeatingQC_TA.1,CentralAir_Y.1,Electrical_FuseF.1,Electrical_Rare_var.1,Electrical_SBrkr.1,KitchenQual_Fa.1,KitchenQual_Gd.1,KitchenQual_TA.1,Functional_Min2.1,Functional_Mod.1,Functional_Rare_var.1,Functional_Typ.1,FireplaceQu_Fa.1,FireplaceQu_Gd.1,FireplaceQu_Po.1,FireplaceQu_TA.1,FireplaceQu_missing.1,GarageType_Basment.1,GarageType_BuiltIn.1,GarageType_Detchd.1,GarageType_Rare_var.1,GarageType_missing.1,GarageFinish_RFn.1,GarageFinish_Unf.1,GarageFinish_missing.1,GarageQual_Rare_var.1,GarageQual_TA.1,GarageQual_missing.1,GarageCond_Rare_var.1,GarageCond_TA.1,GarageCond_missing.1,PavedDrive_P.1,PavedDrive_Y.1,PoolQC_missing.1,Fence_GdWo.1,Fence_MnPrv.1,Fence_Rare_var.1,Fence_missing.1,MiscFeature_Shed.1,MiscFeature_missing.1,SaleType_New.1,SaleType_Rare_var.1,SaleType_WD.1,SaleCondition_Family.1,SaleCondition_Normal.1,SaleCondition_Partial.1,SaleCondition_Rare_var.1
0,0.235294,0.418208,0.366344,0.666667,0.5,0.036765,0.098361,0.1225,0.125089,0.0,0.064212,0.140098,0.356155,0.413559,0.0,0.577712,0.333333,0.0,0.666667,0.5,0.375,0.333333,0.5,0.0,0.046729,0.5,0.38646,0.0,0.111517,0.0,0.0,0.0,0.0,0.0,0.090909,0.5,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,1.0,0.0,0.0,1.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,1.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,1.0,0.0,1.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,1.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,1.0,0.0,1.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,1.0,0.0,0.0,1.0,0.0,0.0,1.0,1.0,0.0,0.0,0.0,1.0,0.0,1.0,0.0,0.0,1.0,0.0,1.0,0.0,0.0,0,1,0,0,0,0,1,0,0,1,0,0,1,0,0,0,1,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,1,0,0,1,0,0,1,0,0,0,0,1,0,1,0,0,0,1,0,0,0,0,1,0,0,0,1,0,0,1,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,1,0,0,1,0,1,0,0,0,0,1,0,0,0,0,1,0,0,0,0,0,1,0,0,0,1,0,0,1,0,0,1,1,0,0,0,1,0,1,0,0,1,0,1,0,0
1,0.0,0.495064,0.391317,0.555556,0.875,0.227941,0.52459,0.0,0.173281,0.0,0.121575,0.206547,0.503056,0.0,0.0,0.470245,0.0,0.5,0.666667,0.0,0.375,0.333333,0.333333,0.333333,0.28972,0.5,0.324401,0.347725,0.0,0.0,0.0,0.0,0.0,0.0,0.363636,0.25,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,1.0,0.0,0.0,1.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,1.0,1.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,1.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,1.0,0.0,0.0,1.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,1.0,0.0,0.0,1.0,0.0,0.0,1.0,1.0,0.0,0.0,0.0,1.0,0.0,1.0,0.0,0.0,1.0,0.0,1.0,0.0,0.0,0,1,0,0,0,0,1,0,0,1,0,0,1,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,1,0,0,0,1,0,0,1,1,0,0,0,0,1,0,0,0,0,1,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,1,0,0,1,0,0,1,0,0,0,1,0,0,0,1,0,0,0,0,0,0,1,0,0,0,1,0,0,1,0,0,1,1,0,0,0,1,0,1,0,0,1,0,1,0,0
2,0.235294,0.434909,0.422359,0.666667,0.5,0.051471,0.114754,0.10125,0.086109,0.0,0.185788,0.150573,0.383441,0.41937,0.0,0.593095,0.333333,0.0,0.666667,0.5,0.375,0.333333,0.333333,0.333333,0.065421,0.5,0.428773,0.0,0.076782,0.0,0.0,0.0,0.0,0.0,0.727273,0.5,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,1.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,1.0,0.0,1.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,1.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,1.0,0.0,1.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,1.0,0.0,0.0,1.0,0.0,0.0,1.0,1.0,0.0,0.0,0.0,1.0,0.0,1.0,0.0,0.0,1.0,0.0,1.0,0.0,0.0,0,1,0,0,0,0,1,0,0,0,0,0,1,0,0,0,1,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,1,0,0,1,0,0,1,0,0,0,0,1,0,1,0,0,0,1,0,0,0,0,1,0,0,1,0,0,0,1,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,1,0,0,1,0,1,0,0,0,0,1,0,0,0,1,0,0,0,0,0,0,1,0,0,0,1,0,0,1,0,0,1,1,0,0,0,1,0,1,0,0,1,0,1,0,0
3,0.294118,0.388581,0.390295,0.666667,0.5,0.669118,0.606557,0.0,0.038271,0.0,0.231164,0.123732,0.399941,0.366102,0.0,0.579157,0.333333,0.0,0.333333,0.0,0.375,0.333333,0.416667,0.333333,0.074766,0.75,0.45275,0.0,0.063985,0.492754,0.0,0.0,0.0,0.0,0.090909,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,1.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,1.0,0.0,0.0,1.0,0.0,1.0,0.0,0.0,0.0,0.0,1.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,1.0,0.0,0.0,1.0,0.0,0.0,1.0,0.0,0.0,1.0,1.0,0.0,0.0,0.0,1.0,0.0,1.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0,1,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,1,0,1,0,0,0,1,0,0,1,0,0,0,0,0,0,1,0,1,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,1,0,0,1,0,0,1,0,1,0,0,0,0,1,0,1,0,0,0,0,0,1,0,0,0,1,0,0,1,0,0,1,0,0,1,1,0,0,0,1,0,1,0,0,1,0,0,0,0
4,0.235294,0.513123,0.468761,0.777778,0.5,0.058824,0.147541,0.21875,0.116052,0.0,0.20976,0.187398,0.466237,0.509927,0.0,0.666523,0.333333,0.0,0.666667,0.5,0.5,0.333333,0.583333,0.333333,0.074766,0.75,0.589563,0.224037,0.153565,0.0,0.0,0.0,0.0,0.0,1.0,0.5,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,1.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,1.0,0.0,1.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,1.0,0.0,1.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,1.0,0.0,0.0,1.0,0.0,0.0,1.0,1.0,0.0,0.0,0.0,1.0,0.0,1.0,0.0,0.0,1.0,0.0,1.0,0.0,0.0,0,1,0,0,0,0,1,0,0,0,0,0,1,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,1,0,0,1,0,0,1,0,0,0,0,1,0,1,0,0,0,1,0,0,0,0,1,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,1,0,0,1,0,1,0,0,0,0,1,0,0,0,1,0,0,0,0,0,0,1,0,0,0,1,0,0,1,0,0,1,1,0,0,0,1,0,1,0,0,1,0,1,0,0


In [186]:
# (rows, columns) of the selected-feature table.
X_train_data.shape

(1460, 378)

In [187]:
# Write the selected-feature table to CSV; index=False leaves the row index
# out of the file.
X_train_data.to_csv('X_train_selected_feature.csv',index=False)

In [188]:
# Write the dependent feature to its own CSV, again without the row index.
y_train.to_csv('train_data_feature_y_final.csv',index=False)

In [189]:
# List the column labels of the selected-feature table.
X_train_data.columns

Index(['MSSubClass', 'LotFrontage', 'LotArea', 'OverallQual', 'OverallCond',
       'YearBuilt', 'YearRemodAdd', 'MasVnrArea', 'BsmtFinSF1', 'BsmtFinSF2',
       ...
       'Fence_missing.1', 'MiscFeature_Shed.1', 'MiscFeature_missing.1',
       'SaleType_New.1', 'SaleType_Rare_var.1', 'SaleType_WD.1',
       'SaleCondition_Family.1', 'SaleCondition_Normal.1',
       'SaleCondition_Partial.1', 'SaleCondition_Rare_var.1'],
      dtype='object', length=378)