## Data Preprocessing- Gurgaon Independent Houses Data
### @cipher499
### 06/12/23

In [1]:
import pandas as pd
import numpy as np
import re

In [2]:
# setting to display all the columns and rows in the data
pd.set_option('display.max_rows', None)
pd.set_option('display.max_columns', None)

In [3]:
# read the data into a dataframe
df = pd.read_excel('data/gurgaon/independent_houses/independent_houses.xlsx')
df.head()

Unnamed: 0,property_name,society,price,rate,area,areaWithType,bedrooms,bathrooms,balconies,additional_room,address,num_floor,facing,age_possession,nearby_locations,description,furnish_details,features,rating
0,5 Bedroom House for sale in Sector 70A Gurgaon,Bptp Visionnaire,5.25 Crore,"₹ 20,115/sq.ft.",(242 sq.m.) Plot Area,Plot area 290(242.48 sq.m.),5 Bedrooms,4 Bathrooms,3+ Balconies,Servant Room,"29b, Sector 70A Gurgaon, Gurgaon, Haryana",3 Floors,North-East,0 to 1 Year Old,"['Good Earth City Center 2', 'Kunskapsskolan I...",Do you wish to buy an independent house in sec...,"['1 Wardrobe', '1 Fan', '1 Exhaust Fan', '1 Ge...","['Feng Shui / Vaastu Compliant', 'Private Gard...","['Environment5 out of 5', 'Lifestyle4 out of 5..."
1,5 Bedroom House for sale in Sector 21A Faridabad,,5.7 Crore,"₹ 105,751/sq.ft.",(50 sq.m.) Plot Area,Plot area 539(50.07 sq.m.),5 Bedrooms,4 Bathrooms,2 Balconies,"Store Room,Pooja Room,Servant Room","Sector 21A Faridabad, Gurgaon, Haryana",2 Floors,,5 to 10 Year Old,,"Hi, we have an independent house/villa availab...","['1 Water Purifier', '5 Fan', '1 Exhaust Fan',...","['Private Garden / Terrace', 'Park', 'Visitor ...",
2,10 Bedroom House for sale in Sushant Lok Phase 1,,2.1 Crore,"₹ 38,251/sq.ft.",(51 sq.m.) Plot Area,Plot area 61(51 sq.m.),10 Bedrooms,10 Bathrooms,3+ Balconies,Servant Room,"Sushant Lok Phase 1, Gurgaon, Haryana",5 Floors,West,0 to 1 Year Old,"['Sector 42-43 metro station', 'Huda city cent...","Monthly rental income is rs1,40,000/- Best opt...","['10 Bed', '3 Fan', '10 Geyser', '2 Light', 'N...","['Maintenance Staff', 'Water Storage', 'Visito...","['Environment5 out of 5', 'Lifestyle5 out of 5..."
3,21 Bedroom House for sale in Sector 54 Gurgaon,,5 Crore,"₹ 43,066/sq.ft.",(108 sq.m.) Plot Area,Plot area 129(107.86 sq.m.),21 Bedrooms,21 Bathrooms,3+ Balconies,Servant Room,"Sector 54 Gurgaon, Gurgaon, Haryana",5 Floors,North,1 to 5 Year Old,"['Sector 53-54 metro station', 'Sector 54 chow...","129 sq yd plot size. 5 floors built up , fully...","['1 Water Purifier', '21 Fan', '1 Fridge', '1 ...","['Feng Shui / Vaastu Compliant', 'Private Gard...","['Environment4 out of 5', 'Lifestyle5 out of 5..."
4,12 Bedroom House for sale in Sushant Lok Phase 1,,3 Crore,"₹ 53,763/sq.ft.",(52 sq.m.) Plot Area,Plot area 62(51.84 sq.m.),12 Bedrooms,12 Bathrooms,3+ Balconies,Others,"1228, Sushant Lok Phase 1, Gurgaon, Haryana",5 Floors,West,Within 6 months,"['Sector 42-43 metro station', 'Huda city cent...",Best for investment purpose. Fully furnished b...,"['1 Water Purifier', '1 Fridge', '12 Fan', '1 ...","['Maintenance Staff', 'Water Storage', 'Visito...","['Environment5 out of 5', 'Lifestyle5 out of 5..."


In [4]:
# dimensions of the dataset
df.shape

(1082, 19)

In [5]:
# columns and their data types
df.info()

<class 'pandas.core.frame.DataFrame'>
RangeIndex: 1082 entries, 0 to 1081
Data columns (total 19 columns):
 #   Column            Non-Null Count  Dtype 
---  ------            --------------  ----- 
 0   property_name     1082 non-null   object
 1   society           463 non-null    object
 2   price             955 non-null    object
 3   rate              1041 non-null   object
 4   area              1082 non-null   object
 5   areaWithType      974 non-null    object
 6   bedrooms          974 non-null    object
 7   bathrooms         974 non-null    object
 8   balconies         974 non-null    object
 9   additional_room   578 non-null    object
 10  address           1018 non-null   object
 11  num_floor         955 non-null    object
 12  facing            662 non-null    object
 13  age_possession    974 non-null    object
 14  nearby_locations  900 non-null    object
 15  description       1023 non-null   object
 16  furnish_details   732 non-null    object
 17  features      

In [6]:
# check for null values
df.isnull().sum()

property_name         0
society             619
price               127
rate                 41
area                  0
areaWithType        108
bedrooms            108
bathrooms           108
balconies           108
additional_room     504
address              64
num_floor           127
facing              420
age_possession      108
nearby_locations    182
description          59
furnish_details     350
features            420
rating              188
dtype: int64

In [14]:
# remove duplicate rows
df = df[~df.duplicated()]
df.duplicated().sum()

0

In [15]:
# rename the area column
df.rename(columns={'area': 'price_per_sqft'}, inplace=True) 
df.head()

Unnamed: 0,property_name,society,price,rate,price_per_sqft,areaWithType,bedrooms,bathrooms,balconies,additional_room,address,num_floor,facing,age_possession,nearby_locations,description,furnish_details,features,rating
0,5 Bedroom House for sale in Sector 70A Gurgaon,Bptp Visionnaire,5.25 Crore,"₹ 20,115/sq.ft.",(242 sq.m.) Plot Area,Plot area 290(242.48 sq.m.),5 Bedrooms,4 Bathrooms,3+ Balconies,Servant Room,"29b, Sector 70A Gurgaon, Gurgaon, Haryana",3 Floors,North-East,0 to 1 Year Old,"['Good Earth City Center 2', 'Kunskapsskolan I...",Do you wish to buy an independent house in sec...,"['1 Wardrobe', '1 Fan', '1 Exhaust Fan', '1 Ge...","['Feng Shui / Vaastu Compliant', 'Private Gard...","['Environment5 out of 5', 'Lifestyle4 out of 5..."
1,5 Bedroom House for sale in Sector 21A Faridabad,,5.7 Crore,"₹ 105,751/sq.ft.",(50 sq.m.) Plot Area,Plot area 539(50.07 sq.m.),5 Bedrooms,4 Bathrooms,2 Balconies,"Store Room,Pooja Room,Servant Room","Sector 21A Faridabad, Gurgaon, Haryana",2 Floors,,5 to 10 Year Old,,"Hi, we have an independent house/villa availab...","['1 Water Purifier', '5 Fan', '1 Exhaust Fan',...","['Private Garden / Terrace', 'Park', 'Visitor ...",
2,10 Bedroom House for sale in Sushant Lok Phase 1,,2.1 Crore,"₹ 38,251/sq.ft.",(51 sq.m.) Plot Area,Plot area 61(51 sq.m.),10 Bedrooms,10 Bathrooms,3+ Balconies,Servant Room,"Sushant Lok Phase 1, Gurgaon, Haryana",5 Floors,West,0 to 1 Year Old,"['Sector 42-43 metro station', 'Huda city cent...","Monthly rental income is rs1,40,000/- Best opt...","['10 Bed', '3 Fan', '10 Geyser', '2 Light', 'N...","['Maintenance Staff', 'Water Storage', 'Visito...","['Environment5 out of 5', 'Lifestyle5 out of 5..."
3,21 Bedroom House for sale in Sector 54 Gurgaon,,5 Crore,"₹ 43,066/sq.ft.",(108 sq.m.) Plot Area,Plot area 129(107.86 sq.m.),21 Bedrooms,21 Bathrooms,3+ Balconies,Servant Room,"Sector 54 Gurgaon, Gurgaon, Haryana",5 Floors,North,1 to 5 Year Old,"['Sector 53-54 metro station', 'Sector 54 chow...","129 sq yd plot size. 5 floors built up , fully...","['1 Water Purifier', '21 Fan', '1 Fridge', '1 ...","['Feng Shui / Vaastu Compliant', 'Private Gard...","['Environment4 out of 5', 'Lifestyle5 out of 5..."
4,12 Bedroom House for sale in Sushant Lok Phase 1,,3 Crore,"₹ 53,763/sq.ft.",(52 sq.m.) Plot Area,Plot area 62(51.84 sq.m.),12 Bedrooms,12 Bathrooms,3+ Balconies,Others,"1228, Sushant Lok Phase 1, Gurgaon, Haryana",5 Floors,West,Within 6 months,"['Sector 42-43 metro station', 'Huda city cent...",Best for investment purpose. Fully furnished b...,"['1 Water Purifier', '1 Fridge', '12 Fan', '1 ...","['Maintenance Staff', 'Water Storage', 'Visito...","['Environment5 out of 5', 'Lifestyle5 out of 5..."


In [17]:
df.society.value_counts().sample(15)

Signature Global City 81                        1
Central Park                                    1
private house                                   1
secter 16a daultabad faridabad house no 313     1
Ashok vihar phase III Extension                 1
Unitech Uniworld Resorts                       14
Surat nagar phase 2                             1
Huda Floor                                      1
Puri Diplomatic Greens4.0 ★                     3
Vatika Sovereign Next                           1
Prem Kunj                                       1
DLF New Town Heights3.7 ★                       1
Shivaji Nagar Residential                       1
DLF Gardencity Enclave                          1
Sector 15 Part 2 RWA                            1
Name: society, dtype: int64

In [19]:
df.society.value_counts().shape

(188,)

In [20]:
# apply a regex transformation to the society column to parse out the society names
df.society = df.society.apply(lambda name: re.sub(r'\d+(\.\d+)?\s?★', '', str(name)).strip()).str.lower()
df.society.value_counts().shape

(186,)

In [22]:
df.head()

Unnamed: 0,property_name,society,price,rate,price_per_sqft,areaWithType,bedrooms,bathrooms,balconies,additional_room,address,num_floor,facing,age_possession,nearby_locations,description,furnish_details,features,rating
0,5 Bedroom House for sale in Sector 70A Gurgaon,bptp visionnaire,5.25 Crore,"₹ 20,115/sq.ft.",(242 sq.m.) Plot Area,Plot area 290(242.48 sq.m.),5 Bedrooms,4 Bathrooms,3+ Balconies,Servant Room,"29b, Sector 70A Gurgaon, Gurgaon, Haryana",3 Floors,North-East,0 to 1 Year Old,"['Good Earth City Center 2', 'Kunskapsskolan I...",Do you wish to buy an independent house in sec...,"['1 Wardrobe', '1 Fan', '1 Exhaust Fan', '1 Ge...","['Feng Shui / Vaastu Compliant', 'Private Gard...","['Environment5 out of 5', 'Lifestyle4 out of 5..."
1,5 Bedroom House for sale in Sector 21A Faridabad,,5.7 Crore,"₹ 105,751/sq.ft.",(50 sq.m.) Plot Area,Plot area 539(50.07 sq.m.),5 Bedrooms,4 Bathrooms,2 Balconies,"Store Room,Pooja Room,Servant Room","Sector 21A Faridabad, Gurgaon, Haryana",2 Floors,,5 to 10 Year Old,,"Hi, we have an independent house/villa availab...","['1 Water Purifier', '5 Fan', '1 Exhaust Fan',...","['Private Garden / Terrace', 'Park', 'Visitor ...",
2,10 Bedroom House for sale in Sushant Lok Phase 1,,2.1 Crore,"₹ 38,251/sq.ft.",(51 sq.m.) Plot Area,Plot area 61(51 sq.m.),10 Bedrooms,10 Bathrooms,3+ Balconies,Servant Room,"Sushant Lok Phase 1, Gurgaon, Haryana",5 Floors,West,0 to 1 Year Old,"['Sector 42-43 metro station', 'Huda city cent...","Monthly rental income is rs1,40,000/- Best opt...","['10 Bed', '3 Fan', '10 Geyser', '2 Light', 'N...","['Maintenance Staff', 'Water Storage', 'Visito...","['Environment5 out of 5', 'Lifestyle5 out of 5..."
3,21 Bedroom House for sale in Sector 54 Gurgaon,,5 Crore,"₹ 43,066/sq.ft.",(108 sq.m.) Plot Area,Plot area 129(107.86 sq.m.),21 Bedrooms,21 Bathrooms,3+ Balconies,Servant Room,"Sector 54 Gurgaon, Gurgaon, Haryana",5 Floors,North,1 to 5 Year Old,"['Sector 53-54 metro station', 'Sector 54 chow...","129 sq yd plot size. 5 floors built up , fully...","['1 Water Purifier', '21 Fan', '1 Fridge', '1 ...","['Feng Shui / Vaastu Compliant', 'Private Gard...","['Environment4 out of 5', 'Lifestyle5 out of 5..."
4,12 Bedroom House for sale in Sushant Lok Phase 1,,3 Crore,"₹ 53,763/sq.ft.",(52 sq.m.) Plot Area,Plot area 62(51.84 sq.m.),12 Bedrooms,12 Bathrooms,3+ Balconies,Others,"1228, Sushant Lok Phase 1, Gurgaon, Haryana",5 Floors,West,Within 6 months,"['Sector 42-43 metro station', 'Huda city cent...",Best for investment purpose. Fully furnished b...,"['1 Water Purifier', '1 Fridge', '12 Fan', '1 ...","['Maintenance Staff', 'Water Storage', 'Visito...","['Environment5 out of 5', 'Lifestyle5 out of 5..."


In [27]:
df.price.value_counts()

3.5 Crore           19
5.5 Crore           17
6.5 Crore           16
6 Crore             14
5 Crore             13
4.5 Crore           13
70 Lac              13
8 Crore             13
50 Lac              13
75 Lac              13
8.5 Crore           12
7 Crore             12
85 Lac              12
1.5 Crore           11
4 Crore             11
10 Crore            10
Price on Request    10
45 Lac              10
2.25 Crore          10
2.5 Crore           10
60 Lac              10
90 Lac              10
9 Crore             10
9.5 Crore            9
12 Crore             9
80 Lac               9
1.7 Crore            9
2 Crore              9
1.1 Crore            9
1 Crore              8
6.75 Crore           8
11 Crore             8
1.6 Crore            8
4.6 Crore            8
1.3 Crore            7
95 Lac               7
12.5 Crore           7
3.75 Crore           7
1.2 Crore            7
55 Lac               7
2.1 Crore            7
65 Lac               7
40 Lac               7
1.35 Crore 

In [32]:
df[(df.price == 'Price on Request')]

Unnamed: 0,property_name,society,price,rate,price_per_sqft,areaWithType,bedrooms,bathrooms,balconies,additional_room,address,num_floor,facing,age_possession,nearby_locations,description,furnish_details,features,rating
295,2 Bedroom House for sale in Sector 8 Gurgaon,,Price on Request,,(74 sq.m.) Built-up Area,Built Up area: 800 (74.32 sq.m.),2 Bedrooms,1 Bathroom,No Balcony,,"Sector 8 Gurgaon, Gurgaon, Haryana",1 Floors,,undefined,,"1 bath, semi-Furnished, at sector 8 location g...","['1 Light', 'No AC', 'No Bed', 'No Chimney', '...",,"['Environment4 out of 5', 'Lifestyle4 out of 5..."
296,3 Bedroom House for sale in Dharam Colony,,Price on Request,,(93 sq.m.) Carpet Area,Carpet area: 1000 (92.9 sq.m.),3 Bedrooms,2 Bathrooms,1 Balcony,,"Dharam Colony, Gurgaon, Haryana",2 Floors,,undefined,,"2 bath, unfurnished, at dharam colony location...",,,"['Environment4 out of 5', 'Lifestyle4 out of 5..."
325,5 Bedroom House for sale in Laxman Vihar,,Price on Request,,(167 sq.m.) Built-up Area,Built Up area: 1800 (167.23 sq.m.),5 Bedrooms,8 Bathrooms,3+ Balconies,,"Phase 2, Laxman Vihar, Gurgaon, Haryana",2 Floors,North,undefined,"['Chintapurni Mandir', 'Sheetla Mata Mandir', ...","8 bath, unfurnished, overlooking main road, no...",,,"['Environment4 out of 5', 'Lifestyle4 out of 5..."
326,3 Bedroom House for sale in Laxman Vihar,,Price on Request,,(223 sq.m.) Built-up Area,Built Up area: 2400 (222.97 sq.m.)Carpet area:...,3 Bedrooms,4 Bathrooms,2 Balconies,,"1248 B, Near Hanuman Mandir, Laxman Vihar, Gur...",2 Floors,,undefined,"['Chintapurni Mandir', 'Sheetla Mata Mandir', ...","4 bath, unfurnished, 1st floor (Of 2), 1 side ...",,,"['Environment4 out of 5', 'Lifestyle4 out of 5..."
402,7 Bedroom House for sale in Rajendra Park,,Price on Request,,(585 sq.m.) Built-up Area,Built Up area: 700 (585.29 sq.m.),7 Bedrooms,6 Bathrooms,3 Balconies,,"Rajendra Park, Gurgaon, Haryana",4 Floors,,5 to 10 Year Old,,"6 bath, furnished, 2 side open, at rajendra pa...","['1 Wardrobe', '1 Fan', '1 Light', 'No AC', 'N...",,"['Environment4 out of 5', 'Lifestyle4 out of 5..."
431,3 Bedroom House for sale in Ansal Plaza,,Price on Request,,(40 sq.m.) Carpet Area,Carpet area: 429 (39.86 sq.m.),3 Bedrooms,3 Bathrooms,3 Balconies,,"Ansal Plaza, Sector 23, Ansal Plaza, Gurgaon, ...",4 Floors,,undefined,,Best in class property available at ansal plaz...,,,"['Environment5 out of 5', 'Lifestyle5 out of 5..."
494,2 Bedroom House for sale in Sheetla Colony,,Price on Request,,(42 sq.m.) Plot Area,Plot area 50(41.81 sq.m.)Built Up area: 720 sq...,2 Bedrooms,2 Bathrooms,1 Balcony,,"Sheetla Colony, Gurgaon, Haryana",2 Floors,,undefined,,"2 bath, semi-Furnished, at sheetla colony loca...","['1 Light', 'No AC', 'No Bed', 'No Chimney', '...",,"['Environment3 out of 5', 'Lifestyle3 out of 5..."
569,5 Bedroom House for sale in Surat Nagar,,Price on Request,,(54 sq.m.) Built-up Area,Built Up area: 65 (54.35 sq.m.),5 Bedrooms,2 Bathrooms,No Balcony,,"Surat Nagar Phase 2, Sector 104, Surat Nagar, ...",2 Floors,,undefined,,5bhk residential house for resale in surat nag...,,,"['Environment3 out of 5', 'Lifestyle3 out of 5..."
595,2 Bedroom House for sale in Dharam Colony Block E,,Price on Request,,(84 sq.m.) Built-up Area,Built Up area: 900 (83.61 sq.m.),2 Bedrooms,1 Bathroom,No Balcony,,"Dharam Colony Block E, Gurgaon, Haryana",1 Floors,,undefined,"['Palam triangle', 'Palam Vihar Vyapar kendra'...","1 bath, unfurnished, ground floor (Of 1), at d...",,,
668,4 Bedroom House for sale in Madanpuri,,Price on Request,,(167 sq.m.) Carpet Area,Carpet area: 1800 (167.23 sq.m.),4 Bedrooms,2 Bathrooms,1 Balcony,,"Madanpuri, Gurgaon, Haryana",2 Floors,,undefined,,"2 bath, unfurnished, 1 side open, at madan pur...",,,"['Environment4 out of 5', 'Lifestyle4 out of 5..."


In [33]:
# remove all the rows in which the price is not mentioned
df = df[df.price != 'Price on Request']

In [36]:
def treat_price(x):
    """
    this function converts the price value into crores
    """
    if type(x) == float:
        return x
    else:
        if x[1] == 'Lac':
            return round(float(x[0])/100, 2)
        else:
            return round(float(x[0]), 2)

In [37]:
# apply the helper function to the price column
df.price = df.price.str.split(' ').apply(treat_price)
df.sample(10)

Unnamed: 0,property_name,society,price,rate,price_per_sqft,areaWithType,bedrooms,bathrooms,balconies,additional_room,address,num_floor,facing,age_possession,nearby_locations,description,furnish_details,features,rating
1050,9 Bedroom House for sale in Sector 38 Gurgaon,sector 38 rwa,4.3,"₹ 28,782/sq.ft.",(139 sq.m.) Plot Area,Plot area 166(138.8 sq.m.)Built Up area: 165 s...,9 Bedrooms,9 Bathrooms,3+ Balconies,"Pooja Room,Others","166 Sq Yd, Stilt,lift,demand At 4.30 Cr, Secto...",3 Floors,East,1 to 5 Year Old,"['Rajiv Chowk Mosque', 'Icici bank ATM', 'Stat...",This is a residential house for sale in sector...,"['14 Wardrobe', '1 Water Purifier', '14 Fan', ...","['Feng Shui / Vaastu Compliant', 'Private Gard...","['Environment4 out of 5', 'Safety4 out of 5', ..."
756,4 Bedroom House for sale in DLF Phase 2,dlf city plots phase 2,10.5,"₹ 261,194/sq.ft.",(37 sq.m.) Plot Area,Plot area 402(37.35 sq.m.),4 Bedrooms,4 Bathrooms,2 Balconies,"Pooja Room,Servant Room","Lmn108, DLF Phase 2, Gurgaon, Haryana",2 Floors,East,10+ Year Old,"['Vodafone belvedere towers metro station', 'D...",It's an old house which is built on 402 sqyard...,"['7 Fan', '1 Exhaust Fan', '4 Geyser', '22 Lig...","['Feng Shui / Vaastu Compliant', 'Private Gard...","['Environment5 out of 5', 'Lifestyle5 out of 5..."
891,3 Bedroom House for sale in Sector 4 Gurgaon,,3.2,"₹ 14,222/sq.ft.",(209 sq.m.) Plot Area,Plot area 250(209.03 sq.m.),3 Bedrooms,3 Bathrooms,2 Balconies,,"Sector 4 Gurgaon, Gurgaon, Haryana",2 Floors,,10+ Year Old,"['Chintapurni Mandir', 'State bank ATM', 'Kr D...",Its a 250 sq yrds property located on main 18 ...,"['4 Fan', '13 Light', 'No AC', 'No Bed', 'No C...","['Maintenance Staff', 'Water Storage']","['Environment5 out of 5', 'Safety5 out of 5', ..."
282,36 Bedroom House for sale in West Rajiv Nagar,,2.25,"₹ 6,944/sq.ft.",(301 sq.m.) Plot Area,Plot area 360(301.01 sq.m.),36 Bedrooms,36 Bathrooms,2 Balconies,Servant Room,"1622, West Rajiv Nagar, Gurgaon, Haryana",3 Floors,East,5 to 10 Year Old,"['Sheetla Mata Mandir', 'Hanuman Mandir', 'Nid...",This property is having 36 rooms with attached...,[],['Water Storage'],"['Environment3 out of 5', 'Lifestyle4 out of 5..."
786,5 Bedroom House for sale in Sector 33 Gurgaon,unitech uniworld resorts,,,(435 sq.m.) Plot Area,Plot area 520(434.79 sq.m.),5 Bedrooms,8 Bathrooms,3+ Balconies,"Servant Room,Store Room","A-898, Sector 33 Gurgaon, Gurgaon, Haryana",4 Floors,West,1 to 5 Year Old,"['Rajiv Chowk Mosque', 'Icici bank ATM', 'Stan...",5 bhk 520 sqyd villas available at unitech uni...,"['5 Wardrobe', '15 Fan', '1 Exhaust Fan', '5 G...","['Private Garden / Terrace', 'High Ceiling Hei...","['Environment3 out of 5', 'Lifestyle4 out of 5..."
177,4 Bedroom House for sale in Sector 109 Gurgaon,international city by sobha phase 1,5.7,"₹ 10,556/sq.ft.",(502 sq.m.) Plot Area,Plot area 600(501.68 sq.m.),4 Bedrooms,4 Bathrooms,3+ Balconies,"Study Room,Servant Room","Phase2, Sector 109 Gurgaon, Gurgaon, Haryana",4 Floors,East,1 to 5 Year Old,"['Dwarka sector 21 metro station', 'Pacific D2...",Villa for rent / sale ecellent locatin\n Addit...,"['6 Fan', '6 Light', '1 Modular Kitchen', 'No ...","['Private Garden / Terrace', 'High Ceiling Hei...","['Environment5 out of 5', 'Lifestyle4 out of 5..."
972,9 Bedroom House for sale in C Block Sushant Lo...,,5.3,"₹ 27,390/sq.ft.",(180 sq.m.) Plot Area,Plot area 215(179.77 sq.m.),9 Bedrooms,9 Bathrooms,3+ Balconies,Servant Room,"C Block, C Block Sushant Lok Phase 1, Gurgaon,...",3 Floors,East,5 to 10 Year Old,"['Sector 42-43 metro station', 'Huda city cent...",This property is available at c block with eas...,"['9 Wardrobe', '15 Fan', '1 Exhaust Fan', '12 ...","['Feng Shui / Vaastu Compliant', 'Private Gard...","['Environment4 out of 5', 'Safety4 out of 5', ..."
86,5 Bedroom House for sale in Sector 66 Gurgaon,emaar mgf marbella,,"₹ 19,708/sq.ft.",(606 sq.m.) Built-up Area,,,,,,"Sector 66 Gurgaon, Gurgaon, Haryana",,,,"['Sector 55-56 Rapid Metro Station', 'HUB 66',...","Emaar mgf marbella in sector-66, gurgaon by em...",,,"['Environment3 out of 5', 'Lifestyle4 out of 5..."
1003,12 Bedroom House for sale in Uppals Southend,uppal southend,6.75,"₹ 290,948/sq.ft.",(22 sq.m.) Plot Area,Plot area 232(21.55 sq.m.),12 Bedrooms,12 Bathrooms,3+ Balconies,"Pooja Room,Study Room,Servant Room,Others","Uppals Southend, Gurgaon, Haryana",,West,5 to 10 Year Old,"['Sri Radhe Krishna Temple', 'Icici bank ATM',...",Address... Uppal southend sector 49 s block si...,"['22 Wardrobe', '24 Fan', '1 Exhaust Fan', '33...","['Feng Shui / Vaastu Compliant', 'Private Gard...","['Environment5 out of 5', 'Safety5 out of 5', ..."
621,3 Bedroom House for sale in Ashok Vihar,,0.9,"₹ 10,000/sq.ft.",(84 sq.m.) Plot Area,Plot area 900(83.61 sq.m.)Built Up area: 3500 ...,3 Bedrooms,4 Bathrooms,3 Balconies,Others,"Phase 3 Extn., Ashok Vihar, Gurgaon, Haryana",3 Floors,,5 to 10 Year Old,"['Palam Vihar Vyapar kendra', 'Palam triangle'...",L shape plot. Commercial cum residential const...,"['1 Bed', '5 Wardrobe', '1 Water Purifier', '4...","['Feng Shui / Vaastu Compliant', 'Water Storag...","['Environment4 out of 5', 'Lifestyle4 out of 5..."


In [38]:
# rename the columns so that they are consistent with the flats dataset
df.rename(columns={'price_per_sqft':'area_type', 'rate':'price_per_sqft'}, inplace=True)
df.head()

Unnamed: 0,property_name,society,price,price_per_sqft,area_type,areaWithType,bedrooms,bathrooms,balconies,additional_room,address,num_floor,facing,age_possession,nearby_locations,description,furnish_details,features,rating
0,5 Bedroom House for sale in Sector 70A Gurgaon,bptp visionnaire,5.25,"₹ 20,115/sq.ft.",(242 sq.m.) Plot Area,Plot area 290(242.48 sq.m.),5 Bedrooms,4 Bathrooms,3+ Balconies,Servant Room,"29b, Sector 70A Gurgaon, Gurgaon, Haryana",3 Floors,North-East,0 to 1 Year Old,"['Good Earth City Center 2', 'Kunskapsskolan I...",Do you wish to buy an independent house in sec...,"['1 Wardrobe', '1 Fan', '1 Exhaust Fan', '1 Ge...","['Feng Shui / Vaastu Compliant', 'Private Gard...","['Environment5 out of 5', 'Lifestyle4 out of 5..."
1,5 Bedroom House for sale in Sector 21A Faridabad,,5.7,"₹ 105,751/sq.ft.",(50 sq.m.) Plot Area,Plot area 539(50.07 sq.m.),5 Bedrooms,4 Bathrooms,2 Balconies,"Store Room,Pooja Room,Servant Room","Sector 21A Faridabad, Gurgaon, Haryana",2 Floors,,5 to 10 Year Old,,"Hi, we have an independent house/villa availab...","['1 Water Purifier', '5 Fan', '1 Exhaust Fan',...","['Private Garden / Terrace', 'Park', 'Visitor ...",
2,10 Bedroom House for sale in Sushant Lok Phase 1,,2.1,"₹ 38,251/sq.ft.",(51 sq.m.) Plot Area,Plot area 61(51 sq.m.),10 Bedrooms,10 Bathrooms,3+ Balconies,Servant Room,"Sushant Lok Phase 1, Gurgaon, Haryana",5 Floors,West,0 to 1 Year Old,"['Sector 42-43 metro station', 'Huda city cent...","Monthly rental income is rs1,40,000/- Best opt...","['10 Bed', '3 Fan', '10 Geyser', '2 Light', 'N...","['Maintenance Staff', 'Water Storage', 'Visito...","['Environment5 out of 5', 'Lifestyle5 out of 5..."
3,21 Bedroom House for sale in Sector 54 Gurgaon,,5.0,"₹ 43,066/sq.ft.",(108 sq.m.) Plot Area,Plot area 129(107.86 sq.m.),21 Bedrooms,21 Bathrooms,3+ Balconies,Servant Room,"Sector 54 Gurgaon, Gurgaon, Haryana",5 Floors,North,1 to 5 Year Old,"['Sector 53-54 metro station', 'Sector 54 chow...","129 sq yd plot size. 5 floors built up , fully...","['1 Water Purifier', '21 Fan', '1 Fridge', '1 ...","['Feng Shui / Vaastu Compliant', 'Private Gard...","['Environment4 out of 5', 'Lifestyle5 out of 5..."
4,12 Bedroom House for sale in Sushant Lok Phase 1,,3.0,"₹ 53,763/sq.ft.",(52 sq.m.) Plot Area,Plot area 62(51.84 sq.m.),12 Bedrooms,12 Bathrooms,3+ Balconies,Others,"1228, Sushant Lok Phase 1, Gurgaon, Haryana",5 Floors,West,Within 6 months,"['Sector 42-43 metro station', 'Huda city cent...",Best for investment purpose. Fully furnished b...,"['1 Water Purifier', '1 Fridge', '12 Fan', '1 ...","['Maintenance Staff', 'Water Storage', 'Visito...","['Environment5 out of 5', 'Lifestyle5 out of 5..."


In [40]:
df.price_per_sqft.value_counts().head(5)

₹ 22,222/sq.ft.    14
₹ 11,111/sq.ft.    12
₹ 33,333/sq.ft.    11
₹ 10,000/sq.ft.    10
₹ 13,333/sq.ft.     7
Name: price_per_sqft, dtype: int64

In [41]:
# extract the float value of price per sqft
df.price_per_sqft = df.price_per_sqft.str.split('/').str.get(0).str.replace('₹','').str.replace(',','').str.strip().astype(float)
df.sample(5)

Unnamed: 0,property_name,society,price,price_per_sqft,area_type,areaWithType,bedrooms,bathrooms,balconies,additional_room,address,num_floor,facing,age_possession,nearby_locations,description,furnish_details,features,rating
17,7 Bedroom House for sale in Sector 38 Gurgaon,,2.1,23333.0,(84 sq.m.) Plot Area,Plot area 100(83.61 sq.m.),7 Bedrooms,7 Bathrooms,3+ Balconies,"Store Room,Pooja Room,Study Room","Sector 38 Gurgaon, Gurgaon, Haryana",3 Floors,North-East,1 to 5 Year Old,"['Rajiv Chowk Mosque', 'Icici bank ATM', 'Stat...",Stilt plus 3 floors. 4 year old construction. ...,,"['High Ceiling Height', 'Maintenance Staff', '...","['Environment4 out of 5', 'Lifestyle4 out of 5..."
1018,8 Bedroom House for sale in Sector 17 Gurgaon,,9.5,23457.0,(420 sq.m.) Plot Area,Plot area 502(419.74 sq.m.)Built Up area: 500 ...,8 Bedrooms,8 Bathrooms,3 Balconies,Study Room,"Sector 17 Gurgaon, Gurgaon, Haryana",3 Floors,West,1 to 5 Year Old,"['Iffco chowk metro station', 'Citi bank ATM',...","House for sale plot size 502 sqyard 8 bedroom,...","['8 Wardrobe', '12 Fan', '1 Exhaust Fan', '8 G...","['Maintenance Staff', 'Water Storage', 'Visito...","['Environment5 out of 5', 'Safety5 out of 5', ..."
275,1 Bedroom House for sale in Ashok Vihar Phase ...,,0.85,8500.0,(93 sq.m.) Built-up Area,Built Up area: 1000 (92.9 sq.m.),1 Bedroom,1 Bathroom,No Balcony,,"Ashok Vihar Phase 3, Block B, Ashok Vihar Phas...",1 Floors,,undefined,"['Palam Vihar Vyapar kendra', 'Palam triangle'...",Best 6 bhk independent house for modern-Day li...,,,"['Environment3 out of 5', 'Lifestyle4 out of 5..."
1021,5 Bedroom House for sale in Sector 106 Gurgaon,godrej meridien,5.6,14000.0,(372 sq.m.) Plot Area,Plot area 4000(371.61 sq.m.),5 Bedrooms,4 Bathrooms,3+ Balconies,"Pooja Room,Study Room,Servant Room,Store Room","Aa1, Sector 106 Gurgaon, Gurgaon, Haryana",33 Floors,North-East,Within 6 months,"['Huda metro station', 'Gurgaon Dreamz Mall', ...",Sector 106 gurgaon is one of gurgaon's most so...,"['1 Wardrobe', '1 Fan', '1 Geyser', '1 Light',...","['Centrally Air Conditioned', 'Water purifier'...",
216,5 Bedroom House for sale in Sohna Road,prem kunj,0.5,7407.0,(63 sq.m.) Plot Area,Plot area 675(62.71 sq.m.)Built Up area: 725 s...,5 Bedrooms,4 Bathrooms,3 Balconies,Pooja Room,"Opp.Kiit College, Sohna Road, Gurgaon, Haryana",3 Floors,South-West,1 to 5 Year Old,"['Rajiv Chowk Mosque', 'Standard chartered ATM...",Seprated entry from road.Locked colony by gate...,,"['Water Storage', 'Park', 'Bank Attached Prope...",


In [42]:
df.bedrooms.isnull().sum()

100

In [43]:
df[df.bedrooms.isnull()]

Unnamed: 0,property_name,society,price,price_per_sqft,area_type,areaWithType,bedrooms,bathrooms,balconies,additional_room,address,num_floor,facing,age_possession,nearby_locations,description,furnish_details,features,rating
60,4 Bedroom House for sale in Sector 86 Gurgaon,dlf new town heights,,7718.0,(297 sq.m.) Plot Area,,,,,,,,,,,,,,
61,8 Bedroom House for sale in B1 Block Sector 57...,,,25535.0,(135 sq.m.) Plot Area,,,,,,,,,,,,,,
62,6 Bedroom House for sale in DLF Phase 1,,,1859.0,(420 sq.m.) Plot Area,,,,,,,,,,,,,,
63,6 Bedroom House for sale in Sushant Lok Phase 3,ansal sushant residency,,17037.0,(251 sq.m.) Plot Area,,,,,,,,,,,,,,
64,6 Bedroom House for sale in Sushant Lok Phase 3,ansals florence villa,,10579.0,(321 sq.m.) Plot Area,,,,,,,,,,,,,,
65,4 Bedroom House for sale in DLF Phase 4,,,42194.0,(264 sq.m.) Plot Area,,,,,,,,,,,,,,
66,8 Bedroom House for sale in Uppals Southend,,,15625.0,(268 sq.m.) Plot Area,,,,,,,,,,,,,,
67,6 Bedroom House for sale in Uppals Southend,uppal southend,,15278.0,(268 sq.m.) Plot Area,,,,,,,,,,,,,,
68,4 Bedroom House for sale in Sector 48 Gurgaon,vipul tatvam villa,,201388.0,(33 sq.m.) Plot Area,,,,,,,,,,,,,,
69,4 Bedroom House for sale in Malibu Town,,,17187.0,(54 sq.m.) Plot Area,,,,,,,,,,,,,,


In [44]:
# as the rows containing null values in bedroom have null in other columns too, drop them
df = df[~df.bedrooms.isnull()]

In [45]:
# extract the integer value from bedrooms
df.bedrooms = df.bedrooms.str.split(' ').str.get(0).astype('int')
df.head()

Unnamed: 0,property_name,society,price,price_per_sqft,area_type,areaWithType,bedrooms,bathrooms,balconies,additional_room,address,num_floor,facing,age_possession,nearby_locations,description,furnish_details,features,rating
0,5 Bedroom House for sale in Sector 70A Gurgaon,bptp visionnaire,5.25,20115.0,(242 sq.m.) Plot Area,Plot area 290(242.48 sq.m.),5,4 Bathrooms,3+ Balconies,Servant Room,"29b, Sector 70A Gurgaon, Gurgaon, Haryana",3 Floors,North-East,0 to 1 Year Old,"['Good Earth City Center 2', 'Kunskapsskolan I...",Do you wish to buy an independent house in sec...,"['1 Wardrobe', '1 Fan', '1 Exhaust Fan', '1 Ge...","['Feng Shui / Vaastu Compliant', 'Private Gard...","['Environment5 out of 5', 'Lifestyle4 out of 5..."
1,5 Bedroom House for sale in Sector 21A Faridabad,,5.7,105751.0,(50 sq.m.) Plot Area,Plot area 539(50.07 sq.m.),5,4 Bathrooms,2 Balconies,"Store Room,Pooja Room,Servant Room","Sector 21A Faridabad, Gurgaon, Haryana",2 Floors,,5 to 10 Year Old,,"Hi, we have an independent house/villa availab...","['1 Water Purifier', '5 Fan', '1 Exhaust Fan',...","['Private Garden / Terrace', 'Park', 'Visitor ...",
2,10 Bedroom House for sale in Sushant Lok Phase 1,,2.1,38251.0,(51 sq.m.) Plot Area,Plot area 61(51 sq.m.),10,10 Bathrooms,3+ Balconies,Servant Room,"Sushant Lok Phase 1, Gurgaon, Haryana",5 Floors,West,0 to 1 Year Old,"['Sector 42-43 metro station', 'Huda city cent...","Monthly rental income is rs1,40,000/- Best opt...","['10 Bed', '3 Fan', '10 Geyser', '2 Light', 'N...","['Maintenance Staff', 'Water Storage', 'Visito...","['Environment5 out of 5', 'Lifestyle5 out of 5..."
3,21 Bedroom House for sale in Sector 54 Gurgaon,,5.0,43066.0,(108 sq.m.) Plot Area,Plot area 129(107.86 sq.m.),21,21 Bathrooms,3+ Balconies,Servant Room,"Sector 54 Gurgaon, Gurgaon, Haryana",5 Floors,North,1 to 5 Year Old,"['Sector 53-54 metro station', 'Sector 54 chow...","129 sq yd plot size. 5 floors built up , fully...","['1 Water Purifier', '21 Fan', '1 Fridge', '1 ...","['Feng Shui / Vaastu Compliant', 'Private Gard...","['Environment4 out of 5', 'Lifestyle5 out of 5..."
4,12 Bedroom House for sale in Sushant Lok Phase 1,,3.0,53763.0,(52 sq.m.) Plot Area,Plot area 62(51.84 sq.m.),12,12 Bathrooms,3+ Balconies,Others,"1228, Sushant Lok Phase 1, Gurgaon, Haryana",5 Floors,West,Within 6 months,"['Sector 42-43 metro station', 'Huda city cent...",Best for investment purpose. Fully furnished b...,"['1 Water Purifier', '1 Fridge', '12 Fan', '1 ...","['Maintenance Staff', 'Water Storage', 'Visito...","['Environment5 out of 5', 'Lifestyle5 out of 5..."


In [46]:
df.balconies.value_counts()

3+ Balconies    365
2 Balconies     220
3 Balconies     159
No Balcony      115
1 Balcony       105
Name: balconies, dtype: int64

In [47]:
# extract the integer values from bathrooms and balconies columns
df.bathrooms = df.bathrooms.str.split(' ').str.get(0).astype('int')
df.balconies = df.balconies.str.split(' ').str.get(0).str.replace('No', '0')
df.head()

Unnamed: 0,property_name,society,price,price_per_sqft,area_type,areaWithType,bedrooms,bathrooms,balconies,additional_room,address,num_floor,facing,age_possession,nearby_locations,description,furnish_details,features,rating
0,5 Bedroom House for sale in Sector 70A Gurgaon,bptp visionnaire,5.25,20115.0,(242 sq.m.) Plot Area,Plot area 290(242.48 sq.m.),5,4,3+,Servant Room,"29b, Sector 70A Gurgaon, Gurgaon, Haryana",3 Floors,North-East,0 to 1 Year Old,"['Good Earth City Center 2', 'Kunskapsskolan I...",Do you wish to buy an independent house in sec...,"['1 Wardrobe', '1 Fan', '1 Exhaust Fan', '1 Ge...","['Feng Shui / Vaastu Compliant', 'Private Gard...","['Environment5 out of 5', 'Lifestyle4 out of 5..."
1,5 Bedroom House for sale in Sector 21A Faridabad,,5.7,105751.0,(50 sq.m.) Plot Area,Plot area 539(50.07 sq.m.),5,4,2,"Store Room,Pooja Room,Servant Room","Sector 21A Faridabad, Gurgaon, Haryana",2 Floors,,5 to 10 Year Old,,"Hi, we have an independent house/villa availab...","['1 Water Purifier', '5 Fan', '1 Exhaust Fan',...","['Private Garden / Terrace', 'Park', 'Visitor ...",
2,10 Bedroom House for sale in Sushant Lok Phase 1,,2.1,38251.0,(51 sq.m.) Plot Area,Plot area 61(51 sq.m.),10,10,3+,Servant Room,"Sushant Lok Phase 1, Gurgaon, Haryana",5 Floors,West,0 to 1 Year Old,"['Sector 42-43 metro station', 'Huda city cent...","Monthly rental income is rs1,40,000/- Best opt...","['10 Bed', '3 Fan', '10 Geyser', '2 Light', 'N...","['Maintenance Staff', 'Water Storage', 'Visito...","['Environment5 out of 5', 'Lifestyle5 out of 5..."
3,21 Bedroom House for sale in Sector 54 Gurgaon,,5.0,43066.0,(108 sq.m.) Plot Area,Plot area 129(107.86 sq.m.),21,21,3+,Servant Room,"Sector 54 Gurgaon, Gurgaon, Haryana",5 Floors,North,1 to 5 Year Old,"['Sector 53-54 metro station', 'Sector 54 chow...","129 sq yd plot size. 5 floors built up , fully...","['1 Water Purifier', '21 Fan', '1 Fridge', '1 ...","['Feng Shui / Vaastu Compliant', 'Private Gard...","['Environment4 out of 5', 'Lifestyle5 out of 5..."
4,12 Bedroom House for sale in Sushant Lok Phase 1,,3.0,53763.0,(52 sq.m.) Plot Area,Plot area 62(51.84 sq.m.),12,12,3+,Others,"1228, Sushant Lok Phase 1, Gurgaon, Haryana",5 Floors,West,Within 6 months,"['Sector 42-43 metro station', 'Huda city cent...",Best for investment purpose. Fully furnished b...,"['1 Water Purifier', '1 Fridge', '12 Fan', '1 ...","['Maintenance Staff', 'Water Storage', 'Visito...","['Environment5 out of 5', 'Lifestyle5 out of 5..."


In [48]:
df.additional_room.value_counts()

Servant Room                                     81
Pooja Room,Study Room,Servant Room,Store Room    60
Others                                           58
Pooja Room                                       38
Pooja Room,Study Room,Servant Room               33
Pooja Room,Study Room,Servant Room,Others        32
Store Room                                       31
Pooja Room,Servant Room                          24
Study Room                                       19
Study Room,Servant Room                          19
Servant Room,Store Room                          15
Pooja Room,Study Room                            11
Pooja Room,Store Room                            11
Pooja Room,Others                                11
Servant Room,Pooja Room                           8
Servant Room,Others                               8
Pooja Room,Store Room,Study Room,Servant Room     8
Pooja Room,Servant Room,Store Room                7
Store Room,Servant Room                           6
Study Room,S

In [49]:
df.additional_room.isnull().sum()

386

In [50]:
# fill the null values in the additional_room column
df.additional_room.fillna('not available', inplace=True)
df.additional_room = df.additional_room.str.lower()
df.head()

Unnamed: 0,property_name,society,price,price_per_sqft,area_type,areaWithType,bedrooms,bathrooms,balconies,additional_room,address,num_floor,facing,age_possession,nearby_locations,description,furnish_details,features,rating
0,5 Bedroom House for sale in Sector 70A Gurgaon,bptp visionnaire,5.25,20115.0,(242 sq.m.) Plot Area,Plot area 290(242.48 sq.m.),5,4,3+,servant room,"29b, Sector 70A Gurgaon, Gurgaon, Haryana",3 Floors,North-East,0 to 1 Year Old,"['Good Earth City Center 2', 'Kunskapsskolan I...",Do you wish to buy an independent house in sec...,"['1 Wardrobe', '1 Fan', '1 Exhaust Fan', '1 Ge...","['Feng Shui / Vaastu Compliant', 'Private Gard...","['Environment5 out of 5', 'Lifestyle4 out of 5..."
1,5 Bedroom House for sale in Sector 21A Faridabad,,5.7,105751.0,(50 sq.m.) Plot Area,Plot area 539(50.07 sq.m.),5,4,2,"store room,pooja room,servant room","Sector 21A Faridabad, Gurgaon, Haryana",2 Floors,,5 to 10 Year Old,,"Hi, we have an independent house/villa availab...","['1 Water Purifier', '5 Fan', '1 Exhaust Fan',...","['Private Garden / Terrace', 'Park', 'Visitor ...",
2,10 Bedroom House for sale in Sushant Lok Phase 1,,2.1,38251.0,(51 sq.m.) Plot Area,Plot area 61(51 sq.m.),10,10,3+,servant room,"Sushant Lok Phase 1, Gurgaon, Haryana",5 Floors,West,0 to 1 Year Old,"['Sector 42-43 metro station', 'Huda city cent...","Monthly rental income is rs1,40,000/- Best opt...","['10 Bed', '3 Fan', '10 Geyser', '2 Light', 'N...","['Maintenance Staff', 'Water Storage', 'Visito...","['Environment5 out of 5', 'Lifestyle5 out of 5..."
3,21 Bedroom House for sale in Sector 54 Gurgaon,,5.0,43066.0,(108 sq.m.) Plot Area,Plot area 129(107.86 sq.m.),21,21,3+,servant room,"Sector 54 Gurgaon, Gurgaon, Haryana",5 Floors,North,1 to 5 Year Old,"['Sector 53-54 metro station', 'Sector 54 chow...","129 sq yd plot size. 5 floors built up , fully...","['1 Water Purifier', '21 Fan', '1 Fridge', '1 ...","['Feng Shui / Vaastu Compliant', 'Private Gard...","['Environment4 out of 5', 'Lifestyle5 out of 5..."
4,12 Bedroom House for sale in Sushant Lok Phase 1,,3.0,53763.0,(52 sq.m.) Plot Area,Plot area 62(51.84 sq.m.),12,12,3+,others,"1228, Sushant Lok Phase 1, Gurgaon, Haryana",5 Floors,West,Within 6 months,"['Sector 42-43 metro station', 'Huda city cent...",Best for investment purpose. Fully furnished b...,"['1 Water Purifier', '1 Fridge', '12 Fan', '1 ...","['Maintenance Staff', 'Water Storage', 'Visito...","['Environment5 out of 5', 'Lifestyle5 out of 5..."


In [52]:
# rename the num floor column
df.rename(columns={'num_floor':'floor_num'}, inplace=True)
df.floor_num.value_counts()

3 Floors     304
2 Floors     288
1 Floors     181
4 Floors     136
5 Floors       9
0 Floors       6
14 Floors      3
6 Floors       3
11 Floors      2
12 Floors      2
10 Floors      2
16 Floors      1
51 Floors      1
41 Floors      1
27 Floors      1
20 Floors      1
13 Floors      1
21 Floors      1
02 Floors      1
33 Floors      1
Name: floor_num, dtype: int64

In [53]:
df[df.floor_num.isnull()]

Unnamed: 0,property_name,society,price,price_per_sqft,area_type,areaWithType,bedrooms,bathrooms,balconies,additional_room,address,floor_num,facing,age_possession,nearby_locations,description,furnish_details,features,rating
23,4 Bedroom House for sale in Sector 48 Gurgaon,vipul tatvam villa,8.5,26235.0,(301 sq.m.) Plot Area,Plot area 360(301.01 sq.m.),4,4,2,"pooja room,servant room,store room","Sector 48 Gurgaon, Gurgaon, Haryana",,East,5 to 10 Year Old,"['Athena', 'Star Mall', 'The Sixth Element Sch...",Three side open villa in tatvam villa sector-4...,"['1 Chimney', '1 Modular Kitchen', 'No AC', 'N...","['Feng Shui / Vaastu Compliant', 'Private Gard...","['Environment4 out of 5', 'Lifestyle4 out of 5..."
51,8 Bedroom House for sale in Palam Vihar,,5.6,17284.0,(301 sq.m.) Plot Area,Plot area 360(301.01 sq.m.),8,6,3+,"pooja room,study room,servant room,store room","Palam Vihar, Gurgaon, Haryana",,South-West,5 to 10 Year Old,"['Palam Vihar Vyapar kendra', 'Palam triangle'...",360 sq. Yards plot area near by global foyer m...,"['1 Fan', '1 Dining Table', '1 Light', '1 Modu...",,"['Environment5 out of 5', 'Lifestyle5 out of 5..."
203,3 Bedroom House for sale in DLF Phase 3,,1.45,26852.0,(50 sq.m.) Plot Area,Plot area 60(50.17 sq.m.),3,3,1,not available,"DLF Phase 3, Gurgaon, Haryana",,,10+ Year Old,"['Dlf phase 3 metro station', 'Micromax moulsa...",Interested to sell independent house/villa.Pla...,,['Private Garden / Terrace'],"['Environment4 out of 5', 'Lifestyle5 out of 5..."
252,3 Bedroom House for sale in Ashok Vihar,,1.5,10288.0,(135 sq.m.) Plot Area,Plot area 162(135.45 sq.m.)Built Up area: 210 ...,3,3,0,not available,"800 Lane 8 Ashok Vihar Part 1, Ashok Vihar, Gu...",,,10+ Year Old,"['Chintapurni Mandir', 'Sheetla Mata Mandir', ...",Ground floor and partial first floor built up,[],,"['Environment4 out of 5', 'Lifestyle4 out of 5..."
270,2 Bedroom House for sale in Laxman Vihar Phase 2,,4.12,8889.0,(431 sq.m.) Plot Area,Plot area 515(430.61 sq.m.),2,1,3+,not available,"Laxman Vihar Phase 2, Gurgaon, Haryana",,,5 to 10 Year Old,"['Chintapurni Mandir', 'State bank ATM', 'Shre...","Property next to dhanwapur underpass, which is...",[],,
281,3 Bedroom House for sale in New Palam Vihar Ph...,,2.5,5472.0,(372 sq.m.) Plot Area,Plot area 4000(371.61 sq.m.),3,2,1,not available,"B-245, New Palam Vihar Phase 2, Gurgaon, Haryana",,,10+ Year Old,"['Palam Vihar Vyapar kendra', 'Palam triangle'...",100 mtr from dwarka express way. On 40ft road,,['Park'],
374,4 Bedroom House for sale in Laxman Vihar,,0.65,11111.0,(54 sq.m.) Plot Area,Plot area 65(54.35 sq.m.),4,2,2,not available,"Laxman Vihar, Gurgaon, Haryana",,,5 to 10 Year Old,"['Chintapurni Mandir', 'Sheetla Mata Mandir', ...",Well maintained two storeyed independent house...,"['1 Wardrobe', '1 Exhaust Fan', '10 Light', '1...",,"['Environment4 out of 5', 'Lifestyle4 out of 5..."
397,1 Bedroom House for sale in Sushant Lok Phase 1,ansal sushant lok plots,3.3,26570.0,(115 sq.m.) Plot Area,Plot area 138(115.39 sq.m.),1,1,0,not available,"Sushant Lok Phase 1, Gurgaon, Haryana",,,By 2027,"['Iffco chowk metro station', 'Huda city centr...","Close proximity to gold souk , huda city centr...",,,"['Environment5 out of 5', 'Lifestyle5 out of 5..."
417,2 Bedroom House for sale in Bhawani Enclave,,1.1,73333.0,(14 sq.m.) Plot Area,Plot area 150(13.94 sq.m.),2,2,1,others,"Bhawani Enclave, Gurgaon, Haryana",,,10+ Year Old,"['State bank ATM', 'Shri Multispeciality Hospi...","2 side open, 1 drawing room, 1 shop, 1 small r...","['1 Wardrobe', '1 Fan', '1 Light', 'No AC', 'N...",,
560,2 Bedroom House for sale in Jacobpura,jacob pura,0.35,9722.0,(33 sq.m.) Built-up Area,Built Up area: 360 (33.45 sq.m.),2,1,0,not available,"15/3, Jacobpura, Jacobpura, Gurgaon, Haryana",,,10+ Year Old,,Independece house for sale in jacobpura near k...,[],,"['Environment3 out of 5', 'Lifestyle4 out of 5..."


In [54]:
# extract the number value from the floor_num column
df.floor_num = df.floor_num.str.split(' ').str.get(0)
df.sample(10)

Unnamed: 0,property_name,society,price,price_per_sqft,area_type,areaWithType,bedrooms,bathrooms,balconies,additional_room,address,floor_num,facing,age_possession,nearby_locations,description,furnish_details,features,rating
601,1 Bedroom House for sale in C Block Sushant Lo...,,3.35,26973.0,(115 sq.m.) Plot Area,Plot area 138(115.39 sq.m.),1,1,0,not available,"C Block Sushant Lok Phase 1, Gurgaon, Haryana",1,East,10+ Year Old,"['Sector 42-43 metro station', 'Huda city cent...","6-7 min walk to huda metro station, \n5 mins w...",,['Private Garden / Terrace'],"['Environment4 out of 5', 'Lifestyle4 out of 5..."
121,4 Bedroom House for sale in Nirvana Country,,10.45,38703.0,(251 sq.m.) Plot Area,Plot area 2700(250.84 sq.m.)Built Up area: 400...,4,5,2,"servant room,study room,pooja room","Espace Nirvana Country Gurgaon, Nirvana Countr...",3,North,5 to 10 Year Old,"['Radhakrishna Shani Mandir', 'Sri Radhe Krish...",4 bhk park facing prime location villa in \nNi...,"['8 Fan', '5 Geyser', '14 Light', '1 Modular K...","['Security / Fire Alarm', 'Feng Shui / Vaastu ...","['Environment5 out of 5', 'Lifestyle5 out of 5..."
126,3 Bedroom House for sale in Laxman Vihar Phase 2,,0.67,8557.0,(73 sq.m.) Plot Area,Plot area 87(72.74 sq.m.),3,2,1,"pooja room,others","Laxman Vihar Phase 2, Gurgaon, Haryana",1,South,5 to 10 Year Old,"['Chintapurni Mandir', 'Sheetla Mata Mandir', ...",Near by railways station near by market near b...,,"['Feng Shui / Vaastu Compliant', 'Water Storag...",
137,3 Bedroom House for sale in Sector 7 Gurgaon,,3.1,13778.0,(209 sq.m.) Plot Area,Plot area 250(209.03 sq.m.),3,3,2,not available,"Sector 7 Gurgaon, Gurgaon, Haryana",2,North-West,10+ Year Old,"['Chintapurni Mandir', 'State bank ATM', 'Dr. ...",250 square yards double story made 5 bhk house...,"['6 Wardrobe', '30 Light', 'No AC', 'No Bed', ...","['Park', 'Visitor Parking', 'Low Density Socie...","['Environment4 out of 5', 'Lifestyle4 out of 5..."
304,7 Bedroom House for sale in Lucknow,dlf garden city floors,4.0,17817.0,(209 sq.m.) Plot Area,Plot area 2245(208.57 sq.m.),7,7,3+,not available,"Lucknow, Gurgaon, Haryana",4,,0 to 1 Year Old,"['Sapphire 83 Mall', 'Dwarka Expressway', 'NH-...",I have a house/villa available for sale in dlf...,[],"['Feng Shui / Vaastu Compliant', 'Private Gard...",
408,1 Bedroom House for sale in Sector 3A Gurgaon,,0.37,7916.0,(45 sq.m.) Built-up Area,Built Up area: 480 (44.59 sq.m.),1,1,1,not available,"Laxman Vihar, Sector 3a, Gurgaon, Sector 3A Gu...",1,,1 to 5 Year Old,"['Chintapurni Mandir', 'State bank ATM', 'Prat...",Looking for a good 1 bhk independent floor in ...,,,"['Environment4 out of 5', 'Lifestyle4 out of 5..."
151,4 Bedroom House for sale in Sector 70A Gurgaon,bptp visionnaire,4.0,6666.0,(557 sq.m.) Plot Area,Plot area 6000(557.42 sq.m.),4,4,3+,servant room,"B 181, Sector 70A Gurgaon, Gurgaon, Haryana",2,North-East,1 to 5 Year Old,"['Good Earth City Center 2', 'Kunskapsskolan I...",Excellently connected via golf course ext. Roa...,,"['Centrally Air Conditioned', 'Water purifier'...","['Environment5 out of 5', 'Lifestyle4 out of 5..."
955,10 Bedroom House for sale in DLF Phase 3,,4.5,33333.0,(136 sq.m.) Plot Area,Plot area 163(136.29 sq.m.)Built Up area: 160 ...,10,8,3+,"store room,servant room","Dlf Phase 3, DLF Phase 3, Gurgaon, Haryana",4,East,1 to 5 Year Old,"['Dlf phase 3 metro station', 'Micromax moulsa...","Dlf phase 3 very prime location , this buildin...","['1 Water Purifier', '10 Fan', '1 Exhaust Fan'...","['Feng Shui / Vaastu Compliant', 'Maintenance ...","['Environment4 out of 5', 'Safety4 out of 5', ..."
143,4 Bedroom House for sale in Sector 109 Gurgaon,international city by sobha phase 2,6.8,12593.0,(502 sq.m.) Plot Area,Plot area 600(501.68 sq.m.),4,5,3,servant room,"128, Sector 109 Gurgaon, Gurgaon, Haryana",2,North-West,1 to 5 Year Old,"['Dwarka Sector 21 Metro Station', 'Pacific D2...",Very beautiful location and sobha internationa...,,"['Feng Shui / Vaastu Compliant', 'Private Gard...","['Environment5 out of 5', 'Lifestyle4 out of 5..."
13,5 Bedroom House for sale in DLF Phase 1,,15.0,33200.0,(420 sq.m.) Plot Area,Plot area 502(419.74 sq.m.),5,6,3+,"pooja room,study room,servant room,store room","A Block, DLF Phase 1, Gurgaon, Haryana",3,North,5 to 10 Year Old,"['Guru dronacharya metro station', 'Dlf phase ...",Genuine livable kothi at the rate of plot only...,"['5 Wardrobe', '9 Fan', '1 Exhaust Fan', '6 Ge...","['Feng Shui / Vaastu Compliant', 'Private Gard...","['Environment5 out of 5', 'Lifestyle5 out of 5..."


In [55]:
df.facing.value_counts()

East          178
North-East    158
North         109
West           75
North-West     44
South-East     39
South          34
South-West     24
Name: facing, dtype: int64

In [56]:
# check for null values in the facing column
df.facing.isnull().sum()

303

In [57]:
# fill the null values with NA
df.facing.fillna('NA', inplace=True)

In [58]:
# create new columns: area and property type
df.insert(loc=4, column='area', value=round((df.price*10000000)/df.price_per_sqft))
df.insert(loc=1, column='property_type', value='house')
df.head()

Unnamed: 0,property_name,property_type,society,price,price_per_sqft,area,area_type,areaWithType,bedrooms,bathrooms,balconies,additional_room,address,floor_num,facing,age_possession,nearby_locations,description,furnish_details,features,rating
0,5 Bedroom House for sale in Sector 70A Gurgaon,house,bptp visionnaire,5.25,20115.0,2610.0,(242 sq.m.) Plot Area,Plot area 290(242.48 sq.m.),5,4,3+,servant room,"29b, Sector 70A Gurgaon, Gurgaon, Haryana",3,North-East,0 to 1 Year Old,"['Good Earth City Center 2', 'Kunskapsskolan I...",Do you wish to buy an independent house in sec...,"['1 Wardrobe', '1 Fan', '1 Exhaust Fan', '1 Ge...","['Feng Shui / Vaastu Compliant', 'Private Gard...","['Environment5 out of 5', 'Lifestyle4 out of 5..."
1,5 Bedroom House for sale in Sector 21A Faridabad,house,,5.7,105751.0,539.0,(50 sq.m.) Plot Area,Plot area 539(50.07 sq.m.),5,4,2,"store room,pooja room,servant room","Sector 21A Faridabad, Gurgaon, Haryana",2,,5 to 10 Year Old,,"Hi, we have an independent house/villa availab...","['1 Water Purifier', '5 Fan', '1 Exhaust Fan',...","['Private Garden / Terrace', 'Park', 'Visitor ...",
2,10 Bedroom House for sale in Sushant Lok Phase 1,house,,2.1,38251.0,549.0,(51 sq.m.) Plot Area,Plot area 61(51 sq.m.),10,10,3+,servant room,"Sushant Lok Phase 1, Gurgaon, Haryana",5,West,0 to 1 Year Old,"['Sector 42-43 metro station', 'Huda city cent...","Monthly rental income is rs1,40,000/- Best opt...","['10 Bed', '3 Fan', '10 Geyser', '2 Light', 'N...","['Maintenance Staff', 'Water Storage', 'Visito...","['Environment5 out of 5', 'Lifestyle5 out of 5..."
3,21 Bedroom House for sale in Sector 54 Gurgaon,house,,5.0,43066.0,1161.0,(108 sq.m.) Plot Area,Plot area 129(107.86 sq.m.),21,21,3+,servant room,"Sector 54 Gurgaon, Gurgaon, Haryana",5,North,1 to 5 Year Old,"['Sector 53-54 metro station', 'Sector 54 chow...","129 sq yd plot size. 5 floors built up , fully...","['1 Water Purifier', '21 Fan', '1 Fridge', '1 ...","['Feng Shui / Vaastu Compliant', 'Private Gard...","['Environment4 out of 5', 'Lifestyle5 out of 5..."
4,12 Bedroom House for sale in Sushant Lok Phase 1,house,,3.0,53763.0,558.0,(52 sq.m.) Plot Area,Plot area 62(51.84 sq.m.),12,12,3+,others,"1228, Sushant Lok Phase 1, Gurgaon, Haryana",5,West,Within 6 months,"['Sector 42-43 metro station', 'Huda city cent...",Best for investment purpose. Fully furnished b...,"['1 Water Purifier', '1 Fridge', '12 Fan', '1 ...","['Maintenance Staff', 'Water Storage', 'Visito...","['Environment5 out of 5', 'Lifestyle5 out of 5..."


In [59]:
# drop the redundant column area type
df.drop(columns=['area_type'], inplace=True)
df.shape

(964, 20)

In [60]:
df.isnull().sum()

property_name         0
property_type         0
society               0
price                19
price_per_sqft       19
area                 19
areaWithType          0
bedrooms              0
bathrooms             0
balconies             0
additional_room       0
address               5
floor_num            19
facing                0
age_possession        0
nearby_locations    116
description           0
furnish_details     235
features            302
rating              121
dtype: int64

In [61]:
# export the cleaned dataset to a csv file
df.to_csv('houses_cleaned.csv', index=False)