In [1]:
import numpy as np
import pandas as pd
import matplotlib.pyplot as plt
import seaborn as sns

In [14]:
import warnings
warnings.simplefilter(action='ignore', category=pd.errors.SettingWithCopyWarning)

In [2]:
# Show every column when a DataFrame is displayed (None removes the limit).
pd.set_option('display.max_columns', None)

In [3]:
# Load the imputed listings file and preview its first row.
imputed_csv_path = "data/final-imputed/final-full-imputed-v1.csv"
df = pd.read_csv(imputed_csv_path)
df.iloc[:1]

Unnamed: 0,property_id,property_name,property_type,link,Society,Sector,City,address1,address2,PricePerUnit,area,Super Built Up,Built Up area,Carpet area,Plot Area,area_unit,bedRoom,bathroom,balcony,additionalRoom,Pooja Room,Servant Room,Store Room,Study Room,Other Room,facing,FloorNo,TotalFloors,Overlooking,Main Road,Park/Garden,Pool,Club,Overlook Others,agePossession,Flooring,GatedCommunity,Furnishing,CoveredParking,OpenParking,RoadFacing,WaterSource,24*7 Water,MuniCorp Water,Borewell/Tank,PowerBackup,WheelChairFriendly,PetFriendly,description,furnishDetails,Luxury Score,Facilities Categories,features,price
0,R76627967,7Bedrooms 7Baths,House/Villa,https://www.99acres.com/7-bhk-bedroom-independ...,,Sector 15 Chandigarh,Chandigarh,"Sector 15 Chandigarh, Chandigarh, India","Sector 15 Chandigarh, Chandigarh, India",15555.555556,Plot area 2000(1672.25 sq.m.) sq.yards,,18000.0,,18000.0,sq.yards,7,7,4,Servant Room,0,1,0,0,0,North-West,0,2,Others,0,0,0,0,1,Old,Marble,No,Semifurnished,3,3,40.0,"24*7 Water,Municipal corporation",1,1,0,No,Yes,Yes,This 7 bhk house for sale in sector 15 chandig...,"['4 Fan', '4 Light', 'No AC', 'No Bed', 'No Ch...",19,Standard,"['Feng Shui / Vaastu Compliant', 'Water purifi...",28.0


### Some Feature Engineering

In [4]:
# Number of listings per TotalFloors value, ordered by floor count.
floor_counts = df['TotalFloors'].value_counts()
floor_counts.sort_index()

TotalFloors
0        7
1      553
2     2281
3     1609
4      679
5       98
6      196
7       99
8      142
9       86
10     150
11     116
12     284
13     376
14     333
15     195
16     200
17     338
18     115
19     127
20      21
21      64
22     118
23      56
24      34
25     109
26      10
27       1
28       2
30       8
32       2
33       9
34       2
35       1
42       7
43       1
Name: count, dtype: int64

In [5]:
def categorize_floor(floor):
    """Map a building's total floor count to a height category.

    Bands (upper bounds inclusive):
        floor <= 3   -> 'Low-Rise'
        floor <= 12  -> 'Mid-Rise'
        floor <= 40  -> 'High-Rise'
        otherwise    -> 'Ultra-High-Rise'

    The bands are contiguous, so a fractional count such as 3.5 lands in the
    next band up instead of falling through every branch to
    'Ultra-High-Rise'. A missing value (NaN/None) is returned unchanged
    rather than being assigned a category.

    Parameters
    ----------
    floor : int or float
        Total number of floors in the building.

    Returns
    -------
    str
        One of the four category labels, or the input itself when it is
        missing.
    """
    # Every comparison against NaN is False, which would otherwise label a
    # missing floor count as 'Ultra-High-Rise'.
    if pd.isna(floor):
        return floor
    if floor <= 3:
        return 'Low-Rise'
    if floor <= 12:
        return 'Mid-Rise'
    if floor <= 40:
        return 'High-Rise'
    return 'Ultra-High-Rise'

In [6]:
# Preview the category computed for each row; the result is not stored here.
df['TotalFloors'].map(categorize_floor)

0       Low-Rise
1       Low-Rise
2       Low-Rise
3       Low-Rise
4       Low-Rise
          ...   
8424    Mid-Rise
8425    Mid-Rise
8426    Low-Rise
8427    Mid-Rise
8428    Mid-Rise
Name: TotalFloors, Length: 8429, dtype: object

In [7]:
# Add FloorRise immediately before TotalFloors. The position is looked up by
# column name instead of the hard-coded 27, and the guard makes the cell safe
# to re-run (DataFrame.insert raises ValueError if the column already exists).
if 'FloorRise' not in df.columns:
    df.insert(df.columns.get_loc('TotalFloors'), 'FloorRise',
              value=df['TotalFloors'].apply(categorize_floor))

In [8]:
# First row only, to confirm the new FloorRise column is in place.
df.iloc[:1]

Unnamed: 0,property_id,property_name,property_type,link,Society,Sector,City,address1,address2,PricePerUnit,area,Super Built Up,Built Up area,Carpet area,Plot Area,area_unit,bedRoom,bathroom,balcony,additionalRoom,Pooja Room,Servant Room,Store Room,Study Room,Other Room,facing,FloorNo,FloorRise,TotalFloors,Overlooking,Main Road,Park/Garden,Pool,Club,Overlook Others,agePossession,Flooring,GatedCommunity,Furnishing,CoveredParking,OpenParking,RoadFacing,WaterSource,24*7 Water,MuniCorp Water,Borewell/Tank,PowerBackup,WheelChairFriendly,PetFriendly,description,furnishDetails,Luxury Score,Facilities Categories,features,price
0,R76627967,7Bedrooms 7Baths,House/Villa,https://www.99acres.com/7-bhk-bedroom-independ...,,Sector 15 Chandigarh,Chandigarh,"Sector 15 Chandigarh, Chandigarh, India","Sector 15 Chandigarh, Chandigarh, India",15555.555556,Plot area 2000(1672.25 sq.m.) sq.yards,,18000.0,,18000.0,sq.yards,7,7,4,Servant Room,0,1,0,0,0,North-West,0,Low-Rise,2,Others,0,0,0,0,1,Old,Marble,No,Semifurnished,3,3,40.0,"24*7 Water,Municipal corporation",1,1,0,No,Yes,Yes,This 7 bhk house for sale in sector 15 chandig...,"['4 Fan', '4 Light', 'No AC', 'No Bed', 'No Ch...",19,Standard,"['Feng Shui / Vaastu Compliant', 'Water purifi...",28.0


### Final Cleaning

#### Sectors

##### Panchkula

In [9]:
# Listings per sector among rows whose City is Panchkula.
df.loc[df['City'] == 'Panchkula', 'Sector'].value_counts()

Sector
Pinjore                  228
Sector 20 Panchkula      102
Peer Muchalla            100
Sector 15 Panchkula       77
Sector 21 Panchkula       76
Sector 7 Panchkula        58
Sector 4 Panchkula        53
Mansa Devi Complex        51
Sector 10 Panchkula       50
Sector 9 Panchkula        47
Sector 11 Panchkula       44
Sector 17 Panchkula       41
Sector 8 panchkula        40
Sector 2 Panchkula        36
Sector 12 A Panchkula     35
Sector 25 Panchkula       30
Sector 26 Panchkula       29
Sector 6 Panchkula        28
Sector 16 Panchkula       27
Sector 12 Panchkula       26
Sector 28 Panchkula       18
Zirakpur                  18
Sector 27 Panchkula       11
Sector 19 Panchkula        7
Sector 23 Panchkula        6
Sector 24 Panchkula        6
Sector 14 Panchkula        6
Kalka                      5
Sector 3 Panchkula         4
Sector 31 Panchkula        4
Sector 18 Panchkula        3
Chandi Mandir              2
Sector 29                  1
Ramgarh                    1
Name: c

In [12]:
# Sector 3 Panchkula -> Pinjore: remember the row labels to relabel, then
# preview those rows.
is_sector3 = df['Sector'].eq('Sector 3 Panchkula')
temp_list = df[is_sector3].index
df[is_sector3]

Unnamed: 0,property_id,property_name,property_type,link,Society,Sector,City,address1,address2,PricePerUnit,area,Super Built Up,Built Up area,Carpet area,Plot Area,area_unit,bedRoom,bathroom,balcony,additionalRoom,Pooja Room,Servant Room,Store Room,Study Room,Other Room,facing,FloorNo,FloorRise,TotalFloors,Overlooking,Main Road,Park/Garden,Pool,Club,Overlook Others,agePossession,Flooring,GatedCommunity,Furnishing,CoveredParking,OpenParking,RoadFacing,WaterSource,24*7 Water,MuniCorp Water,Borewell/Tank,PowerBackup,WheelChairFriendly,PetFriendly,description,furnishDetails,Luxury Score,Facilities Categories,features,price
1190,G75361261,4Bedrooms 4Baths,House/Villa,https://www.99acres.com/4-bhk-bedroom-independ...,,Sector 3 Panchkula,Panchkula,"Sector 3 Panchkula, Panchkula, Haryana","Sector 3 Panchkula, Panchkula, Haryana",10000.0,Plot area 2150(199.74 sq.m.) sq.ft.,,2150.0,,2150.0,sq.ft.,4,4,2,Servant Room,0,1,0,0,0,East,0,Mid-Rise,4,,0,0,0,0,0,New,Vitrified,No,Semifurnished,0,0,,,0,0,0,No,No,No,4-Bhk builder floor for sale in dlf valley pan...,"['3 Wardrobe', '1 Water Purifier', '4 Light', ...",0,Basic,[],2.15
1200,K76026541,6Bedrooms 6Baths,House/Villa,https://www.99acres.com/6-bhk-bedroom-independ...,DLF The Valley,Sector 3 Panchkula,Panchkula,"DLF The Valley, Sector 3 Panchkula, Panchkula,...","Sector 3 Panchkula, Panchkula, Haryana",20915.0,Plot area 1530(142.14 sq.m.) sq.ft.,,1530.0,,1530.0,sq.ft.,6,6,3,Others,0,0,0,0,1,North-West,0,Low-Rise,3,Main Road,1,0,0,0,0,RelNew,Marble,Yes,Unfurnished,1,1,30.0,,0,0,0,No,No,No,Looking for buyer to purchase our house/villa ...,,0,Basic,[],3.2
1494,K70879864,5Bedrooms 5Baths,House/Villa,https://www.99acres.com/5-bhk-bedroom-independ...,DLF The Valley,Sector 3 Panchkula,Panchkula,"DLF The Valley, Sector 3 Panchkula, Panchkula,...","Sector 3 Panchkula, Panchkula, Haryana",18843.333333,Plot area 171(142.98 sq.m.) sq.yards,,1539.0,,1539.0,sq.yards,5,5,4,Servant Room,0,1,0,0,0,South-East,0,Low-Rise,3,Main Road,1,0,0,0,0,New,Vitrified,No,Furnished,4,2,150.0,24*7 Water,1,0,0,Full,No,No,This 5 bhk independent house for sale in dlf v...,"['5 Wardrobe', '1 Exhaust Fan', '25 Light', '1...",44,Premium,"['Security / Fire Alarm', 'Private Garden / Te...",2.7
1495,Q74819217,5Bedrooms 5Baths,House/Villa,https://www.99acres.com/5-bhk-bedroom-independ...,DLF The Valley,Sector 3 Panchkula,Panchkula,"DLF The Valley, Sector 3 Panchkula, Panchkula,...","Sector 3 Panchkula, Panchkula, Haryana",9000.0,Built Up area: 3000 (278.71 sq.m.) sq.ft.,,3000.0,,,sq.ft.,5,5,4,Servant Room,0,1,0,0,0,East,0,Low-Rise,3,Main Road,1,0,0,0,0,New,Vitrified,No,Furnished,0,5,150.0,"24*7 Water,Borewell/Tank",1,0,1,Full,No,No,Fully finished independent villa in the heart ...,"['5 Wardrobe', '5 Light', '1 Modular Kitchen',...",9,Basic,"['Maintenance Staff', 'Water Storage', 'Park',...",2.7


In [18]:
# Relabel the rows captured in temp_list as 'Pinjore' with one .loc
# assignment. Writing through df['Sector'].loc[i] is chained indexing: it can
# end up modifying a temporary object and leave df itself unchanged.
df.loc[temp_list, 'Sector'] = 'Pinjore'

In [19]:
# Show the rows selected by temp_list, all columns.
df.loc[temp_list, :]

Unnamed: 0,property_id,property_name,property_type,link,Society,Sector,City,address1,address2,PricePerUnit,area,Super Built Up,Built Up area,Carpet area,Plot Area,area_unit,bedRoom,bathroom,balcony,additionalRoom,Pooja Room,Servant Room,Store Room,Study Room,Other Room,facing,FloorNo,FloorRise,TotalFloors,Overlooking,Main Road,Park/Garden,Pool,Club,Overlook Others,agePossession,Flooring,GatedCommunity,Furnishing,CoveredParking,OpenParking,RoadFacing,WaterSource,24*7 Water,MuniCorp Water,Borewell/Tank,PowerBackup,WheelChairFriendly,PetFriendly,description,furnishDetails,Luxury Score,Facilities Categories,features,price
1190,G75361261,4Bedrooms 4Baths,House/Villa,https://www.99acres.com/4-bhk-bedroom-independ...,,Pinjore,Panchkula,"Sector 3 Panchkula, Panchkula, Haryana","Sector 3 Panchkula, Panchkula, Haryana",10000.0,Plot area 2150(199.74 sq.m.) sq.ft.,,2150.0,,2150.0,sq.ft.,4,4,2,Servant Room,0,1,0,0,0,East,0,Mid-Rise,4,,0,0,0,0,0,New,Vitrified,No,Semifurnished,0,0,,,0,0,0,No,No,No,4-Bhk builder floor for sale in dlf valley pan...,"['3 Wardrobe', '1 Water Purifier', '4 Light', ...",0,Basic,[],2.15
1200,K76026541,6Bedrooms 6Baths,House/Villa,https://www.99acres.com/6-bhk-bedroom-independ...,DLF The Valley,Pinjore,Panchkula,"DLF The Valley, Sector 3 Panchkula, Panchkula,...","Sector 3 Panchkula, Panchkula, Haryana",20915.0,Plot area 1530(142.14 sq.m.) sq.ft.,,1530.0,,1530.0,sq.ft.,6,6,3,Others,0,0,0,0,1,North-West,0,Low-Rise,3,Main Road,1,0,0,0,0,RelNew,Marble,Yes,Unfurnished,1,1,30.0,,0,0,0,No,No,No,Looking for buyer to purchase our house/villa ...,,0,Basic,[],3.2
1494,K70879864,5Bedrooms 5Baths,House/Villa,https://www.99acres.com/5-bhk-bedroom-independ...,DLF The Valley,Pinjore,Panchkula,"DLF The Valley, Sector 3 Panchkula, Panchkula,...","Sector 3 Panchkula, Panchkula, Haryana",18843.333333,Plot area 171(142.98 sq.m.) sq.yards,,1539.0,,1539.0,sq.yards,5,5,4,Servant Room,0,1,0,0,0,South-East,0,Low-Rise,3,Main Road,1,0,0,0,0,New,Vitrified,No,Furnished,4,2,150.0,24*7 Water,1,0,0,Full,No,No,This 5 bhk independent house for sale in dlf v...,"['5 Wardrobe', '1 Exhaust Fan', '25 Light', '1...",44,Premium,"['Security / Fire Alarm', 'Private Garden / Te...",2.7
1495,Q74819217,5Bedrooms 5Baths,House/Villa,https://www.99acres.com/5-bhk-bedroom-independ...,DLF The Valley,Pinjore,Panchkula,"DLF The Valley, Sector 3 Panchkula, Panchkula,...","Sector 3 Panchkula, Panchkula, Haryana",9000.0,Built Up area: 3000 (278.71 sq.m.) sq.ft.,,3000.0,,,sq.ft.,5,5,4,Servant Room,0,1,0,0,0,East,0,Low-Rise,3,Main Road,1,0,0,0,0,New,Vitrified,No,Furnished,0,5,150.0,"24*7 Water,Borewell/Tank",1,0,1,Full,No,No,Fully finished independent villa in the heart ...,"['5 Wardrobe', '5 Light', '1 Modular Kitchen',...",9,Basic,"['Maintenance Staff', 'Water Storage', 'Park',...",2.7


In [20]:
# Listings per sector among rows whose City is Panchkula.
df.loc[df['City'] == 'Panchkula', 'Sector'].value_counts()

Sector
Pinjore                  232
Sector 20 Panchkula      102
Peer Muchalla            100
Sector 15 Panchkula       77
Sector 21 Panchkula       76
Sector 7 Panchkula        58
Sector 4 Panchkula        53
Mansa Devi Complex        51
Sector 10 Panchkula       50
Sector 9 Panchkula        47
Sector 11 Panchkula       44
Sector 17 Panchkula       41
Sector 8 panchkula        40
Sector 2 Panchkula        36
Sector 12 A Panchkula     35
Sector 25 Panchkula       30
Sector 26 Panchkula       29
Sector 6 Panchkula        28
Sector 16 Panchkula       27
Sector 12 Panchkula       26
Zirakpur                  18
Sector 28 Panchkula       18
Sector 27 Panchkula       11
Sector 19 Panchkula        7
Sector 23 Panchkula        6
Sector 24 Panchkula        6
Sector 14 Panchkula        6
Kalka                      5
Sector 31 Panchkula        4
Sector 18 Panchkula        3
Chandi Mandir              2
Sector 29                  1
Ramgarh                    1
Name: count, dtype: int64

In [21]:
# Rows whose Sector is exactly 'Ramgarh'.
df.loc[df['Sector'].eq('Ramgarh')]

Unnamed: 0,property_id,property_name,property_type,link,Society,Sector,City,address1,address2,PricePerUnit,area,Super Built Up,Built Up area,Carpet area,Plot Area,area_unit,bedRoom,bathroom,balcony,additionalRoom,Pooja Room,Servant Room,Store Room,Study Room,Other Room,facing,FloorNo,FloorRise,TotalFloors,Overlooking,Main Road,Park/Garden,Pool,Club,Overlook Others,agePossession,Flooring,GatedCommunity,Furnishing,CoveredParking,OpenParking,RoadFacing,WaterSource,24*7 Water,MuniCorp Water,Borewell/Tank,PowerBackup,WheelChairFriendly,PetFriendly,description,furnishDetails,Luxury Score,Facilities Categories,features,price
1206,F72432522,2Bedrooms 3Baths,House/Villa,https://www.99acres.com/2-bhk-bedroom-independ...,bhagat singh colony,Ramgarh,Panchkula,"bhagat singh colony, Ramgarh, Panchkula, Haryana","Ramgarh, Panchkula, Haryana",10000.0,Plot area 300(27.87 sq.m.) sq.ft.,,300.0,,300.0,sq.ft.,2,3,1,,0,0,0,0,0,East,0,Low-Rise,3,,0,0,0,0,0,ModOld,Vitrified,No,Unfurnished,0,1,,,0,0,0,No,No,No,Looking for buyer to purchase our house/villa ...,[],0,Basic,[],0.3


In [22]:
# Drop the 'Ramgarh' listing by condition instead of the hard-coded row label
# 1206: this keeps working if row labels shift and is a no-op (rather than a
# KeyError) when the cell is re-run.
df.drop(df[df['Sector'] == 'Ramgarh'].index, inplace=True)

In [23]:
# Rows whose Sector is exactly 'Sector 29'.
df.loc[df['Sector'].eq('Sector 29')]

Unnamed: 0,property_id,property_name,property_type,link,Society,Sector,City,address1,address2,PricePerUnit,area,Super Built Up,Built Up area,Carpet area,Plot Area,area_unit,bedRoom,bathroom,balcony,additionalRoom,Pooja Room,Servant Room,Store Room,Study Room,Other Room,facing,FloorNo,FloorRise,TotalFloors,Overlooking,Main Road,Park/Garden,Pool,Club,Overlook Others,agePossession,Flooring,GatedCommunity,Furnishing,CoveredParking,OpenParking,RoadFacing,WaterSource,24*7 Water,MuniCorp Water,Borewell/Tank,PowerBackup,WheelChairFriendly,PetFriendly,description,furnishDetails,Luxury Score,Facilities Categories,features,price
1717,P76502167,5Bedrooms 4Baths,House/Villa,https://www.99acres.com/5-bhk-bedroom-independ...,Tribune Mitra Vihar,Sector 29,Panchkula,"Tribune Mitra Vihar, Sector 29, Panchkula, Har...","Sector 29, Panchkula, Haryana",19744.444444,Plot area 287(239.97 sq.m.) sq.yards,,2583.0,,2583.0,sq.yards,5,4,2,Pooja Room,1,0,0,0,0,East,0,Low-Rise,2,"Main Road,Park/Garden",1,1,0,0,0,Old,Marble,Yes,Unfurnished,2,0,9.0,,0,0,0,No,No,Yes,"East facing, corner plot, full of sunlight, so...",[],8,Basic,"['Private Garden / Terrace', 'Rain Water Harve...",5.4


In [24]:
# Drop the 'Sector 29' listing by condition instead of the hard-coded row
# label 1717: this keeps working if row labels shift and is a no-op (rather
# than a KeyError) when the cell is re-run.
df.drop(df[df['Sector'] == 'Sector 29'].index, inplace=True)

In [29]:
# Listings tagged Sector 'Zirakpur' with City 'Panchkula': remember their row
# labels, then preview them.
zirakpur_in_panchkula = df['Sector'].eq('Zirakpur') & df['City'].eq('Panchkula')
temp_list = df[zirakpur_in_panchkula].index
df[zirakpur_in_panchkula]

Unnamed: 0,property_id,property_name,property_type,link,Society,Sector,City,address1,address2,PricePerUnit,area,Super Built Up,Built Up area,Carpet area,Plot Area,area_unit,bedRoom,bathroom,balcony,additionalRoom,Pooja Room,Servant Room,Store Room,Study Room,Other Room,facing,FloorNo,FloorRise,TotalFloors,Overlooking,Main Road,Park/Garden,Pool,Club,Overlook Others,agePossession,Flooring,GatedCommunity,Furnishing,CoveredParking,OpenParking,RoadFacing,WaterSource,24*7 Water,MuniCorp Water,Borewell/Tank,PowerBackup,WheelChairFriendly,PetFriendly,description,furnishDetails,Luxury Score,Facilities Categories,features,price
5599,E76316503,3BHK 2Baths,Flat/Apartment,https://www.99acres.com/3-bhk-bedroom-apartmen...,,Zirakpur,Panchkula,"Sushma Elite Cross, Zirakpur, Panchkula, Haryana","Zirakpur, Panchkula, Haryana",4070.0,Carpet area: 1695 (157.47 sq.m.) sq.ft.,,2042.0,1695.0,,sq.ft.,3,2,4,Pooja Room,1,0,0,0,0,East,9,Mid-Rise,12,,0,0,0,0,0,RelNew,Vitrified,Yes,Unfurnished,2,0,,,0,0,0,Full,No,No,1685 sq ft \n1) north east facing door entranc...,,49,Premium,"['Security / Fire Alarm', 'Feng Shui / Vaastu ...",0.69
5608,C75923881,3BHK 3Baths,Flat/Apartment,https://www.99acres.com/3-bhk-bedroom-apartmen...,,Zirakpur,Panchkula,"Maya Garden city, Zirakpur, Panchkula, Haryana","Zirakpur, Panchkula, Haryana",3505.0,Carpet area: 1854 (172.24 sq.m.) sq.ft.,,2234.0,1854.0,,sq.ft.,3,3,4,Pooja Room,1,0,0,0,0,North-East,10,Mid-Rise,12,"Club,Main Road,Park/Garden",1,1,0,1,0,ModOld,Marble,Yes,Semifurnished,1,0,9.0,24*7 Water,1,0,0,Partial,No,No,Colony is located close to highway in zirakpur...,"['3 Wardrobe', '5 Fan', '1 Exhaust Fan', '3 Ge...",17,Standard,"['Security / Fire Alarm', 'Intercom Facility',...",0.65
5627,G76322227,3BHK 3Baths,Flat/Apartment,https://www.99acres.com/3-bhk-bedroom-apartmen...,,Zirakpur,Panchkula,"NORTHVIEW HOMEZ, Zirakpur, Panchkula, Haryana","Zirakpur, Panchkula, Haryana",5602.0,Super Built up area 1910(177.44 sq.m.) sq.ft.,1910.0,1616.0,,,sq.ft.,3,3,3,"Store Room,Study Room",0,0,1,1,0,East,3,Mid-Rise,12,"Club,Main Road,Park/Garden",1,1,0,1,0,UndConst,Vitrified,Yes,Semifurnished,0,1,100.0,24*7 Water,1,0,0,Full,Yes,Yes,Main on chandigarh - Delhi highway with mivan ...,"['1 Wardrobe', '1 Modular Kitchen', 'No AC', '...",38,Premium,"['Security / Fire Alarm', 'Lift(s)', 'Maintena...",1.07
5637,O76428669,3BHK 3Baths,Flat/Apartment,https://www.99acres.com/3-bhk-bedroom-apartmen...,,Zirakpur,Panchkula,"Beliston Avenue , Zirakpur, Panchkula, Haryana","Zirakpur, Panchkula, Haryana",4509.0,Super Built up area 1772(164.62 sq.m.) sq.ft.,1772.0,1499.0,,,sq.ft.,3,3,2,Pooja Room,1,0,0,0,0,North-East,8,Mid-Rise,10,"Club,Main Road,Others,Park/Garden,Pool",1,1,1,1,1,New,Vitrified,Yes,Semifurnished,1,0,40.0,"24*7 Water,Borewell/Tank,Municipal corporation",1,1,1,Full,Yes,Yes,This lovely 3 bhk apartment/flat in zirakpur i...,"['3 Wardrobe', '1 Modular Kitchen', 'No AC', '...",19,Standard,"['Feng Shui / Vaastu Compliant', 'Security / F...",0.799
5643,P76321891,3BHK 3Baths,Flat/Apartment,https://www.99acres.com/3-bhk-bedroom-apartmen...,,Zirakpur,Panchkula,"suman marvelous, Zirakpur, Panchkula, Haryana","Zirakpur, Panchkula, Haryana",4297.0,Carpet area: 1745 (162.12 sq.m.) sq.ft.,,2102.0,1745.0,,sq.ft.,3,3,3,,0,0,0,0,0,East,3,High-Rise,17,"Club,Main Road,Park/Garden",1,1,0,1,0,UndConst,Vitrified,Yes,Semifurnished,1,0,60.0,24*7 Water,1,0,0,Full,Yes,Yes,Location is good and very big size flat and cl...,"['3 Wardrobe', '1 Modular Kitchen', 'No AC', '...",39,Premium,"['Security / Fire Alarm', 'Feng Shui / Vaastu ...",0.75
5653,Q76353795,3BHK 3Baths,Builder Floor,https://www.99acres.com/3-bhk-bedroom-independ...,,Zirakpur,Panchkula,"Peermchulla, Zirakpur, Panchkula, Haryana","Zirakpur, Panchkula, Haryana",4949.0,Built Up area: 1300 (120.77 sq.m.)Carpet area:...,,1300.0,990.0,,sq.ft.,3,3,2,Servant Room,0,1,0,0,0,North,2,Low-Rise,3,"Main Road,Park/Garden",1,1,0,0,0,New,Ceramic,Yes,Semifurnished,1,1,35.0,"24*7 Water,Borewell/Tank",1,0,1,No,No,Yes,3 bhk flat 1300 sq ft with lift\nIn peermchull...,"['3 Wardrobe', '17 Light', 'No AC', 'No Bed', ...",7,Basic,"['Water Storage', 'Park', 'Visitor Parking', '...",0.49
5668,P76428881,3BHK 3Baths,Flat/Apartment,https://www.99acres.com/3-bhk-bedroom-apartmen...,,Zirakpur,Panchkula,"Beliston Avenue , Zirakpur, Panchkula, Haryana","Zirakpur, Panchkula, Haryana",4472.0,Super Built up area 1772(164.62 sq.m.) sq.ft.,1772.0,1499.0,,,sq.ft.,3,3,2,Pooja Room,1,0,0,0,0,North-East,8,Mid-Rise,10,"Club,Main Road,Others,Park/Garden,Pool",1,1,1,1,1,New,Vitrified,Yes,Semifurnished,1,0,40.0,"24*7 Water,Borewell/Tank,Municipal corporation",1,1,1,Full,Yes,Yes,"This beautiful 3 bhk flat in zirakpur, panchku...","['3 Wardrobe', '1 Modular Kitchen', 'No AC', '...",19,Standard,"['Feng Shui / Vaastu Compliant', 'Security / F...",0.7925
5669,T76428827,3BHK 3Baths,Flat/Apartment,https://www.99acres.com/3-bhk-bedroom-apartmen...,,Zirakpur,Panchkula,"Beliston Avenue , Zirakpur, Panchkula, Haryana","Zirakpur, Panchkula, Haryana",4503.0,Super Built up area 1772(164.62 sq.m.) sq.ft.,1772.0,1499.0,,,sq.ft.,3,3,2,Pooja Room,1,0,0,0,0,North-East,8,Mid-Rise,10,"Club,Main Road,Others,Park/Garden,Pool",1,1,1,1,1,New,Vitrified,Yes,Semifurnished,1,0,40.0,"24*7 Water,Borewell/Tank,Municipal corporation",1,1,1,Full,Yes,Yes,This 3 bhk apartment is available for sale in ...,"['3 Wardrobe', '1 Modular Kitchen', 'No AC', '...",19,Standard,"['Feng Shui / Vaastu Compliant', 'Security / F...",0.798
5670,Z76428761,3BHK 3Baths,Flat/Apartment,https://www.99acres.com/3-bhk-bedroom-apartmen...,,Zirakpur,Panchkula,"Beliston Avenue , Zirakpur, Panchkula, Haryana","Zirakpur, Panchkula, Haryana",4520.0,Built Up area: 1772 (164.62 sq.m.) sq.ft.,,1772.0,,,sq.ft.,3,3,2,Pooja Room,1,0,0,0,0,North-East,8,Mid-Rise,10,"Club,Main Road,Others,Park/Garden,Pool",1,1,1,1,1,New,Vitrified,Yes,Semifurnished,1,0,40.0,"24*7 Water,Borewell/Tank,Municipal corporation",1,1,1,Full,Yes,Yes,Located in the popular residential address of ...,"['3 Wardrobe', '1 Modular Kitchen', 'No AC', '...",19,Standard,"['Feng Shui / Vaastu Compliant', 'Security / F...",0.801
5714,S76428617,3BHK 3Baths,Flat/Apartment,https://www.99acres.com/3-bhk-bedroom-apartmen...,,Zirakpur,Panchkula,"Beliston Avenue , Zirakpur, Panchkula, Haryana","Zirakpur, Panchkula, Haryana",4458.0,Super Built up area 1772(164.62 sq.m.) sq.ft.,1772.0,1499.0,,,sq.ft.,3,3,2,Pooja Room,1,0,0,0,0,North-East,8,Mid-Rise,10,"Club,Main Road,Others,Park/Garden,Pool",1,1,1,1,1,New,Vitrified,Yes,Semifurnished,1,0,40.0,"24*7 Water,Borewell/Tank,Municipal corporation",1,1,1,Full,Yes,Yes,Check out this 3 bhk apartment for sale in bel...,"['3 Wardrobe', '1 Modular Kitchen', 'No AC', '...",19,Standard,"['Feng Shui / Vaastu Compliant', 'Security / F...",0.79


In [32]:
# Reassign the rows captured in temp_list to City 'Mohali' with one .loc
# assignment. Writing through df['City'].loc[i] is chained indexing: it can
# end up modifying a temporary object and leave df itself unchanged.
df.loc[temp_list, 'City'] = 'Mohali'

In [34]:
# Listings per sector among rows whose City is Panchkula.
df.loc[df['City'] == 'Panchkula', 'Sector'].value_counts()

Sector
Pinjore                  232
Sector 20 Panchkula      102
Peer Muchalla            100
Sector 15 Panchkula       77
Sector 21 Panchkula       76
Sector 7 Panchkula        58
Sector 4 Panchkula        53
Mansa Devi Complex        51
Sector 10 Panchkula       50
Sector 9 Panchkula        47
Sector 11 Panchkula       44
Sector 17 Panchkula       41
Sector 8 panchkula        40
Sector 2 Panchkula        36
Sector 12 A Panchkula     35
Sector 25 Panchkula       30
Sector 26 Panchkula       29
Sector 6 Panchkula        28
Sector 16 Panchkula       27
Sector 12 Panchkula       26
Sector 28 Panchkula       18
Sector 27 Panchkula       11
Sector 19 Panchkula        7
Sector 23 Panchkula        6
Sector 24 Panchkula        6
Sector 14 Panchkula        6
Kalka                      5
Sector 31 Panchkula        4
Sector 18 Panchkula        3
Chandi Mandir              2
Name: count, dtype: int64

##### Chandigarh

In [36]:
# Listings per sector among rows whose City is Chandigarh; kept in chd_ser
# for the filtering step that follows.
chd_ser = df.loc[df['City'] == 'Chandigarh', 'Sector'].value_counts()
chd_ser

Sector
Sector 21 Chandigarh    86
Sector 38 Chandigarh    79
Sector 49 Chandigarh    74
Sector 35 Chandigarh    72
Sector 48 Chandigarh    65
Sector 44 Chandigarh    64
Sector 15 Chandigarh    60
Sector 51 Chandigarh    56
Sector 8 Chandigarh     48
Sector 40 Chandigarh    47
Sector 18 Chandigarh    47
Sector 34 Chandigarh    46
Sector 33 Chandigarh    45
Sector 27 Chandigarh    40
Sector 43 Chandigarh    39
Sector 37 Chandigarh    36
Sector 19 Chandigarh    35
Sector 22 Chandigarh    34
Sector 50 Chandigarh    33
Manimajra               31
Sector 45 Chandigarh    30
Sector 20 Chandigarh    30
Sector 16 Chandigarh    29
Sector 46 Chandigarh    26
Sector 32 Chandigarh    26
Sector 36 Chandigarh    26
Sector 47 Chandigarh    24
Sector 42 Chandigarh    23
Sector 11 Chandigarh    22
Sector 28 Chandigarh    22
Sector 9 Chandigarh     17
Sector 23 Chandigarh    11
Sector 10 Chandigarh    11
Sector 39 Chandigarh    11
Naya Gaon                9
Sector 7 Chandigarh      8
Sector 2 Chandigarh  

Removing sectors with fewer than 4 listings.

In [40]:
# Names of the Chandigarh sectors whose listing count is below 4.
temp_list = chd_ser.loc[chd_ser.lt(4)].index
temp_list

Index(['Ram Darbar Colony', 'Daddu Majra Colony', 'Hallo Majra',
       'Sector 4 Chandigarh', 'Maloya Colony', 'Sector 29 Chandigarh',
       'Sector 25 Chandigarh', 'Dhanas', 'Sector 5 Chandigarh'],
      dtype='object', name='Sector')

In [41]:
def sector_filt(sector):
    """Return the Society, Sector and City columns of every row in the
    module-level ``df`` whose Sector equals ``sector``.

    The match is on the Sector value alone; City is not part of the filter.
    """
    matches = df['Sector'] == sector
    return df.loc[matches, ['Society', 'Sector', 'City']]

In [43]:
# Row labels of the listings in the rare Chandigarh sectors held in temp_list.
# One vectorised isin() lookup replaces the per-sector filter loop, and the
# City condition keeps the selection inside Chandigarh so a same-named sector
# recorded under another city is not dropped along with it.
rare_chandigarh = (df['City'] == 'Chandigarh') & df['Sector'].isin(temp_list)
drop_rows = df[rare_chandigarh].index.tolist()

In [46]:
# Remove the collected rows from df in place.
df.drop(index=drop_rows, inplace=True)

In [47]:
# Listings per sector among rows whose City is Chandigarh, after the drop.
df.loc[df['City'] == 'Chandigarh', 'Sector'].value_counts()

Sector
Sector 21 Chandigarh    86
Sector 38 Chandigarh    79
Sector 49 Chandigarh    74
Sector 35 Chandigarh    72
Sector 48 Chandigarh    65
Sector 44 Chandigarh    64
Sector 15 Chandigarh    60
Sector 51 Chandigarh    56
Sector 8 Chandigarh     48
Sector 18 Chandigarh    47
Sector 40 Chandigarh    47
Sector 34 Chandigarh    46
Sector 33 Chandigarh    45
Sector 27 Chandigarh    40
Sector 43 Chandigarh    39
Sector 37 Chandigarh    36
Sector 19 Chandigarh    35
Sector 22 Chandigarh    34
Sector 50 Chandigarh    33
Manimajra               31
Sector 45 Chandigarh    30
Sector 20 Chandigarh    30
Sector 16 Chandigarh    29
Sector 36 Chandigarh    26
Sector 32 Chandigarh    26
Sector 46 Chandigarh    26
Sector 47 Chandigarh    24
Sector 42 Chandigarh    23
Sector 11 Chandigarh    22
Sector 28 Chandigarh    22
Sector 9 Chandigarh     17
Sector 23 Chandigarh    11
Sector 10 Chandigarh    11
Sector 39 Chandigarh    11
Naya Gaon                9
Sector 7 Chandigarh      8
Sector 2 Chandigarh  

##### Mohali

In [49]:
# Show every row when a Series/DataFrame is displayed (None removes the limit).
pd.set_option('display.max_rows', None)

In [50]:
# Listings per sector among rows whose City is Mohali.
df.loc[df['City'] == 'Mohali', 'Sector'].value_counts()

Sector
Zirakpur               1765
Kharar                  489
Sector 66 Mohali        285
Mullanpur               280
Aerocity                216
Sector 88 Mohali        216
Sector 127 Mohali       170
Sector 115 Mohali       160
New Chandigarh          146
Sector 91 Mohali        138
Sector 125 Mohali       133
Sector 82 Mohali        105
Sector 126 Mohali        96
Dera Bassi               90
Sector 117 Mohali        83
Phase 3 Mohali           65
Sector 85 Mohali         63
Sector 99 Mohali         63
Sector 71 Mohali         62
Sector 79 Mohali         61
Sector 70 Mohali         61
Sector 105 Mohali        60
Phase 7 Mohali           58
Sector 116 Mohali        57
Dhakoli                  53
Sector 80 Mohali         49
Phase 9 Mohali           48
Sector 89 Mohali         41
Sector 69 Mohali         38
Sector 110 Mohali        35
Phase 10 Mohali          33
Sector 65 Mohali         30
Sector 77 Mohali         29
Sector 74 Mohali         29
Sector 68 Mohali         26
Phase 4 Mohal

In [53]:
# Fold 'Shivalik Vihar' listings into 'Sector 127 Mohali'. A single .loc
# assignment replaces the chained df['Sector'].loc[i] writes, which can end
# up modifying a temporary object and leave df itself unchanged.
df.loc[df['Sector'] == 'Shivalik Vihar', 'Sector'] = 'Sector 127 Mohali'

In [54]:
# Fold 'TDI City' listings into 'Sector 118 Mohali'. A single .loc
# assignment replaces the chained df['Sector'].loc[i] writes, which can end
# up modifying a temporary object and leave df itself unchanged.
df.loc[df['Sector'] == 'TDI City', 'Sector'] = 'Sector 118 Mohali'

In [55]:
# Fold 'Sector 66b Mohali' listings into 'Sector 66 Mohali'. A single .loc
# assignment replaces the chained df['Sector'].loc[i] writes, which can end
# up modifying a temporary object and leave df itself unchanged.
df.loc[df['Sector'] == 'Sector 66b Mohali', 'Sector'] = 'Sector 66 Mohali'

In [58]:
# Fold 'Sector 82A Mohali' listings into 'Sector 82 Mohali'. A single .loc
# assignment replaces the chained df['Sector'].loc[i] writes, which can end
# up modifying a temporary object and leave df itself unchanged.
df.loc[df['Sector'] == 'Sector 82A Mohali', 'Sector'] = 'Sector 82 Mohali'

In [60]:
# Fold 'Ranjit Nagar' listings into 'Kharar'. A single .loc assignment
# replaces the chained df['Sector'].loc[i] writes, which can end up modifying
# a temporary object and leave df itself unchanged.
df.loc[df['Sector'] == 'Ranjit Nagar', 'Sector'] = 'Kharar'

In [61]:
# Listings per sector among rows whose City is Mohali, after the relabelling.
df.loc[df['City'] == 'Mohali', 'Sector'].value_counts()

Sector
Zirakpur               1765
Kharar                  496
Sector 66 Mohali        304
Mullanpur               280
Aerocity                216
Sector 88 Mohali        216
Sector 127 Mohali       174
Sector 115 Mohali       160
New Chandigarh          146
Sector 91 Mohali        138
Sector 125 Mohali       133
Sector 82 Mohali        115
Sector 126 Mohali        96
Dera Bassi               90
Sector 117 Mohali        83
Phase 3 Mohali           65
Sector 85 Mohali         63
Sector 99 Mohali         63
Sector 71 Mohali         62
Sector 70 Mohali         61
Sector 79 Mohali         61
Sector 105 Mohali        60
Phase 7 Mohali           58
Sector 116 Mohali        57
Dhakoli                  53
Sector 80 Mohali         49
Phase 9 Mohali           48
Sector 89 Mohali         41
Sector 69 Mohali         38
Sector 110 Mohali        35
Phase 10 Mohali          33
Sector 65 Mohali         30
Sector 74 Mohali         29
Sector 77 Mohali         29
Phase 4 Mohali           26
Sector 124 Mo

### Export Data

In [63]:
# Write the cleaned frame, with all of its columns, to CSV without the row index.
full_export_path = "data/final-clean-data/data-with-extra-column-final.csv"
df.to_csv(full_export_path, index=False)

Data for the Predictor Model (Removing Redundant Columns)

In [64]:
# First row only, to review the columns before trimming them.
df.iloc[:1]

Unnamed: 0,property_id,property_name,property_type,link,Society,Sector,City,address1,address2,PricePerUnit,area,Super Built Up,Built Up area,Carpet area,Plot Area,area_unit,bedRoom,bathroom,balcony,additionalRoom,Pooja Room,Servant Room,Store Room,Study Room,Other Room,facing,FloorNo,FloorRise,TotalFloors,Overlooking,Main Road,Park/Garden,Pool,Club,Overlook Others,agePossession,Flooring,GatedCommunity,Furnishing,CoveredParking,OpenParking,RoadFacing,WaterSource,24*7 Water,MuniCorp Water,Borewell/Tank,PowerBackup,WheelChairFriendly,PetFriendly,description,furnishDetails,Luxury Score,Facilities Categories,features,price
0,R76627967,7Bedrooms 7Baths,House/Villa,https://www.99acres.com/7-bhk-bedroom-independ...,,Sector 15 Chandigarh,Chandigarh,"Sector 15 Chandigarh, Chandigarh, India","Sector 15 Chandigarh, Chandigarh, India",15555.555556,Plot area 2000(1672.25 sq.m.) sq.yards,,18000.0,,18000.0,sq.yards,7,7,4,Servant Room,0,1,0,0,0,North-West,0,Low-Rise,2,Others,0,0,0,0,1,Old,Marble,No,Semifurnished,3,3,40.0,"24*7 Water,Municipal corporation",1,1,0,No,Yes,Yes,This 7 bhk house for sale in sector 15 chandig...,"['4 Fan', '4 Light', 'No AC', 'No Bed', 'No Ch...",19,Standard,"['Feng Shui / Vaastu Compliant', 'Water purifi...",28.0


In [65]:
# Columns left out of the predictor dataset; removed from df in place.
columns_to_remove = [
    'property_id', 'property_name', 'link', 'Society', 'address1', 'address2',
    'area', 'PricePerUnit', 'Super Built Up', 'Carpet area', 'Plot Area',
    'area_unit', 'additionalRoom', 'TotalFloors', 'Overlooking', 'RoadFacing',
    'WaterSource', 'description', 'furnishDetails', 'Luxury Score', 'features',
]
df.drop(columns=columns_to_remove, inplace=True)

In [67]:
# 'Built Up area' is the area column that remains; expose it as 'Area'.
column_renames = {'Built Up area': 'Area'}
df.rename(columns=column_renames, inplace=True)

In [68]:
# First row only, to confirm the trimmed column set.
df.iloc[:1]

Unnamed: 0,property_type,Sector,City,Area,bedRoom,bathroom,balcony,Pooja Room,Servant Room,Store Room,Study Room,Other Room,facing,FloorNo,FloorRise,Main Road,Park/Garden,Pool,Club,Overlook Others,agePossession,Flooring,GatedCommunity,Furnishing,CoveredParking,OpenParking,24*7 Water,MuniCorp Water,Borewell/Tank,PowerBackup,WheelChairFriendly,PetFriendly,Facilities Categories,price
0,House/Villa,Sector 15 Chandigarh,Chandigarh,18000.0,7,7,4,0,1,0,0,0,North-West,0,Low-Rise,0,0,0,0,1,Old,Marble,No,Semifurnished,3,3,1,1,0,No,Yes,Yes,Standard,28.0


In [69]:
# Write the trimmed predictor frame to CSV without the row index.
predictor_export_path = "data/final-clean-data/predictor-data-final.csv"
df.to_csv(predictor_export_path, index=False)