In [24]:
import numpy as np
import pandas as pd
from pathlib import Path

In [25]:
pd.set_option('display.max_rows', None)
pd.set_option('display.max_columns', None)

In [26]:
in_path = Path('../data/raw')
out_path = Path('../data/interim')

In [27]:
# Read the CSV file with the specified path
flats_1 = pd.read_csv(in_path / 'houses.csv')
flats_2 = pd.read_csv(in_path / 'flats_2.csv')

In [28]:
df = pd.concat([flats_1,flats_2],ignore_index=True)

In [29]:
df.shape

(7090, 22)

In [30]:
df.sample(5)

Unnamed: 0,property_name,link,society,price,rate,area,areaWithType,bedRoom,bathroom,balcony,additionalRoom,address,noOfFloor,facing,agePossession,nearbyLocations,description,furnishDetails,features,rating,property_id,floorNum
6622,2 BHK Flat in Bodakdev,https://www.99acres.com/2-bhk-bedroom-apartmen...,"31,Aastha Apartment,",70 Lac,,"₹ 5,833/sq.ft.",Carpet area: 1200 (111.48 sq.m.),2 Bedrooms,2 Bathrooms,1 Balcony,Others,"31, Aastha Apartment, Bodakdev, Opposite Sande...",,East,10+ Year Old,"['ISKON Temple', 'Paramdham Temple', 'State ba...",Its location is damn good. All necessary thing...,"['1 Water Purifier', '1 Fridge', '6 Fan', '1 E...",,"['Lifestyle4.1 out of 5', 'Safety4.2 out of 5'...",O69736064,3rd of 5 Floors
355,2 Bedroom House for sale in Khanpur,https://www.99acres.com/2-bhk-bedroom-independ...,,55 Lac,"₹ 6,011/sq.ft.",(85 sq.m.) Built-up Area,Built Up area: 85,2 Bedrooms,1 Bathroom,No Balcony,,"Khanpur, Khanpur, Ahmedabad East, Ahmedabad",1 Floors,,0 to 1 Year Old,['Ahmedabad Historic Gujari Bazaar Sunday Mark...,First floor residential 2bhk house for resale ...,"['1 Light', 'No AC', 'No Bed', 'No Chimney', '...",,,E69671076,
5322,4 BHK Flat in Chandkheda,https://www.99acres.com/4-bhk-bedroom-apartmen...,Devpriya,2.25 Crore,,"₹ 7,500/sq.ft.",Super Built up area 3000(278.71 sq.m.)Built Up...,4 Bedrooms,4 Bathrooms,1 Balcony,"Store Room,Pooja Room","Chandkheda, Ahmedabad North, Ahmedabad",,East,1 to 5 Year Old,"['Khodiyar Temple', 'State bank of india ATM',...",Devpriya is one of ahmedabad north's most soug...,,"['Feng Shui / Vaastu Compliant', 'Security / F...","['Lifestyle4.2 out of 5', 'Safety4.4 out of 5'...",I70878402,Ground of 7 Floors
6972,3 BHK Flat in Paldi,https://www.99acres.com/3-bhk-bedroom-apartmen...,Namo Hari Apartment,80 Lac,,"₹ 5,556/sq.ft.",Carpet area: 160 (133.78 sq.m.),3 Bedrooms,3 Bathrooms,No Balcony,,"Paldi, Ahmedabad West, Ahmedabad",,,10+ Year Old,['Shahi Masjid - Dargah Hazrat Ali Sher Bangal...,Uuuuuuuuuuuuuuuuuuuuuuuuuuuuuuuuuuu\n Addition...,,['Private Garden / Terrace'],"['Lifestyle4.3 out of 5', 'Safety4.4 out of 5'...",B58773978,2nd of 3 Floors
4042,2 BHK Flat in Satellite,https://www.99acres.com/2-bhk-bedroom-apartmen...,Viswanath Sharanam 8,1 Crore,,"₹ 8,889/sq.ft.",Built Up area: 125 (104.52 sq.m.),2 Bedrooms,2 Bathrooms,1 Balcony,,"Satellite, Ahmedabad West, Ahmedabad",,,10+ Year Old,"['Palam Vihar Vyapar kendra', 'Palam triangle'...",Residential apartment for sell.The property ha...,"['2 Wardrobe', '2 Bed', '2 Fan', '1 Fridge', '...","['Power Back-up', 'Feng Shui / Vaastu Complian...","['Lifestyle4.4 out of 5', 'Safety4.3 out of 5'...",C70048696,3rd of 5 Floors


In [31]:
# info
df.info()

<class 'pandas.core.frame.DataFrame'>
RangeIndex: 7090 entries, 0 to 7089
Data columns (total 22 columns):
 #   Column           Non-Null Count  Dtype 
---  ------           --------------  ----- 
 0   property_name    7090 non-null   object
 1   link             7090 non-null   object
 2   society          6031 non-null   object
 3   price            6834 non-null   object
 4   rate             2460 non-null   object
 5   area             7069 non-null   object
 6   areaWithType     6853 non-null   object
 7   bedRoom          6847 non-null   object
 8   bathroom         6853 non-null   object
 9   balcony          6853 non-null   object
 10  additionalRoom   3598 non-null   object
 11  address          6847 non-null   object
 12  noOfFloor        2403 non-null   object
 13  facing           4691 non-null   object
 14  agePossession    6853 non-null   object
 15  nearbyLocations  6141 non-null   object
 16  description      6885 non-null   object
 17  furnishDetails   4010 non-null   

In [32]:
# check for duplicates
df.drop_duplicates(subset='property_id',inplace=True)

In [33]:
df.duplicated().sum()

0

In [34]:
# check for missing values
df.isnull().sum()

property_name         0
link                  0
society            1056
price                51
rate               4182
area                 16
areaWithType         33
bedRoom              39
bathroom             33
balcony              33
additionalRoom     3125
address              34
noOfFloor          4239
facing             2097
agePossession        33
nearbyLocations     734
description           1
furnishDetails     2783
features           1681
rating              891
property_id           1
floorNum           2498
dtype: int64

In [35]:
# Columns to drop -> property_name, link, property_id
df.drop(columns=['link'], inplace=True)

In [36]:
df.head()

Unnamed: 0,property_name,society,price,rate,area,areaWithType,bedRoom,bathroom,balcony,additionalRoom,address,noOfFloor,facing,agePossession,nearbyLocations,description,furnishDetails,features,rating,property_id,floorNum
0,3 Bedroom House for sale in Ghuma,individual Bunglowe,1.25 Crore,"₹ 8,267/sq.ft.",(140 sq.m.) Plot Area,Plot area 168(140.47 sq.m.),3 Bedrooms,3 Bathrooms,1 Balcony,Pooja Room,"Ghuma, Ahmedabad West, Ahmedabad",2 Floors,South-East,5 to 10 Year Old,"['Atm hdfc bank', 'State bank of india sbi ATM...",Are you planning to buy your dream home? You c...,,"['Feng Shui / Vaastu Compliant', 'Visitor Park...","['Lifestyle3.7 out of 5', 'Connectivity4.1 out...",Y66780728,
1,4 Bedroom House for sale in Sanathal,Goyal Green Park,3 Crore,"₹ 8,333/sq.ft.",(334 sq.m.) Plot Area,Plot area 400(334.45 sq.m.)Built Up area: 350 ...,4 Bedrooms,4 Bathrooms,2 Balconies,"Pooja Room,Study Room,Store Room","Sanathal, Ahmedabad West, Ahmedabad",2 Floors,South-West,10+ Year Old,"['Sahyog General Hospital and Nursing Home', '...",A residential bungalows is available for sale ...,,"['Feng Shui / Vaastu Compliant', 'Private Gard...",,V69832032,
2,3 Bedroom House for sale in Kasindra,Laxmi Residency,,,(156 sq.m.) Built-up Area,,,,,,"Kasindra, Ahmedabad South, Ahmedabad",,,,"['D Mart', 'NH 751', 'Shree SL Patel High Scho...",Laxmi residency is a residential development b...,,,,Y70193200,
3,2 Bedroom House for sale in Dhegam,Good Times By Sangath IPL,,,(64-87 sq.m.) Carpet Area,,,,,,"Dhegam, Gandhinagar, Ahmedabad",,,,,"Sangath good times in dhegam, gandhinagar & sa...",,,,X68471696,
4,5 Bedroom House for sale in Thaltej,Anurita Bungalows,,,(590 sq.m.) Super built-up Area,,,,,,"Thaltej, Ahmedabad West, Ahmedabad",,,,"['Shilaj Circle', 'Anand Niketan Campus', 'Sci...",Anurita is strategically located at thaltej-Sh...,,,"['Lifestyle4.5 out of 5', 'Connectivity4.3 out...",X70883980,


In [37]:
# rename columns
df.rename(columns={'area':'price_per_sqft'},inplace=True)
df.head()

Unnamed: 0,property_name,society,price,rate,price_per_sqft,areaWithType,bedRoom,bathroom,balcony,additionalRoom,address,noOfFloor,facing,agePossession,nearbyLocations,description,furnishDetails,features,rating,property_id,floorNum
0,3 Bedroom House for sale in Ghuma,individual Bunglowe,1.25 Crore,"₹ 8,267/sq.ft.",(140 sq.m.) Plot Area,Plot area 168(140.47 sq.m.),3 Bedrooms,3 Bathrooms,1 Balcony,Pooja Room,"Ghuma, Ahmedabad West, Ahmedabad",2 Floors,South-East,5 to 10 Year Old,"['Atm hdfc bank', 'State bank of india sbi ATM...",Are you planning to buy your dream home? You c...,,"['Feng Shui / Vaastu Compliant', 'Visitor Park...","['Lifestyle3.7 out of 5', 'Connectivity4.1 out...",Y66780728,
1,4 Bedroom House for sale in Sanathal,Goyal Green Park,3 Crore,"₹ 8,333/sq.ft.",(334 sq.m.) Plot Area,Plot area 400(334.45 sq.m.)Built Up area: 350 ...,4 Bedrooms,4 Bathrooms,2 Balconies,"Pooja Room,Study Room,Store Room","Sanathal, Ahmedabad West, Ahmedabad",2 Floors,South-West,10+ Year Old,"['Sahyog General Hospital and Nursing Home', '...",A residential bungalows is available for sale ...,,"['Feng Shui / Vaastu Compliant', 'Private Gard...",,V69832032,
2,3 Bedroom House for sale in Kasindra,Laxmi Residency,,,(156 sq.m.) Built-up Area,,,,,,"Kasindra, Ahmedabad South, Ahmedabad",,,,"['D Mart', 'NH 751', 'Shree SL Patel High Scho...",Laxmi residency is a residential development b...,,,,Y70193200,
3,2 Bedroom House for sale in Dhegam,Good Times By Sangath IPL,,,(64-87 sq.m.) Carpet Area,,,,,,"Dhegam, Gandhinagar, Ahmedabad",,,,,"Sangath good times in dhegam, gandhinagar & sa...",,,,X68471696,
4,5 Bedroom House for sale in Thaltej,Anurita Bungalows,,,(590 sq.m.) Super built-up Area,,,,,,"Thaltej, Ahmedabad West, Ahmedabad",,,,"['Shilaj Circle', 'Anand Niketan Campus', 'Sci...",Anurita is strategically located at thaltej-Sh...,,,"['Lifestyle4.5 out of 5', 'Connectivity4.3 out...",X70883980,


In [38]:
# society
df['society'].value_counts()

society
on request                                           105
On Request                                            80
Shaligram Prime                                       54
Olive Greens                                          43
Godrej Garden City4.2 ★                               43
Godrej Green Glades                                   33
On request                                            25
Madhav Oeuvre 2                                       24
Ganesh Housing Malabar County4.2 ★                    23
Swati Symphony                                        22
Nishant Ratnaakar Verte                               22
Sky Elegante                                          21
Savvy Swaraaj Sports Living3.8 ★                      21
upcoming new project                                  21
Saanvi Nirman Estella                                 18
Cloud 9                                               18
ON REQUEST                                            18
Casa Vyoma             

In [39]:
df['society'].value_counts().shape

(2923,)

In [40]:
import re
df['society'] = df['society'].apply(lambda name: re.sub(r'\d+(\.\d+)?\s?★', '', str(name)).strip()).str.lower()

In [41]:
df['society'].value_counts().shape

(2816,)

In [42]:
df['society'].value_counts()

society
nan                                                  1056
on request                                            236
shaligram prime                                        54
godrej garden city                                     45
olive greens                                           43
godrej green glades                                    33
ganesh housing malabar county                          24
madhav oeuvre 2                                        24
upcoming new project                                   22
sky elegante                                           22
swati symphony                                         22
nishant ratnaakar verte                                22
savvy swaraaj sports living                            21
saanvi nirman estella                                  18
cloud 9                                                18
nul                                                    17
casa vyoma                                             17
suryam

In [43]:
df.head()

Unnamed: 0,property_name,society,price,rate,price_per_sqft,areaWithType,bedRoom,bathroom,balcony,additionalRoom,address,noOfFloor,facing,agePossession,nearbyLocations,description,furnishDetails,features,rating,property_id,floorNum
0,3 Bedroom House for sale in Ghuma,individual bunglowe,1.25 Crore,"₹ 8,267/sq.ft.",(140 sq.m.) Plot Area,Plot area 168(140.47 sq.m.),3 Bedrooms,3 Bathrooms,1 Balcony,Pooja Room,"Ghuma, Ahmedabad West, Ahmedabad",2 Floors,South-East,5 to 10 Year Old,"['Atm hdfc bank', 'State bank of india sbi ATM...",Are you planning to buy your dream home? You c...,,"['Feng Shui / Vaastu Compliant', 'Visitor Park...","['Lifestyle3.7 out of 5', 'Connectivity4.1 out...",Y66780728,
1,4 Bedroom House for sale in Sanathal,goyal green park,3 Crore,"₹ 8,333/sq.ft.",(334 sq.m.) Plot Area,Plot area 400(334.45 sq.m.)Built Up area: 350 ...,4 Bedrooms,4 Bathrooms,2 Balconies,"Pooja Room,Study Room,Store Room","Sanathal, Ahmedabad West, Ahmedabad",2 Floors,South-West,10+ Year Old,"['Sahyog General Hospital and Nursing Home', '...",A residential bungalows is available for sale ...,,"['Feng Shui / Vaastu Compliant', 'Private Gard...",,V69832032,
2,3 Bedroom House for sale in Kasindra,laxmi residency,,,(156 sq.m.) Built-up Area,,,,,,"Kasindra, Ahmedabad South, Ahmedabad",,,,"['D Mart', 'NH 751', 'Shree SL Patel High Scho...",Laxmi residency is a residential development b...,,,,Y70193200,
3,2 Bedroom House for sale in Dhegam,good times by sangath ipl,,,(64-87 sq.m.) Carpet Area,,,,,,"Dhegam, Gandhinagar, Ahmedabad",,,,,"Sangath good times in dhegam, gandhinagar & sa...",,,,X68471696,
4,5 Bedroom House for sale in Thaltej,anurita bungalows,,,(590 sq.m.) Super built-up Area,,,,,,"Thaltej, Ahmedabad West, Ahmedabad",,,,"['Shilaj Circle', 'Anand Niketan Campus', 'Sci...",Anurita is strategically located at thaltej-Sh...,,,"['Lifestyle4.5 out of 5', 'Connectivity4.3 out...",X70883980,


In [44]:
# price
df['price'].value_counts()

price
45 Lac              171
55 Lac              164
65 Lac              156
75 Lac              152
60 Lac              143
70 Lac              115
50 Lac              109
40 Lac              101
85 Lac               98
1.5 Crore            93
1.1 Crore            90
95 Lac               89
35 Lac               89
80 Lac               87
30 Lac               84
1.25 Crore           76
90 Lac               73
2.5 Crore            67
1 Crore              61
25 Lac               61
3 Crore              61
42 Lac               60
1.4 Crore            60
1.3 Crore            58
2 Crore              58
1.35 Crore           53
3.5 Crore            52
68 Lac               50
1.2 Crore            49
32 Lac               48
58 Lac               48
52 Lac               46
1.75 Crore           45
2.25 Crore           45
48 Lac               45
1.15 Crore           45
72 Lac               43
1.05 Crore           43
1.6 Crore            42
5 Crore              40
38 Lac               40
28 Lac    

In [45]:
df[df['price'] == 'Price on Request']

Unnamed: 0,property_name,society,price,rate,price_per_sqft,areaWithType,bedRoom,bathroom,balcony,additionalRoom,address,noOfFloor,facing,agePossession,nearbyLocations,description,furnishDetails,features,rating,property_id,floorNum
176,3 Bedroom House for sale in Paldi,,Price on Request,,(286 sq.m.) Built-up Area,Built Up area: 342 (285.96 sq.m.),3 Bedrooms,4 Bathrooms,No Balcony,,"Paldi, Paldi, Ahmedabad West, Ahmedabad",2 Floors,,undefined,,3bhk residential house for resale in paldi paldi,"['1 Light', 'No AC', 'No Bed', 'No Chimney', '...",,"['Lifestyle4.3 out of 5', 'Connectivity4.4 out...",N70671330,
443,2 Bedroom House for sale in Shahibaug,,Price on Request,,(142 sq.m.) Built-up Area,Built Up area: 170 (142.14 sq.m.),2 Bedrooms,2 Bathrooms,1 Balcony,,"Shahibuag, Shahibaug, Ahmedabad East, Ahmedabad",1 Floors,,undefined,,2bhk residential house for rent in shahibuag s...,"['1 Light', 'No AC', 'No Bed', 'No Chimney', '...",,"['Lifestyle4.3 out of 5', 'Connectivity4.3 out...",H69220790,
1691,4 Bedroom House for sale in Sabarmati,,Price on Request,,(257 sq.m.) Built-up Area,Built Up area: 257,4 Bedrooms,4 Bathrooms,No Balcony,,"Sabarmati, Sabarmati, Ahmedabad North, Ahmedabad",2 Floors,,undefined,,4bhk residential house for resale in sabarmati...,"['1 Wardrobe', '1 Fan', '1 Light', 'No AC', 'N...",,"['Lifestyle3.7 out of 5', 'Connectivity3.9 out...",M70778912,
1717,3 Bedroom House for sale in Bapunagar,bapunagar one,Price on Request,,(293 sq.m.) Built-up Area,Built Up area: 350 (292.64 sq.m.),3 Bedrooms,1 Bathroom,No Balcony,,"Bapunagar, Bapunagar, Ahmedabad East, Ahmedabad",1 Floors,,undefined,,3bhk residential house for resale in bapunagar...,,,"['Lifestyle3.9 out of 5', 'Connectivity4.1 out...",Z70735232,
1737,2 Bedroom House for sale in Nikol,,Price on Request,,(9 sq.m.) Built-up Area,Built Up area: 100 (9.29 sq.m.),2 Bedrooms,2 Bathrooms,1 Balcony,,"Nikol Naroda Road, Nikol, Ahmedabad East, Ahme...",1 Floors,,undefined,,"2 bath, unfurnished, 1st floor (Of 1), 2 side ...",,,"['Lifestyle4.4 out of 5', 'Connectivity4.3 out...",M70694008,
1740,3 Bedroom House for sale in Vasna,trilokesh riverside park,Price on Request,,(106 sq.m.) Built-up Area,Built Up area: 127 (106.19 sq.m.),3 Bedrooms,1 Bathroom,No Balcony,,"Vasna, Vasna, Ahmedabad West, Ahmedabad",1 Floors,,undefined,,3bhk residential house for resale in riverside...,,,"['Lifestyle4 out of 5', 'Connectivity4.1 out o...",W70692688,
1771,2 Bedroom House for sale in D Cabin,,Price on Request,,(11 sq.m.) Built-up Area,Built Up area: 115 (10.68 sq.m.),2 Bedrooms,2 Bathrooms,1 Balcony,,"D Cabin, Chandkheda, D Cabin, Ahmedabad North,...",1 Floors,North,undefined,,2 bhk duplex row-House in well maintained soci...,"['1 Wardrobe', '1 Fan', '1 Light', 'No AC', 'N...",,"['Lifestyle3.7 out of 5', 'Connectivity3.8 out...",K70617864,
2106,4 Bedroom House for sale in Bopal,,Price on Request,,(337 sq.m.) Built-up Area,Built Up area: 3630 (337.24 sq.m.),4 Bedrooms,4 Bathrooms,3 Balconies,,"Ambli Bopal Road, Bopal, Ahmedabad West, Ahmed...",14 Floors,,undefined,,4bhk penthouse for resale in ambli bopal road ...,,,"['Lifestyle4.2 out of 5', 'Connectivity4.3 out...",C69555368,
2226,3 Bedroom House for sale in Kasindra,,Price on Request,,(186 sq.m.) Built-up Area,Built Up area: 2000 (185.81 sq.m.),3 Bedrooms,1 Bathroom,No Balcony,,"Kasindra, Kasindra, Ahmedabad South, Ahmedabad",1 Floors,,undefined,,Best in class property available at kasindra l...,,,,A69380076,
2289,1 Bedroom House for sale in Saraspur,indiabulls centrum ahmedabad,Price on Request,,(54 sq.m.) Built-up Area,Built Up area: 585 (54.35 sq.m.),1 Bedroom,1 Bathroom,No Balcony,,"Saraspur, Saraspur, Ahmedabad East, Ahmedabad",5 Floors,,undefined,"['Hatkeshwar mandir', 'Visa Hanuman', 'Dwarkad...",1bhk residential house for rent in indiabulls ...,"['1 Light', 'No AC', 'No Bed', 'No Chimney', '...",,"['Lifestyle3.8 out of 5', 'Connectivity3.9 out...",A69209380,


In [46]:
df = df[df['price'] != 'Price on Request']

In [47]:
df.head()

Unnamed: 0,property_name,society,price,rate,price_per_sqft,areaWithType,bedRoom,bathroom,balcony,additionalRoom,address,noOfFloor,facing,agePossession,nearbyLocations,description,furnishDetails,features,rating,property_id,floorNum
0,3 Bedroom House for sale in Ghuma,individual bunglowe,1.25 Crore,"₹ 8,267/sq.ft.",(140 sq.m.) Plot Area,Plot area 168(140.47 sq.m.),3 Bedrooms,3 Bathrooms,1 Balcony,Pooja Room,"Ghuma, Ahmedabad West, Ahmedabad",2 Floors,South-East,5 to 10 Year Old,"['Atm hdfc bank', 'State bank of india sbi ATM...",Are you planning to buy your dream home? You c...,,"['Feng Shui / Vaastu Compliant', 'Visitor Park...","['Lifestyle3.7 out of 5', 'Connectivity4.1 out...",Y66780728,
1,4 Bedroom House for sale in Sanathal,goyal green park,3 Crore,"₹ 8,333/sq.ft.",(334 sq.m.) Plot Area,Plot area 400(334.45 sq.m.)Built Up area: 350 ...,4 Bedrooms,4 Bathrooms,2 Balconies,"Pooja Room,Study Room,Store Room","Sanathal, Ahmedabad West, Ahmedabad",2 Floors,South-West,10+ Year Old,"['Sahyog General Hospital and Nursing Home', '...",A residential bungalows is available for sale ...,,"['Feng Shui / Vaastu Compliant', 'Private Gard...",,V69832032,
2,3 Bedroom House for sale in Kasindra,laxmi residency,,,(156 sq.m.) Built-up Area,,,,,,"Kasindra, Ahmedabad South, Ahmedabad",,,,"['D Mart', 'NH 751', 'Shree SL Patel High Scho...",Laxmi residency is a residential development b...,,,,Y70193200,
3,2 Bedroom House for sale in Dhegam,good times by sangath ipl,,,(64-87 sq.m.) Carpet Area,,,,,,"Dhegam, Gandhinagar, Ahmedabad",,,,,"Sangath good times in dhegam, gandhinagar & sa...",,,,X68471696,
4,5 Bedroom House for sale in Thaltej,anurita bungalows,,,(590 sq.m.) Super built-up Area,,,,,,"Thaltej, Ahmedabad West, Ahmedabad",,,,"['Shilaj Circle', 'Anand Niketan Campus', 'Sci...",Anurita is strategically located at thaltej-Sh...,,,"['Lifestyle4.5 out of 5', 'Connectivity4.3 out...",X70883980,


In [48]:
def treat_price(x):
    if type(x) == float:
        return x
    else:
        if x[1] == 'Lac':
            return round(float(x[0])/100,2)
        else:
            return round(float(x[0]),2)

In [49]:
df['price'] = df['price'].str.split(' ').apply(treat_price)

In [50]:
df.head(5)

Unnamed: 0,property_name,society,price,rate,price_per_sqft,areaWithType,bedRoom,bathroom,balcony,additionalRoom,address,noOfFloor,facing,agePossession,nearbyLocations,description,furnishDetails,features,rating,property_id,floorNum
0,3 Bedroom House for sale in Ghuma,individual bunglowe,1.25,"₹ 8,267/sq.ft.",(140 sq.m.) Plot Area,Plot area 168(140.47 sq.m.),3 Bedrooms,3 Bathrooms,1 Balcony,Pooja Room,"Ghuma, Ahmedabad West, Ahmedabad",2 Floors,South-East,5 to 10 Year Old,"['Atm hdfc bank', 'State bank of india sbi ATM...",Are you planning to buy your dream home? You c...,,"['Feng Shui / Vaastu Compliant', 'Visitor Park...","['Lifestyle3.7 out of 5', 'Connectivity4.1 out...",Y66780728,
1,4 Bedroom House for sale in Sanathal,goyal green park,3.0,"₹ 8,333/sq.ft.",(334 sq.m.) Plot Area,Plot area 400(334.45 sq.m.)Built Up area: 350 ...,4 Bedrooms,4 Bathrooms,2 Balconies,"Pooja Room,Study Room,Store Room","Sanathal, Ahmedabad West, Ahmedabad",2 Floors,South-West,10+ Year Old,"['Sahyog General Hospital and Nursing Home', '...",A residential bungalows is available for sale ...,,"['Feng Shui / Vaastu Compliant', 'Private Gard...",,V69832032,
2,3 Bedroom House for sale in Kasindra,laxmi residency,,,(156 sq.m.) Built-up Area,,,,,,"Kasindra, Ahmedabad South, Ahmedabad",,,,"['D Mart', 'NH 751', 'Shree SL Patel High Scho...",Laxmi residency is a residential development b...,,,,Y70193200,
3,2 Bedroom House for sale in Dhegam,good times by sangath ipl,,,(64-87 sq.m.) Carpet Area,,,,,,"Dhegam, Gandhinagar, Ahmedabad",,,,,"Sangath good times in dhegam, gandhinagar & sa...",,,,X68471696,
4,5 Bedroom House for sale in Thaltej,anurita bungalows,,,(590 sq.m.) Super built-up Area,,,,,,"Thaltej, Ahmedabad West, Ahmedabad",,,,"['Shilaj Circle', 'Anand Niketan Campus', 'Sci...",Anurita is strategically located at thaltej-Sh...,,,"['Lifestyle4.5 out of 5', 'Connectivity4.3 out...",X70883980,


In [51]:
# price_per_sqft
df['price_per_sqft'].value_counts()

price_per_sqft
(167 sq.m.) Plot Area                  63
(251 sq.m.) Plot Area                  46
(84 sq.m.) Plot Area                   36
₹ 4,444/sq.ft.                         34
(125 sq.m.) Plot Area                  34
(209 sq.m.) Plot Area                  32
₹ 4,000/sq.ft.                         29
₹ 5,000/sq.ft.                         29
(334 sq.m.) Plot Area                  26
(201 sq.m.) Plot Area                  22
₹ 3,333/sq.ft.                         22
(93 sq.m.) Plot Area                   20
(100 sq.m.) Plot Area                  19
(176 sq.m.) Plot Area                  19
(111 sq.m.) Plot Area                  18
(151 sq.m.) Plot Area                  18
(142 sq.m.) Plot Area                  18
(234 sq.m.) Plot Area                  18
₹ 7,200/sq.ft.                         17
(139 sq.m.) Plot Area                  17
(502 sq.m.) Plot Area                  17
₹ 6,666/sq.ft.                         16
₹ 7,500/sq.ft.                         16
₹ 8,000/sq.ft.     

In [52]:
df['price_per_sqft'] = df['price_per_sqft'].str.split('/').str.get(0).str.replace('₹','').str.replace(',','').str.strip().astype('float')

ValueError: could not convert string to float: '(140 sq.m.) Plot Area'

In [None]:
df.head()

In [None]:
# bedrooms
df['bedRoom'].value_counts()

In [53]:
df[df['bedRoom'].isnull()]

Unnamed: 0,property_name,society,price,rate,price_per_sqft,areaWithType,bedRoom,bathroom,balcony,additionalRoom,address,noOfFloor,facing,agePossession,nearbyLocations,description,furnishDetails,features,rating,property_id,floorNum
2,3 Bedroom House for sale in Kasindra,laxmi residency,,,(156 sq.m.) Built-up Area,,,,,,"Kasindra, Ahmedabad South, Ahmedabad",,,,"['D Mart', 'NH 751', 'Shree SL Patel High Scho...",Laxmi residency is a residential development b...,,,,Y70193200,
3,2 Bedroom House for sale in Dhegam,good times by sangath ipl,,,(64-87 sq.m.) Carpet Area,,,,,,"Dhegam, Gandhinagar, Ahmedabad",,,,,"Sangath good times in dhegam, gandhinagar & sa...",,,,X68471696,
4,5 Bedroom House for sale in Thaltej,anurita bungalows,,,(590 sq.m.) Super built-up Area,,,,,,"Thaltej, Ahmedabad West, Ahmedabad",,,,"['Shilaj Circle', 'Anand Niketan Campus', 'Sci...",Anurita is strategically located at thaltej-Sh...,,,"['Lifestyle4.5 out of 5', 'Connectivity4.3 out...",X70883980,
5,4 Bedroom House for sale in Thaltej,anurita bungalows,,,(559 sq.m.) Super built-up Area,,,,,,"Thaltej, Ahmedabad West, Ahmedabad",,,,"['Shilaj Circle', 'Anand Niketan Campus', 'Sci...",Anurita is strategically located at thaltej-Sh...,,,"['Lifestyle4.5 out of 5', 'Connectivity4.3 out...",D70883978,
6,5 Bedroom House for sale in Sargasan,saamarth city,,,(737 sq.m.) Built-up Area,,,,,,"Sargasan, Gandhinagar, Ahmedabad",,,,"['Shree Mahakali Mataji Temple', 'Shree Verai ...",Saamarth city at well developed area of gandhi...,,,"['Lifestyle4.1 out of 5', 'Connectivity4.2 out...",D68100884,
7,4 Bedroom House for sale in Sargasan,saamarth city,,,(439-710 sq.m.) Built-up Area,,,,,,"Sargasan, Gandhinagar, Ahmedabad",,,,"['Shree Mahakali Mataji Temple', 'Shree Verai ...",Saamarth city at well developed area of gandhi...,,,"['Lifestyle4.1 out of 5', 'Connectivity4.2 out...",P68100882,
8,5 Bedroom House for sale in Raysan,saamarth lavish villa,,,(760-772 sq.m.) Built-up Area,,,,,,"Raysan, Gandhinagar, Ahmedabad",,,,"['Metro Station', 'Jain Derasar', 'Ahmedabad H...","At saamarth lavish villa, right from choosing ...",,,"['Lifestyle3.9 out of 5', 'Connectivity3.8 out...",S69403456,
9,4 Bedroom House for sale in Raysan,saamarth lavish villa,,,(498-718 sq.m.) Built-up Area,,,,,,"Raysan, Gandhinagar, Ahmedabad",,,,"['Metro Station', 'Jain Derasar', 'Ahmedabad H...","At saamarth lavish villa, right from choosing ...",,,"['Lifestyle3.9 out of 5', 'Connectivity3.8 out...",V69403454,
10,5 Bedroom House for sale in Shilaj,swagat bagan ville,,,(347-430 sq.m.) Carpet Area,,,,,,"Shilaj, Ahmedabad West, Ahmedabad",,,,"['Excellent Academy', 'Amrut Indian School', '...","Swagat bagan ville in shilaj, ahmedabad west b...",,,"['Lifestyle3.8 out of 5', 'Connectivity4 out o...",C70059662,
11,2 Bedroom House for sale in Agol,shades of nature,,,(184 sq.m.) Super built-up Area,,,,,,"Agol, Ahmedabad West, Ahmedabad",,,,"['New Karnavati Club', 'New Rajpath Club', 'Th...","Lavish, is the only way to describe these beau...",,,,V70686380,


In [54]:
df = df[~df['bedRoom'].isnull()]

In [55]:
df['bedRoom'] = df['bedRoom'].str.split(' ').str.get(0).astype('int')

In [56]:
df.head()

Unnamed: 0,property_name,society,price,rate,price_per_sqft,areaWithType,bedRoom,bathroom,balcony,additionalRoom,address,noOfFloor,facing,agePossession,nearbyLocations,description,furnishDetails,features,rating,property_id,floorNum
0,3 Bedroom House for sale in Ghuma,individual bunglowe,1.25,"₹ 8,267/sq.ft.",(140 sq.m.) Plot Area,Plot area 168(140.47 sq.m.),3,3 Bathrooms,1 Balcony,Pooja Room,"Ghuma, Ahmedabad West, Ahmedabad",2 Floors,South-East,5 to 10 Year Old,"['Atm hdfc bank', 'State bank of india sbi ATM...",Are you planning to buy your dream home? You c...,,"['Feng Shui / Vaastu Compliant', 'Visitor Park...","['Lifestyle3.7 out of 5', 'Connectivity4.1 out...",Y66780728,
1,4 Bedroom House for sale in Sanathal,goyal green park,3.0,"₹ 8,333/sq.ft.",(334 sq.m.) Plot Area,Plot area 400(334.45 sq.m.)Built Up area: 350 ...,4,4 Bathrooms,2 Balconies,"Pooja Room,Study Room,Store Room","Sanathal, Ahmedabad West, Ahmedabad",2 Floors,South-West,10+ Year Old,"['Sahyog General Hospital and Nursing Home', '...",A residential bungalows is available for sale ...,,"['Feng Shui / Vaastu Compliant', 'Private Gard...",,V69832032,
13,3 Bedroom House for sale in Randheja,maruti nandan green,0.8,"₹ 4,400/sq.ft.",(169 sq.m.) Plot Area,Plot area 202(168.9 sq.m.),3,4 Bathrooms,1 Balcony,Pooja Room,"Randheja, Gandhinagar, Ahmedabad",2 Floors,North-East,Under Construction,,Check out this 3 bhk house for sale in randhej...,,,,W68654880,
18,3 Bedroom House for sale in Bopal,"b/37, jahanvi bungalows",3.2,"₹ 37,427/sq.ft.",(309 sq.m.) Plot Area,Plot area 370(309.37 sq.m.)Built Up area: 176 ...,3,3 Bathrooms,2 Balconies,,"B/37, Bopal, Ahmedabad West, Ahmedabad",3 Floors,North,10+ Year Old,"['Icici ATM', 'Hdfc ATM', 'Atm hdfc bank', 'Ax...",An impeccable opportunity is here for those wh...,"['4 Wardrobe', '13 Fan', '1 Exhaust Fan', '2 G...","['Private Garden / Terrace', 'Water purifier',...","['Lifestyle4.2 out of 5', 'Connectivity4.3 out...",U69163438,
19,5 Bedroom House for sale in Enasan,akash grand city,4.35,"₹ 8,606/sq.ft.",(486 sq.m.) Plot Area,Plot area 581(485.79 sq.m.),5,6 Bathrooms,1 Balcony,,"Enasan, Ahmedabad North, Ahmedabad",2 Floors,,1 to 5 Year Old,,I have a house/villa available for sale in ena...,[],['Club house / Community Center'],,M68168346,


In [57]:
# bathroom
df['bathroom'].value_counts()

bathroom
2 Bathrooms     2332
3 Bathrooms     2060
4 Bathrooms     1206
1 Bathroom       569
5 Bathrooms      318
6 Bathrooms       65
7 Bathrooms       13
8 Bathrooms        9
10 Bathrooms       4
9 Bathrooms        2
16 Bathrooms       1
Name: count, dtype: int64

In [58]:
df['bathroom'].isnull().sum()

0

In [59]:
df['bathroom'] = df['bathroom'].str.split(' ').str.get(0).astype('int')

In [60]:
df.head()

Unnamed: 0,property_name,society,price,rate,price_per_sqft,areaWithType,bedRoom,bathroom,balcony,additionalRoom,address,noOfFloor,facing,agePossession,nearbyLocations,description,furnishDetails,features,rating,property_id,floorNum
0,3 Bedroom House for sale in Ghuma,individual bunglowe,1.25,"₹ 8,267/sq.ft.",(140 sq.m.) Plot Area,Plot area 168(140.47 sq.m.),3,3,1 Balcony,Pooja Room,"Ghuma, Ahmedabad West, Ahmedabad",2 Floors,South-East,5 to 10 Year Old,"['Atm hdfc bank', 'State bank of india sbi ATM...",Are you planning to buy your dream home? You c...,,"['Feng Shui / Vaastu Compliant', 'Visitor Park...","['Lifestyle3.7 out of 5', 'Connectivity4.1 out...",Y66780728,
1,4 Bedroom House for sale in Sanathal,goyal green park,3.0,"₹ 8,333/sq.ft.",(334 sq.m.) Plot Area,Plot area 400(334.45 sq.m.)Built Up area: 350 ...,4,4,2 Balconies,"Pooja Room,Study Room,Store Room","Sanathal, Ahmedabad West, Ahmedabad",2 Floors,South-West,10+ Year Old,"['Sahyog General Hospital and Nursing Home', '...",A residential bungalows is available for sale ...,,"['Feng Shui / Vaastu Compliant', 'Private Gard...",,V69832032,
13,3 Bedroom House for sale in Randheja,maruti nandan green,0.8,"₹ 4,400/sq.ft.",(169 sq.m.) Plot Area,Plot area 202(168.9 sq.m.),3,4,1 Balcony,Pooja Room,"Randheja, Gandhinagar, Ahmedabad",2 Floors,North-East,Under Construction,,Check out this 3 bhk house for sale in randhej...,,,,W68654880,
18,3 Bedroom House for sale in Bopal,"b/37, jahanvi bungalows",3.2,"₹ 37,427/sq.ft.",(309 sq.m.) Plot Area,Plot area 370(309.37 sq.m.)Built Up area: 176 ...,3,3,2 Balconies,,"B/37, Bopal, Ahmedabad West, Ahmedabad",3 Floors,North,10+ Year Old,"['Icici ATM', 'Hdfc ATM', 'Atm hdfc bank', 'Ax...",An impeccable opportunity is here for those wh...,"['4 Wardrobe', '13 Fan', '1 Exhaust Fan', '2 G...","['Private Garden / Terrace', 'Water purifier',...","['Lifestyle4.2 out of 5', 'Connectivity4.3 out...",U69163438,
19,5 Bedroom House for sale in Enasan,akash grand city,4.35,"₹ 8,606/sq.ft.",(486 sq.m.) Plot Area,Plot area 581(485.79 sq.m.),5,6,1 Balcony,,"Enasan, Ahmedabad North, Ahmedabad",2 Floors,,1 to 5 Year Old,,I have a house/villa available for sale in ena...,[],['Club house / Community Center'],,M68168346,


In [61]:
# balcony
df['balcony'].value_counts()

balcony
1 Balcony       3063
2 Balconies     2001
No Balcony       719
3 Balconies      619
3+ Balconies     177
Name: count, dtype: int64

In [62]:
df['balcony'].isnull().sum()

0

In [63]:
df['balcony'] = df['balcony'].str.split(' ').str.get(0).str.replace('No','0')

In [64]:
df.head()

Unnamed: 0,property_name,society,price,rate,price_per_sqft,areaWithType,bedRoom,bathroom,balcony,additionalRoom,address,noOfFloor,facing,agePossession,nearbyLocations,description,furnishDetails,features,rating,property_id,floorNum
0,3 Bedroom House for sale in Ghuma,individual bunglowe,1.25,"₹ 8,267/sq.ft.",(140 sq.m.) Plot Area,Plot area 168(140.47 sq.m.),3,3,1,Pooja Room,"Ghuma, Ahmedabad West, Ahmedabad",2 Floors,South-East,5 to 10 Year Old,"['Atm hdfc bank', 'State bank of india sbi ATM...",Are you planning to buy your dream home? You c...,,"['Feng Shui / Vaastu Compliant', 'Visitor Park...","['Lifestyle3.7 out of 5', 'Connectivity4.1 out...",Y66780728,
1,4 Bedroom House for sale in Sanathal,goyal green park,3.0,"₹ 8,333/sq.ft.",(334 sq.m.) Plot Area,Plot area 400(334.45 sq.m.)Built Up area: 350 ...,4,4,2,"Pooja Room,Study Room,Store Room","Sanathal, Ahmedabad West, Ahmedabad",2 Floors,South-West,10+ Year Old,"['Sahyog General Hospital and Nursing Home', '...",A residential bungalows is available for sale ...,,"['Feng Shui / Vaastu Compliant', 'Private Gard...",,V69832032,
13,3 Bedroom House for sale in Randheja,maruti nandan green,0.8,"₹ 4,400/sq.ft.",(169 sq.m.) Plot Area,Plot area 202(168.9 sq.m.),3,4,1,Pooja Room,"Randheja, Gandhinagar, Ahmedabad",2 Floors,North-East,Under Construction,,Check out this 3 bhk house for sale in randhej...,,,,W68654880,
18,3 Bedroom House for sale in Bopal,"b/37, jahanvi bungalows",3.2,"₹ 37,427/sq.ft.",(309 sq.m.) Plot Area,Plot area 370(309.37 sq.m.)Built Up area: 176 ...,3,3,2,,"B/37, Bopal, Ahmedabad West, Ahmedabad",3 Floors,North,10+ Year Old,"['Icici ATM', 'Hdfc ATM', 'Atm hdfc bank', 'Ax...",An impeccable opportunity is here for those wh...,"['4 Wardrobe', '13 Fan', '1 Exhaust Fan', '2 G...","['Private Garden / Terrace', 'Water purifier',...","['Lifestyle4.2 out of 5', 'Connectivity4.3 out...",U69163438,
19,5 Bedroom House for sale in Enasan,akash grand city,4.35,"₹ 8,606/sq.ft.",(486 sq.m.) Plot Area,Plot area 581(485.79 sq.m.),5,6,1,,"Enasan, Ahmedabad North, Ahmedabad",2 Floors,,1 to 5 Year Old,,I have a house/villa available for sale in ena...,[],['Club house / Community Center'],,M68168346,


In [65]:
# additionalRoom
df['additionalRoom'].value_counts()

additionalRoom
Store Room                                              876
Others                                                  476
Pooja Room                                              312
Pooja Room,Study Room,Store Room                        253
Pooja Room,Store Room                                   235
Pooja Room,Store Room,Study Room                        193
Pooja Room,Study Room,Servant Room,Store Room           140
Pooja Room,Study Room                                   128
Store Room,Pooja Room                                   111
Study Room                                               75
Pooja Room,Others                                        69
Pooja Room,Study Room,Servant Room,Others                65
Pooja Room,Study Room,Others                             54
Pooja Room,Study Room,Servant Room                       53
Servant Room                                             43
Study Room,Store Room                                    36
Pooja Room,Store Room,Stu

In [66]:
df['additionalRoom'].value_counts().shape

(73,)

In [67]:
df['additionalRoom'].isnull().sum()

3074

In [68]:
df['additionalRoom'].fillna('not available',inplace=True)

In [69]:
df['additionalRoom'] = df['additionalRoom'].str.lower()

In [70]:
df.head()

Unnamed: 0,property_name,society,price,rate,price_per_sqft,areaWithType,bedRoom,bathroom,balcony,additionalRoom,address,noOfFloor,facing,agePossession,nearbyLocations,description,furnishDetails,features,rating,property_id,floorNum
0,3 Bedroom House for sale in Ghuma,individual bunglowe,1.25,"₹ 8,267/sq.ft.",(140 sq.m.) Plot Area,Plot area 168(140.47 sq.m.),3,3,1,pooja room,"Ghuma, Ahmedabad West, Ahmedabad",2 Floors,South-East,5 to 10 Year Old,"['Atm hdfc bank', 'State bank of india sbi ATM...",Are you planning to buy your dream home? You c...,,"['Feng Shui / Vaastu Compliant', 'Visitor Park...","['Lifestyle3.7 out of 5', 'Connectivity4.1 out...",Y66780728,
1,4 Bedroom House for sale in Sanathal,goyal green park,3.0,"₹ 8,333/sq.ft.",(334 sq.m.) Plot Area,Plot area 400(334.45 sq.m.)Built Up area: 350 ...,4,4,2,"pooja room,study room,store room","Sanathal, Ahmedabad West, Ahmedabad",2 Floors,South-West,10+ Year Old,"['Sahyog General Hospital and Nursing Home', '...",A residential bungalows is available for sale ...,,"['Feng Shui / Vaastu Compliant', 'Private Gard...",,V69832032,
13,3 Bedroom House for sale in Randheja,maruti nandan green,0.8,"₹ 4,400/sq.ft.",(169 sq.m.) Plot Area,Plot area 202(168.9 sq.m.),3,4,1,pooja room,"Randheja, Gandhinagar, Ahmedabad",2 Floors,North-East,Under Construction,,Check out this 3 bhk house for sale in randhej...,,,,W68654880,
18,3 Bedroom House for sale in Bopal,"b/37, jahanvi bungalows",3.2,"₹ 37,427/sq.ft.",(309 sq.m.) Plot Area,Plot area 370(309.37 sq.m.)Built Up area: 176 ...,3,3,2,not available,"B/37, Bopal, Ahmedabad West, Ahmedabad",3 Floors,North,10+ Year Old,"['Icici ATM', 'Hdfc ATM', 'Atm hdfc bank', 'Ax...",An impeccable opportunity is here for those wh...,"['4 Wardrobe', '13 Fan', '1 Exhaust Fan', '2 G...","['Private Garden / Terrace', 'Water purifier',...","['Lifestyle4.2 out of 5', 'Connectivity4.3 out...",U69163438,
19,5 Bedroom House for sale in Enasan,akash grand city,4.35,"₹ 8,606/sq.ft.",(486 sq.m.) Plot Area,Plot area 581(485.79 sq.m.),5,6,1,not available,"Enasan, Ahmedabad North, Ahmedabad",2 Floors,,1 to 5 Year Old,,I have a house/villa available for sale in ena...,[],['Club house / Community Center'],,M68168346,


In [71]:
# floor num
df['floorNum']

0                             NaN
1                             NaN
13                            NaN
18                            NaN
19                            NaN
23                            NaN
24                            NaN
25                            NaN
26                            NaN
28                            NaN
29                            NaN
30                            NaN
31                            NaN
32                            NaN
33                            NaN
37                            NaN
38                            NaN
39                            NaN
40                            NaN
48                            NaN
49                            NaN
50                            NaN
51                            NaN
52                            NaN
53                            NaN
54                            NaN
56                            NaN
57                            NaN
58                            NaN
59            

In [72]:
df['floorNum'].isnull().sum()

2452

In [73]:
df[df['floorNum'].isnull()]

Unnamed: 0,property_name,society,price,rate,price_per_sqft,areaWithType,bedRoom,bathroom,balcony,additionalRoom,address,noOfFloor,facing,agePossession,nearbyLocations,description,furnishDetails,features,rating,property_id,floorNum
0,3 Bedroom House for sale in Ghuma,individual bunglowe,1.25,"₹ 8,267/sq.ft.",(140 sq.m.) Plot Area,Plot area 168(140.47 sq.m.),3,3,1,pooja room,"Ghuma, Ahmedabad West, Ahmedabad",2 Floors,South-East,5 to 10 Year Old,"['Atm hdfc bank', 'State bank of india sbi ATM...",Are you planning to buy your dream home? You c...,,"['Feng Shui / Vaastu Compliant', 'Visitor Park...","['Lifestyle3.7 out of 5', 'Connectivity4.1 out...",Y66780728,
1,4 Bedroom House for sale in Sanathal,goyal green park,3.0,"₹ 8,333/sq.ft.",(334 sq.m.) Plot Area,Plot area 400(334.45 sq.m.)Built Up area: 350 ...,4,4,2,"pooja room,study room,store room","Sanathal, Ahmedabad West, Ahmedabad",2 Floors,South-West,10+ Year Old,"['Sahyog General Hospital and Nursing Home', '...",A residential bungalows is available for sale ...,,"['Feng Shui / Vaastu Compliant', 'Private Gard...",,V69832032,
13,3 Bedroom House for sale in Randheja,maruti nandan green,0.8,"₹ 4,400/sq.ft.",(169 sq.m.) Plot Area,Plot area 202(168.9 sq.m.),3,4,1,pooja room,"Randheja, Gandhinagar, Ahmedabad",2 Floors,North-East,Under Construction,,Check out this 3 bhk house for sale in randhej...,,,,W68654880,
18,3 Bedroom House for sale in Bopal,"b/37, jahanvi bungalows",3.2,"₹ 37,427/sq.ft.",(309 sq.m.) Plot Area,Plot area 370(309.37 sq.m.)Built Up area: 176 ...,3,3,2,not available,"B/37, Bopal, Ahmedabad West, Ahmedabad",3 Floors,North,10+ Year Old,"['Icici ATM', 'Hdfc ATM', 'Atm hdfc bank', 'Ax...",An impeccable opportunity is here for those wh...,"['4 Wardrobe', '13 Fan', '1 Exhaust Fan', '2 G...","['Private Garden / Terrace', 'Water purifier',...","['Lifestyle4.2 out of 5', 'Connectivity4.3 out...",U69163438,
19,5 Bedroom House for sale in Enasan,akash grand city,4.35,"₹ 8,606/sq.ft.",(486 sq.m.) Plot Area,Plot area 581(485.79 sq.m.),5,6,1,not available,"Enasan, Ahmedabad North, Ahmedabad",2 Floors,,1 to 5 Year Old,,I have a house/villa available for sale in ena...,[],['Club house / Community Center'],,M68168346,
23,4 Bedroom House for sale in Khoraj,sentossa greens 88 b,4.45,"₹ 7,607/sq.ft.",(543 sq.m.) Plot Area,Plot area 650(543.48 sq.m.),4,5,2,not available,"Khoraj, Gandhinagar, Ahmedabad",3 Floors,North-East,1 to 5 Year Old,"['ISKON Temple', 'Paramdham Temple', 'Prerna T...",Stunning independent house villa for sale in s...,[],,,I70268328,
24,6 Bedroom House for sale in Sabarmati,,3.95,"₹ 15,007/sq.ft.",(260 sq.m.) Plot Area,Plot area 260,6,6,3+,"others,store room","Sabarmati, Ahmedabad North, Ahmedabad",3 Floors,North-East,10+ Year Old,"['Dharmeshawar Mahadev Temple', 'Vaishno Devi ...",Stunning independent house villa for sale in s...,"['6 Wardrobe', '9 Fan', '2 Geyser', '23 Light'...","['Feng Shui / Vaastu Compliant', 'High Ceiling...","['Lifestyle3.7 out of 5', 'Connectivity3.9 out...",T68736686,
25,3 Bedroom House for sale in Bhadaj,supercity glory,3.65,"₹ 11,721/sq.ft.",(289 sq.m.) Plot Area,Plot area 346(289.3 sq.m.),3,4,1,pooja room,"Bhadaj, Ahmedabad West, Ahmedabad",2 Floors,,0 to 1 Year Old,,New independent house for sale,,"['Private Garden / Terrace', 'Water Storage', ...",,S66292738,
26,3 Bedroom House for sale in Sanathal,pacifica the meadows,1.75,"₹ 7,936/sq.ft.",(176 sq.m.) Plot Area,Plot area 211(176.42 sq.m.)Built Up area: 245 ...,3,4,1,pooja room,"Sanathal, Ahmedabad West, Ahmedabad",2 Floors,West,5 to 10 Year Old,"['Eklavya School', 'Jogmaya temple', 'ICICI AT...",All bedrooms have daikin 1.5t acs installed. M...,"['6 Wardrobe', '3 Bed', '1 Water Purifier', '8...","['Water purifier', 'No open drainage around', ...",,F66827424,
28,2 Bedroom House for sale in Bavla,bellevue vieraaa by davda infra,0.5,"₹ 3,472/sq.ft.",(134 sq.m.) Plot Area,Plot area 160(133.78 sq.m.),2,3,1,not available,"413, Bavla, Ahmedabad South, Ahmedabad",2 Floors,East,1 to 5 Year Old,"['Brand Factory', 'Sun Avenue', 'New Samarath ...","East facing, vastu compliance peace ful area\n...",,"['Private Garden / Terrace', 'Maintenance Staf...","['Lifestyle3.5 out of 5', 'Connectivity3.8 out...",E67509880,


In [74]:
df['floorNum'] = df['floorNum'].str.split(' ').str.get(0).replace('Ground','0').str.replace('Basement','-1').str.replace('Lower','0').str.extract(r'(\d+)')

In [75]:
df.head()

Unnamed: 0,property_name,society,price,rate,price_per_sqft,areaWithType,bedRoom,bathroom,balcony,additionalRoom,address,noOfFloor,facing,agePossession,nearbyLocations,description,furnishDetails,features,rating,property_id,floorNum
0,3 Bedroom House for sale in Ghuma,individual bunglowe,1.25,"₹ 8,267/sq.ft.",(140 sq.m.) Plot Area,Plot area 168(140.47 sq.m.),3,3,1,pooja room,"Ghuma, Ahmedabad West, Ahmedabad",2 Floors,South-East,5 to 10 Year Old,"['Atm hdfc bank', 'State bank of india sbi ATM...",Are you planning to buy your dream home? You c...,,"['Feng Shui / Vaastu Compliant', 'Visitor Park...","['Lifestyle3.7 out of 5', 'Connectivity4.1 out...",Y66780728,
1,4 Bedroom House for sale in Sanathal,goyal green park,3.0,"₹ 8,333/sq.ft.",(334 sq.m.) Plot Area,Plot area 400(334.45 sq.m.)Built Up area: 350 ...,4,4,2,"pooja room,study room,store room","Sanathal, Ahmedabad West, Ahmedabad",2 Floors,South-West,10+ Year Old,"['Sahyog General Hospital and Nursing Home', '...",A residential bungalows is available for sale ...,,"['Feng Shui / Vaastu Compliant', 'Private Gard...",,V69832032,
13,3 Bedroom House for sale in Randheja,maruti nandan green,0.8,"₹ 4,400/sq.ft.",(169 sq.m.) Plot Area,Plot area 202(168.9 sq.m.),3,4,1,pooja room,"Randheja, Gandhinagar, Ahmedabad",2 Floors,North-East,Under Construction,,Check out this 3 bhk house for sale in randhej...,,,,W68654880,
18,3 Bedroom House for sale in Bopal,"b/37, jahanvi bungalows",3.2,"₹ 37,427/sq.ft.",(309 sq.m.) Plot Area,Plot area 370(309.37 sq.m.)Built Up area: 176 ...,3,3,2,not available,"B/37, Bopal, Ahmedabad West, Ahmedabad",3 Floors,North,10+ Year Old,"['Icici ATM', 'Hdfc ATM', 'Atm hdfc bank', 'Ax...",An impeccable opportunity is here for those wh...,"['4 Wardrobe', '13 Fan', '1 Exhaust Fan', '2 G...","['Private Garden / Terrace', 'Water purifier',...","['Lifestyle4.2 out of 5', 'Connectivity4.3 out...",U69163438,
19,5 Bedroom House for sale in Enasan,akash grand city,4.35,"₹ 8,606/sq.ft.",(486 sq.m.) Plot Area,Plot area 581(485.79 sq.m.),5,6,1,not available,"Enasan, Ahmedabad North, Ahmedabad",2 Floors,,1 to 5 Year Old,,I have a house/villa available for sale in ena...,[],['Club house / Community Center'],,M68168346,


In [76]:
# facing
df['facing'].value_counts()

facing
East          2210
North-East     668
West           645
North          406
North-West     226
South          136
South-West     124
South-East     115
Name: count, dtype: int64

In [77]:
df['facing'].isnull().sum()

2049

In [78]:
df['facing'].fillna('NA',inplace=True)

In [79]:
df['facing'].value_counts()

facing
East          2210
NA            2049
North-East     668
West           645
North          406
North-West     226
South          136
South-West     124
South-East     115
Name: count, dtype: int64

In [85]:
df.head()

Unnamed: 0,property_name,society,price,rate,price_per_sqft,areaWithType,bedRoom,bathroom,balcony,additionalRoom,address,noOfFloor,facing,agePossession,nearbyLocations,description,furnishDetails,features,rating,property_id,floorNum
0,3 Bedroom House for sale in Ghuma,individual bunglowe,1.25,"₹ 8,267/sq.ft.",(140 sq.m.) Plot Area,Plot area 168(140.47 sq.m.),3,3,1,pooja room,"Ghuma, Ahmedabad West, Ahmedabad",2 Floors,South-East,5 to 10 Year Old,"['Atm hdfc bank', 'State bank of india sbi ATM...",Are you planning to buy your dream home? You c...,,"['Feng Shui / Vaastu Compliant', 'Visitor Park...","['Lifestyle3.7 out of 5', 'Connectivity4.1 out...",Y66780728,
1,4 Bedroom House for sale in Sanathal,goyal green park,3.0,"₹ 8,333/sq.ft.",(334 sq.m.) Plot Area,Plot area 400(334.45 sq.m.)Built Up area: 350 ...,4,4,2,"pooja room,study room,store room","Sanathal, Ahmedabad West, Ahmedabad",2 Floors,South-West,10+ Year Old,"['Sahyog General Hospital and Nursing Home', '...",A residential bungalows is available for sale ...,,"['Feng Shui / Vaastu Compliant', 'Private Gard...",,V69832032,
13,3 Bedroom House for sale in Randheja,maruti nandan green,0.8,"₹ 4,400/sq.ft.",(169 sq.m.) Plot Area,Plot area 202(168.9 sq.m.),3,4,1,pooja room,"Randheja, Gandhinagar, Ahmedabad",2 Floors,North-East,Under Construction,,Check out this 3 bhk house for sale in randhej...,,,,W68654880,
18,3 Bedroom House for sale in Bopal,"b/37, jahanvi bungalows",3.2,"₹ 37,427/sq.ft.",(309 sq.m.) Plot Area,Plot area 370(309.37 sq.m.)Built Up area: 176 ...,3,3,2,not available,"B/37, Bopal, Ahmedabad West, Ahmedabad",3 Floors,North,10+ Year Old,"['Icici ATM', 'Hdfc ATM', 'Atm hdfc bank', 'Ax...",An impeccable opportunity is here for those wh...,"['4 Wardrobe', '13 Fan', '1 Exhaust Fan', '2 G...","['Private Garden / Terrace', 'Water purifier',...","['Lifestyle4.2 out of 5', 'Connectivity4.3 out...",U69163438,
19,5 Bedroom House for sale in Enasan,akash grand city,4.35,"₹ 8,606/sq.ft.",(486 sq.m.) Plot Area,Plot area 581(485.79 sq.m.),5,6,1,not available,"Enasan, Ahmedabad North, Ahmedabad",2 Floors,,1 to 5 Year Old,,I have a house/villa available for sale in ena...,[],['Club house / Community Center'],,M68168346,


In [80]:
df.insert(loc=4,column='area',value=round((df['price']*10000000)/df['price_per_sqft']))

TypeError: unsupported operand type(s) for /: 'float' and 'str'

In [None]:
df.insert(loc=1,column='property_type',value='flat')

In [81]:
df.head()

Unnamed: 0,property_name,society,price,rate,price_per_sqft,areaWithType,bedRoom,bathroom,balcony,additionalRoom,address,noOfFloor,facing,agePossession,nearbyLocations,description,furnishDetails,features,rating,property_id,floorNum
0,3 Bedroom House for sale in Ghuma,individual bunglowe,1.25,"₹ 8,267/sq.ft.",(140 sq.m.) Plot Area,Plot area 168(140.47 sq.m.),3,3,1,pooja room,"Ghuma, Ahmedabad West, Ahmedabad",2 Floors,South-East,5 to 10 Year Old,"['Atm hdfc bank', 'State bank of india sbi ATM...",Are you planning to buy your dream home? You c...,,"['Feng Shui / Vaastu Compliant', 'Visitor Park...","['Lifestyle3.7 out of 5', 'Connectivity4.1 out...",Y66780728,
1,4 Bedroom House for sale in Sanathal,goyal green park,3.0,"₹ 8,333/sq.ft.",(334 sq.m.) Plot Area,Plot area 400(334.45 sq.m.)Built Up area: 350 ...,4,4,2,"pooja room,study room,store room","Sanathal, Ahmedabad West, Ahmedabad",2 Floors,South-West,10+ Year Old,"['Sahyog General Hospital and Nursing Home', '...",A residential bungalows is available for sale ...,,"['Feng Shui / Vaastu Compliant', 'Private Gard...",,V69832032,
13,3 Bedroom House for sale in Randheja,maruti nandan green,0.8,"₹ 4,400/sq.ft.",(169 sq.m.) Plot Area,Plot area 202(168.9 sq.m.),3,4,1,pooja room,"Randheja, Gandhinagar, Ahmedabad",2 Floors,North-East,Under Construction,,Check out this 3 bhk house for sale in randhej...,,,,W68654880,
18,3 Bedroom House for sale in Bopal,"b/37, jahanvi bungalows",3.2,"₹ 37,427/sq.ft.",(309 sq.m.) Plot Area,Plot area 370(309.37 sq.m.)Built Up area: 176 ...,3,3,2,not available,"B/37, Bopal, Ahmedabad West, Ahmedabad",3 Floors,North,10+ Year Old,"['Icici ATM', 'Hdfc ATM', 'Atm hdfc bank', 'Ax...",An impeccable opportunity is here for those wh...,"['4 Wardrobe', '13 Fan', '1 Exhaust Fan', '2 G...","['Private Garden / Terrace', 'Water purifier',...","['Lifestyle4.2 out of 5', 'Connectivity4.3 out...",U69163438,
19,5 Bedroom House for sale in Enasan,akash grand city,4.35,"₹ 8,606/sq.ft.",(486 sq.m.) Plot Area,Plot area 581(485.79 sq.m.),5,6,1,not available,"Enasan, Ahmedabad North, Ahmedabad",2 Floors,,1 to 5 Year Old,,I have a house/villa available for sale in ena...,[],['Club house / Community Center'],,M68168346,


In [82]:
df.info()

<class 'pandas.core.frame.DataFrame'>
Index: 6579 entries, 0 to 7089
Data columns (total 21 columns):
 #   Column           Non-Null Count  Dtype  
---  ------           --------------  -----  
 0   property_name    6579 non-null   object 
 1   society          6579 non-null   object 
 2   price            6561 non-null   float64
 3   rate             2442 non-null   object 
 4   price_per_sqft   6569 non-null   object 
 5   areaWithType     6579 non-null   object 
 6   bedRoom          6579 non-null   int32  
 7   bathroom         6579 non-null   int32  
 8   balcony          6579 non-null   object 
 9   additionalRoom   6579 non-null   object 
 10  address          6546 non-null   object 
 11  noOfFloor        2381 non-null   object 
 12  facing           6579 non-null   object 
 13  agePossession    6579 non-null   object 
 14  nearbyLocations  5860 non-null   object 
 15  description      6579 non-null   object 
 16  furnishDetails   3838 non-null   object 
 17  features         49

In [83]:
df.shape

(6579, 21)

In [84]:
df.to_csv(out_path / 'flats_cleaned.csv',index=False)