In [1]:
# Dependencies and Setup
import pandas as pd
import numpy as np
import json
import requests

In [2]:
# Load the raw house-rent listings from CSV into a pandas DataFrame and preview the first rows
file_path = "Resources/House_Rent_Dataset.csv"
House_Rent_df = pd.read_csv(filepath_or_buffer=file_path)
House_Rent_df.head(5)

Unnamed: 0,Posted On,BHK,Rent,Size,Floor,Area Type,Area Locality,City,Furnishing Status,Tenant Preferred,Bathroom,Point of Contact
0,2022-05-18,2,10000,1100,Ground out of 2,Super Area,Bandel,Kolkata,Unfurnished,Bachelors/Family,2,Contact Owner
1,2022-05-13,2,20000,800,1 out of 3,Super Area,"Phool Bagan, Kankurgachi",Kolkata,Semi-Furnished,Bachelors/Family,1,Contact Owner
2,2022-05-16,2,17000,1000,1 out of 3,Super Area,Salt Lake City Sector 2,Kolkata,Semi-Furnished,Bachelors/Family,1,Contact Owner
3,2022-07-04,2,10000,800,1 out of 2,Super Area,Dumdum Park,Kolkata,Unfurnished,Bachelors/Family,1,Contact Owner
4,2022-05-09,2,7500,850,1 out of 2,Carpet Area,South Dum Dum,Kolkata,Unfurnished,Bachelors,1,Contact Owner


In [3]:
# Dimensions of the raw dataset as (rows, columns)
House_Rent_df.shape

(4746, 12)

In [4]:
# Features of the dataset: list the column labels of the raw DataFrame
House_Rent_df.columns

Index(['Posted On', 'BHK', 'Rent', 'Size', 'Floor', 'Area Type',
       'Area Locality', 'City', 'Furnishing Status', 'Tenant Preferred',
       'Bathroom', 'Point of Contact'],
      dtype='object')

In [5]:
# Check the data type pandas inferred for each column
House_Rent_df.dtypes

Posted On            object
BHK                   int64
Rent                  int64
Size                  int64
Floor                object
Area Type            object
Area Locality        object
City                 object
Furnishing Status    object
Tenant Preferred     object
Bathroom              int64
Point of Contact     object
dtype: object

In [6]:
# Number of missing (NaN/None) entries per column
House_Rent_df.isna().sum()

Posted On            0
BHK                  0
Rent                 0
Size                 0
Floor                0
Area Type            0
Area Locality        0
City                 0
Furnishing Status    0
Tenant Preferred     0
Bathroom             0
Point of Contact     0
dtype: int64

In [7]:
# Check for duplicate rows: count rows that exactly repeat an earlier row across all columns
House_Rent_df.duplicated().sum()

0

In [8]:
# Determine the number of distinct values in each column of the raw data.
House_Rent_df.nunique()

Posted On              81
BHK                     6
Rent                  243
Size                  615
Floor                 480
Area Type               3
Area Locality        2235
City                    6
Furnishing Status       3
Tenant Preferred        3
Bathroom                8
Point of Contact        3
dtype: int64

In [9]:
# Convert 'Posted On' from strings to datetime values so the .dt accessor
# (used below to extract the month name) is available
House_Rent_df['Posted On'] =  pd.to_datetime(House_Rent_df['Posted On'])

In [10]:
# Add new column 'posted_on' holding the month name (e.g. "May") of the posting date.
# Note: despite its name, this column stores a month name, not a date.
House_Rent_df['posted_on'] = House_Rent_df['Posted On'].dt.month_name()

In [11]:
# Split "Floor" (e.g. "1 out of 3", "Ground out of 2") at the first space only:
# the leading token becomes "floor_level", the remainder goes to "no_floors".
# `n` must be passed by keyword: positional use was deprecated in pandas 1.x and
# raises TypeError from pandas 2.0 onwards.
House_Rent_df[["floor_level", "no_floors"]] = House_Rent_df["Floor"].str.split(" ", n=1, expand=True)

In [12]:
## Using the city and rough address to find suburb data and adding to a new column

# Import API key
from api_keys import g_key

# Google Maps Geocoding endpoint (loop-invariant, so defined once)
base_url = "https://maps.googleapis.com/maps/api/geocode/json"

# Response statuses that indicate a problem with the key, the quota or the service
# itself rather than an address that cannot be resolved. Rows must NOT be dropped
# for these, otherwise a denied key would silently delete the whole dataset.
fatal_statuses = {"OVER_DAILY_LIMIT", "OVER_QUERY_LIMIT", "REQUEST_DENIED", "UNKNOWN_ERROR"}

# Add column for suburb
House_Rent_df["suburb"] = ""

# Cache of address -> suburb (None when no suburb was found). Many listings share
# the same locality/city pair, so each distinct address is requested only once.
suburb_by_address = {}

# Index labels of rows without suburb data; dropped after the loop so the frame
# is not mutated while it is being iterated.
rows_without_suburb = []

# Use the city and rough address to find suburb data
for index, row in House_Rent_df.iterrows():

    target_city = f'{row["Area Locality"]},{row["City"]}'

    if target_city not in suburb_by_address:
        # params dictionary
        params = {"address": target_city, "key": g_key}

        # Run request (with a timeout so a stalled connection cannot hang the notebook)
        results = requests.get(base_url, params=params, timeout=30).json()

        status = results.get("status")
        if status in fatal_statuses:
            raise RuntimeError(
                f"Geocoding request for '{target_city}' failed with status {status}: "
                f"{results.get('error_message', 'no error message returned')}"
            )

        # Since some data may be missing we use a try-except to detect addresses
        # for which no usable result came back.
        # NOTE(review): the first address component is the most specific one returned
        # and is not guaranteed to be a suburb -- confirm this is the intended field.
        try:
            suburb_by_address[target_city] = results["results"][0]['address_components'][0]['short_name']
        except (KeyError, IndexError):
            suburb_by_address[target_city] = None

    suburb = suburb_by_address[target_city]

    if suburb is None:
        print(f"Suburb data not found. Skipping id. {target_city}....")

        # Mark row for removal since no data was found
        rows_without_suburb.append(index)
    else:
        # Adding collected data to House_Rent_df
        House_Rent_df.loc[index, "suburb"] = suburb

        print(f"data on. {target_city} found")

# Remove rows for which no suburb data was found
House_Rent_df.drop(rows_without_suburb, inplace=True)
    

data on. Bandel,Kolkata found
data on. Phool Bagan, Kankurgachi,Kolkata found
data on. Salt Lake City Sector 2,Kolkata found
data on. Dumdum Park,Kolkata found
data on. South Dum Dum,Kolkata found
data on. Thakurpukur,Kolkata found
data on. Malancha,Kolkata found
data on. Malancha,Kolkata found
data on. Palm Avenue Kolkata, Ballygunge,Kolkata found
data on. Natunhat,Kolkata found
data on. Action Area 1, Rajarhat Newtown,Kolkata found
data on. Keshtopur,Kolkata found
data on. Tarulia, Keshtopur,Kolkata found
data on. Dum Dum Metro,Kolkata found
data on. Paschim Barisha,Kolkata found
data on. New Town Action Area 1,Kolkata found
data on. Barasat,Kolkata found
data on. Behala,Kolkata found
data on. Behala Chowrasta,Kolkata found
data on. Behala,Kolkata found
data on. Santoshpur,Kolkata found
data on. Garia Station, Garia,Kolkata found
data on. Garia Station, Garia,Kolkata found
data on. Joka,Kolkata found
data on. Sreebhumi,Kolkata found
data on. Rajarhat,Kolkata found
data on. Dum Dum,Ko

data on. Salt Lake City Sector 2,Kolkata found
data on. locality,Kolkata found
data on. Khardah,Kolkata found
data on. Parnasree Pally,Kolkata found
data on. Baghajatin,Kolkata found
data on. Salt Lake City Sector 3,Kolkata found
data on. sarsuna banerjee para,Kolkata found
data on. Salt Lake City Sector 3,Kolkata found
data on. Near Seven Tanks Road Dumdum Station,Kolkata found
data on. Jyangra,Kolkata found
data on. Barasat,Kolkata found
data on. Sukchar,Kolkata found
data on. Tagore Park, Kasba,Kolkata found
data on. Barrackpore,Kolkata found
data on. Silpara, Purba Barisha,Kolkata found
data on. Konnagar,Kolkata found
data on. Madhyam Gram,Kolkata found
data on. Kudghat, Ashok Nagar,Kolkata found
data on. Salt Lake City Sector 5,Kolkata found
data on. Salt Lake City Sector 3,Kolkata found
data on. Dum Dum Cantonment,Kolkata found
data on. Kasba,Kolkata found
data on. Salt Lake City,Kolkata found
data on. Lake Gardens,Kolkata found
data on. Silpara, Purba Barisha,Kolkata found
data 

data on. Salt Lake City Sector 5,Kolkata found
data on. Dum Dum,Kolkata found
data on. Airport Area Behala,Kolkata found
data on. Sonarpur,Kolkata found
data on. Picnic Garden, E M Bypass,Kolkata found
data on. Bisharpara,Kolkata found
data on. Bisharpara,Kolkata found
data on. Nayabad,Kolkata found
data on. Ananda Pally, Jadavpur,Kolkata found
data on. Salt Lake City Sector 2,Kolkata found
data on. Behala,Kolkata found
data on. Airport Area,Kolkata found
data on. Salt Lake City Sector 2,Kolkata found
data on. Barrackpore,Kolkata found
data on. Ranikuthi Telephone Exchange,Kolkata found
data on. Hooghly-Chinsurah,Kolkata found
data on. Bansdroni Mauza, Krishnanagar,Kolkata found
data on. Kaikhali,Kolkata found
data on. 700051,Kolkata found
data on. Jodhpur Park,Kolkata found
data on. Purba Sinthi Area,Kolkata found
data on. Kadam Tala,Kolkata found
data on. Baidyabati,Kolkata found
data on. Bansdroni,Kolkata found
data on. Sodepur,Kolkata found
data on. Jagacha,Kolkata found
data on. N

data on. Malad East,Mumbai found
data on. Juhu Tara,Mumbai found
data on. Mindspace, Mindspace,Mumbai found
data on. Oberoi Esquire, Goregaon East,Mumbai found
data on. Oberoi Woods, Goregaon East,Mumbai found
data on. Vertical Bliss, Bandra West,Mumbai found
data on. Sher E Punjab Society,Mumbai found
data on. Oshiwara,Mumbai found
data on. Nirmal Lifestyle, LBS Marg,Mumbai found
data on. Lokhandwala Complex,Mumbai found
data on. Chembur,Mumbai found
data on. Tilak Nagar - Harbour Line,Mumbai found
data on. GREEN PARK,Mumbai found
data on. Lodha Ajuro tower lalbag,Mumbai found
data on. Lake Bloom, Powai,Mumbai found
data on. Kalina,Mumbai found
data on. Bhakti Park, Bhakti Park,Mumbai found
data on. Bombay Dyeing Two ICC, Dadar East,Mumbai found
data on. Santacruz West,Mumbai found
data on. MUKTA MAHEK, Thakur Complex,Mumbai found
data on. Kanakia Rainforest, Marol,Mumbai found
data on. Bandra West,Mumbai found
data on. Vile Parle West,Mumbai found
data on. Dheeraj Swapna Apartment, P

data on. Bandra West,Mumbai found
data on. Llyod Estate, Wadala,Mumbai found
data on. Lokhandwala Complex,Mumbai found
data on. Sunglow, Chandivali,Mumbai found
data on. Mahim West,Mumbai found
data on. Parle Colony,Mumbai found
data on. Andheri East,Mumbai found
data on. Chembur,Mumbai found
data on. Godrej Platinum, Vikhroli East,Mumbai found
data on. Chembur East,Mumbai found
data on. Raheja Heights Phase 2, Gokuldham,Mumbai found
data on. Sakhi, Kandivali West,Mumbai found
data on. Raheja Artesia, Worli,Mumbai found
data on. Rustomjee Regency, Gomant Nagar,Mumbai found
data on. Santacruz East,Mumbai found
data on. Vikas Finalay Apartments, Parel,Mumbai found
data on. Bhandup West,Mumbai found
data on. anjali,Mumbai found
data on. Runwal Greens, Mulund West,Mumbai found
data on. Best Nagar Goregaon West,Mumbai found
data on. Hiranandani Gardens Torino, Hiranandani Gardens,Mumbai found
data on. Chembur,Mumbai found
data on. Riddhi Garden, Film City Road,Mumbai found
data on. Dahisar 

data on. Chandivali,Mumbai found
data on. Juhu,Mumbai found
data on. Kandivali West,Mumbai found
data on. DLH Orchid, Lokhandwala Complex,Mumbai found
data on. Godrej Serenity Mumbai, Chembur,Mumbai found
data on. Transcon Triumph, Lokhandwala Complex,Mumbai found
data on. Chakala Cigarette Factory,Mumbai found
data on. Green Gate Apartment, Pali Hill,Mumbai found
data on. Kanjurmarg East,Mumbai found
data on. Model Town,Mumbai found
data on. Bandra West,Mumbai found
data on. Lake Primrose, Powai,Mumbai found
data on. Alta Monte, Pathanwadi,Mumbai found
data on. Dreams Complex, Bhandup West,Mumbai found
data on. NG Royal Park, Kanjurmarg East,Mumbai found
data on. Mukund Nagar,Mumbai found
data on. Ajmera Bhakti Park, Bhakti Park,Mumbai found
data on. Sindhi Society Chembur,Mumbai found
data on. Goregaon West,Mumbai found
data on. Chaitanya Towers, Prabhadevi,Mumbai found
data on. Bandra West,Mumbai found
data on. Parel,Mumbai found
data on. 7 Bungalow, Seven Bungalows,Mumbai found
dat

data on. Lodha Bellissimo, Mahalakshmi,Mumbai found
data on. simla house at nepeasea road, Napean Sea Road,Mumbai found
data on. Altavista, Chembur,Mumbai found
data on. Hubtown Gardenia, Mira Road,Mumbai found
data on. Andheri East,Mumbai found
data on. Promenade At The Address, Ghatkopar West,Mumbai found
data on. Vile Parle West,Mumbai found
data on. Khar West,Mumbai found
data on. Gaurav Excellency, Mira Road,Mumbai found
data on. Kanakia Paris, Bandra Kurla Complex,Mumbai found
data on. Salvation CHS, Dadar West,Mumbai found
data on. Hiranandani Gardens,Mumbai found
data on. Sanjona Gulmarg Towers, Chembur East,Mumbai found
data on. Bandra West,Mumbai found
data on. New Devchhaya Building,Mumbai found
data on. Goregaon West,Mumbai found
data on. Bandra West,Mumbai found
data on. Andheri East,Mumbai found
data on. Devi Pada,Mumbai found
data on. Lodha The Park, Worli,Mumbai found
data on. The Windsor, Kandivali East,Mumbai found
data on. Manavsthal, Andheri East,Mumbai found
data o

data on. Indraprastha CHS, Bhayandar East,Mumbai found
data on. Oberoi Splendor Grande, Agarkar Chowk,Mumbai found
data on. Spring Leaf, Lokhandwala Twp,Mumbai found
data on. Malad West,Mumbai found
data on. Khar West,Mumbai found
data on. Romell Aether, Goregaon East,Mumbai found
data on. Godrej The Trees, Vikhroli East,Mumbai found
data on. Borivali East,Mumbai found
data on. Mahajan Wadi,Mumbai found
data on. Film City,Mumbai found
data on. Lakshchandi Height, Goregaon East,Mumbai found
data on. Challenger Tower, Thakur Village, Kandivali East,Mumbai found
data on. Bhoomi Elegant, Thakur Complex,Mumbai found
data on. Adani Western Heights, Andheri West,Mumbai found
data on. Chandivali,Mumbai found
data on. Worli,Mumbai found
data on. Galassia, Kandarpada,Mumbai found
data on. Charkop,Mumbai found
data on. diamond garden, Chembur,Mumbai found
data on. Bandra West,Mumbai found
data on. Kalpataru Crest, Bhandup West,Mumbai found
data on. Hiranandani Castle Rock, Powai,Mumbai found
data

data on. Banaswadi,Bangalore found
data on. Kalasipalyam, Kalasipalyam,Bangalore found
data on. Tilak Nagar, Jayanagar, bannerghatta main Road,Bangalore found
data on. K R Puram,Bangalore found
data on. Electronic City,Bangalore found
data on. Sarjapur Road,Bangalore found
data on. whitefield,Bangalore found
data on. Nagondanahalli,Bangalore found
data on. Isro Layout, Kumaraswamy Layout,Bangalore found
data on. Banashankari,Bangalore found
data on. JAR Shikara,Bangalore found
data on. Medahalli,Bangalore found
data on. Electronic City Phase 2, Electronic City,Bangalore found
data on. Ramamurthy Nagar,Bangalore found
data on. Byatarayanapura,Bangalore found
data on. Udayanagar Extension, Mahadevapura,Bangalore found
data on. Dwarka Nagar, Kattigenahalli,Bangalore found
data on. Btm Layout,Bangalore found
data on. Jeevan Bima Nagar, Airport Road,Bangalore found
data on. Jaya Nagar Block 7, Jayanagar,Bangalore found
data on. Chamrajpet,Bangalore found
data on. Hosa Road, off Hosur Road,B

data on. Attibele,Bangalore found
data on. Devinagar, Outer Ring Road,Bangalore found
data on. Electronic City,Bangalore found
data on. Jp Nagar Phase 7, J P Nagar,Bangalore found
data on. Fci Layout, Deepanjali Nagar,Bangalore found
data on. Mathikere,Bangalore found
data on. Ombr Layout, Banaswadi,Bangalore found
data on. Sinthan Nagar, Thanisandra,Bangalore found
data on. Kengeri Hobli,Bangalore found
data on. Kodichikkanahalli Main Road,Bangalore found
data on. Mangammanapalya, Hosur Road,Bangalore found
data on. Uttarahalli,Bangalore found
data on. Malleshwaram,Bangalore found
data on. Immadihalli, Whitefield,Bangalore found
data on. Bydara Halli, Benson Town,Bangalore found
data on. Yelahanka,Bangalore found
data on. Electronic City,Bangalore found
data on. Jp Nagar Phase 7, J P Nagar,Bangalore found
data on. Chikkana Layout, Kammanahalli,Bangalore found
data on. Langford Town, Shanti Nagar, Hosur Road,Bangalore found
data on. Jaya Nagar Block 5, Jayanagar,Bangalore found
data on

data on. Jp Nagar Phase 5, J P Nagar, Outer Ring Road,Bangalore found
data on. Rayasandra,Bangalore found
data on. Shampura, Kaval Byrasandra,Bangalore found
data on. Bommasandra,Bangalore found
data on. Rajajinagar,Bangalore found
data on. Choodasandra,Bangalore found
data on. Arakere,Bangalore found
data on. New Thippasandra,Bangalore found
data on. Battarahalli,Bangalore found
data on. A Narayanapura, Mahadevapura,Bangalore found
data on. Banashankari,Bangalore found
data on. New Bel Road,Bangalore found
data on. Gunjur,Bangalore found
data on. Anantapura,Bangalore found
data on. Hulimavu,Bangalore found
data on. Ombr Layout, Banaswadi,Bangalore found
data on. Hongasandra,Bangalore found
data on. Chamrajpet,Bangalore found
data on. Sahakara Nagar,Bangalore found
data on. K R Puram,Bangalore found
data on. Mathikere,Bangalore found
data on. Kanakapura Road,Bangalore found
data on. Jp Nagar Phase 7, J P Nagar,Bangalore found
data on. Hebbal,Bangalore found
data on. Adugodi,Bangalore f

data on. Murugeshpalya, Airport Road,Bangalore found
data on. Electronics City Phase 1, Electronic City,Bangalore found
data on. Bilal Nagar-Sagayapura,Bangalore found
data on. Lakshmipura,Bangalore found
data on. Btm Layout,Bangalore found
data on. Mathikere,Bangalore found
data on. Kudlu Gate,Bangalore found
data on. Nagarbhavi,Bangalore found
data on. Attibele,Bangalore found
data on. Yelahanka,Bangalore found
data on. Hrbr Layout Block 2, Kalyan Nagar, Outer Ring Road,Bangalore found
data on. C V Raman Nagar,Bangalore found
data on. Kengeri,Bangalore found
data on. Rayasandra,Bangalore found
data on. C V Raman Nagar,Bangalore found
data on. Basaveshvara Nagar,Bangalore found
data on. Hulimavu,Bangalore found
data on. snv la,Bangalore found
data on. Rmv Extension, Armane Nagar,Bangalore found
data on. Ittamadu, Banashankari, Outer Ring Road,Bangalore found
data on. Kengeri Upanagara,Bangalore found
data on. Koramangala,Bangalore found
data on. K R Puram,Bangalore found
data on. Basa

data on. Vijayanagar,Bangalore found
data on. T Dasarahalli,Bangalore found
data on. Mahadevapura,Bangalore found
data on. Electronics City Phase 1, Electronic City,Bangalore found
data on. Btm Layout,Bangalore found
data on. Vinayak Nagar, Kattigenahalli,Bangalore found
data on. Ganga Nagar,Bangalore found
data on. Electronic City Phase 2, Electronic City,Bangalore found
data on. Banashankari,Bangalore found
data on. Gh society,Bangalore found
data on. Vijayanagar,Bangalore found
data on. Wilson Garden,Bangalore found
data on. Electronic City,Bangalore found
data on. Koramangala,Bangalore found
data on. Hebbal,Bangalore found
data on. Dooravani Nagar, Dooravani Nagar,Bangalore found
data on. Murugeshpalya, Airport Road,Bangalore found
data on. Srinivasa Nagar-Banashankari, Banashankari,Bangalore found
data on. Uttarahalli,Bangalore found
data on. Yelahanka,Bangalore found
data on. Hbr Layout,Bangalore found
data on. Cunningham Road,Bangalore found
data on. Mahadevapura,Bangalore found

data on. Kalkaji,Delhi found
data on. Mehrauli,Delhi found
data on. Rangpuri,Delhi found
data on. Lajpat Nagar 1,Delhi found
data on. RWA triveni residents,Delhi found
data on. Dwarka Mor,Delhi found
data on. kst chattarpur Apartments,Delhi found
data on. Laxmi Nagar,Delhi found
data on. Kapi Bagan Basti,Delhi found
data on. Paryavaran Complex, Sainik Farm,Delhi found
data on. Aya Nagar,Delhi found
data on. Mukherjee Nagar,Delhi found
data on. Mehrauli,Delhi found
data on. Khanpur Extension, Sangam Vihar,Delhi found
data on. Sagar Pur,Delhi found
data on. Hastsal,Delhi found
data on. Kamla Nagar,Delhi found
data on. kst chattarpur Apartments,Delhi found
data on. Kamla Nagar,Delhi found
data on. Lajpat Nagar,Delhi found
data on. Saket,Delhi found
data on. Dwarka Mor,Delhi found
data on. Rajouri Garden,Delhi found
data on. Lajpat Nagar 4,Delhi found
data on. Prem Nagar, Patel Nagar,Delhi found
data on. Shadipur,Delhi found
data on. Krishna Nagar Block D,Delhi found
data on. Nawada,Delhi 

data on. Paschim Vihar,Delhi found
data on. Saket,Delhi found
data on. Pandav Nagar,Delhi found
data on. East Of Kailash,Delhi found
data on. Mayur Vihar Phase 1 Extension,Delhi found
data on. Najafgarh,Delhi found
data on. Vinod Nagar East,Delhi found
data on. kst chattarpur Apartments,Delhi found
data on. Ramesh Nagar,Delhi found
data on. Gautam Nagar,Delhi found
data on. Delhi estate Apartment,Delhi found
data on. Mahipalpur,Delhi found
data on. Dori Walan,Delhi found
data on. DS 19,Delhi found
data on. Defence Colony,Delhi found
data on. New Mahavir Nagar, Tilak Nagar,Delhi found
data on. north chajjupur shahdara,Delhi found
data on. Mahavir Enclave Part 1,Delhi found
data on. Janakpuri,Delhi found
data on. Burari,Delhi found
data on. Mehrauli,Delhi found
data on. Khanpur, Madangir,Delhi found
data on. Rohini Sector 11,Delhi found
data on. Chhattarpur,Delhi found
data on. Vasant Kunj,Delhi found
data on. Gaurav Apartment, Indraprastha Extension, Patparganj,Delhi found
data on. Mehr

data on. Pandav Nagar,Delhi found
data on. Pitampura,Delhi found
data on. Saket,Delhi found
data on. Safdarjung Enclave,Delhi found
data on. Greater Kailash 1,Delhi found
data on. Chhattarpur,Delhi found
data on. Chhattarpur,Delhi found
data on. Chhattarpur,Delhi found
data on. Chhattarpur,Delhi found
data on. Mayur Vihar Phase 1 Extension,Delhi found
data on. Kalkaji,Delhi found
data on. Neb Sarai,Delhi found
data on. Safdarjung Enclave,Delhi found
data on. Maharani Bagh, New Friends Colony,Delhi found
data on. Shalimar bagh,Delhi found
data on. Sarvodaya Enclave,Delhi found
data on. B-7 veer Singh colony Budh vihar phase 2 delhi,Delhi found
data on. Mahavir Enclave Part 3,Delhi found
data on. Dwarka Sector 5,Delhi found
data on. Vasant Kunj,Delhi found
data on. Pusa Institutional Area,Delhi found
data on. Raj Nagar 2,Delhi found
data on. Sarojini Nagar,Delhi found
data on. Lajpat Nagar,Delhi found
data on. Mayur Vihar 1,Delhi found
data on. Arjun Garh, Aya Nagar,Delhi found
data on. 

data on. Medavakkam,Chennai found
data on. Thiruporur,Chennai found
data on. Old Washermanpet,Chennai found
data on. Kazhipattur,Chennai found
data on. Gopalapuram,Chennai found
data on. Thanikachalam Nagar, Ponniammanmedu,Chennai found
data on. Kapaleeswarar Nagar, Neelankarai, E Coast Road,Chennai found
data on. Navalur,Chennai found
data on. Padur, Old Mahabalipuram Road,Chennai found
data on. Valasaravakkam, Arcot Road,Chennai found
data on. Anakaputhur,Chennai found
data on. Pudupakkam,Chennai found
data on. Ashok Nagar,Chennai found
data on. Perungalathur, Chennai Bypass Road,Chennai found
data on. Anna Nagar-Pammal,Chennai found
data on. Aminjikarai, PH Road,Chennai found
data on. Mannivakkam,Chennai found
data on. Kovilambakkam,Chennai found
data on. Teynampet,Chennai found
data on. Velachery,Chennai found
data on. Madras Boat Club Road,Chennai found
data on. R.A Puram, Mandaiveli,Chennai found
data on. AGS Colony-Velachery,Chennai found
data on. Tiruvallur, Kakkalur, Chennai,C

data on. Ayappakkam,Chennai found
data on. Chromepet, GST Road,Chennai found
data on. Arumbakkam,Chennai found
data on. Kasi Estate,Chennai found
data on. Elango Nagar-Virugambakkam,Chennai found
data on. Tondiarpet, Ennore High Road,Chennai found
data on. Perungalathur, Chennai Bypass Road,Chennai found
data on. Kodungaiyur West,Chennai found
data on. Nandanam Extension,Chennai found
data on. Mugalivakkam,Chennai found
data on. Triplicane,Chennai found
data on. Korattur, Jawaharlal Nehru Road,Chennai found
data on. Lanchor Abode valley,Chennai found
data on. Nesapakkam,Chennai found
data on. Urapakkam, Vandalur R.F, GST Road,Chennai found
data on. Baby Nagar Extention, Velachery,Chennai found
data on. Mogappair East,Chennai found
data on. Ambattur,Chennai found
data on. Padur, Old Mahabalipuram Road,Chennai found
data on. Mambalam West,Chennai found
data on. Iyyappanthangal,Chennai found
data on. Iyyappanthangal,Chennai found
data on. Porur,Chennai found
data on. Pammal,Chennai found


data on. Sriperumbudur,Chennai found
data on. Pudupakkam,Chennai found
data on. Thoraipakkam,Chennai found
data on. Ambattur,Chennai found
data on. Poonamallee,Chennai found
data on. Washermanpet,Chennai found
data on. Kattupakkam, PH Road,Chennai found
data on. Chitlapakkam,Chennai found
data on. Ashok Nagar,Chennai found
data on. Thiruneermalai,Chennai found
data on. Padur, Old Mahabalipuram Road,Chennai found
data on. Besant Nagar,Chennai found
data on. Ambattur,Chennai found
data on. Old Mahabalipuram Road,Chennai found
data on. R.A Puram, Mandaiveli,Chennai found
data on. Ambattur,Chennai found
data on. Mogappair East,Chennai found
data on. Choolaimedu,Chennai found
data on. MRC Nagar,Chennai found
data on. Sholinganallur,Chennai found
data on. Perungalathur, Chennai Bypass Road,Chennai found
data on. Anakaputhur,Chennai found
data on. Valasaravakkam, Arcot Road,Chennai found
data on. Kovilambakkam,Chennai found
data on. Poonamallee,Chennai found
data on. Urapakkam, Vandalur R.F, 

data on. Madambakkam,Chennai found
data on. Kodambakkam,Chennai found
data on. Kuthanur,Chennai found
data on. Mogappair West,Chennai found
data on. Sholinganallur,Chennai found
data on. Iyyappanthangal,Chennai found
data on. Vadapalani,Chennai found
data on. Kodungaiyur East,Chennai found
data on. Tambaram, GST Road,Chennai found
data on. Nanmangalam,Chennai found
data on. Madipakkam,Chennai found
data on. Sholinganallur,Chennai found
data on. Nandanam,Chennai found
data on. Nemilichery, Chromepet,Chennai found
data on. Bharathidasan Colony, KK Nagar,Chennai found
data on. Mambalam West,Chennai found
data on. Iyyappanthangal,Chennai found
data on. Mylapore,Chennai found
data on. Mugalivakkam,Chennai found
data on. Vadapalani,Chennai found
data on. Kayarambedu,Chennai found
data on. Chromepet, GST Road,Chennai found
data on. Purasaiwakkam,Chennai found
data on. Vadapalani,Chennai found
data on. Padapai,Chennai found
data on. Guindy Race Course, Guindy,Chennai found
data on. Mannivakkam

data on. Buddha Nagar Colony, Boduppal,Hyderabad found
data on. Banjara Hills, NH 9,Hyderabad found
data on. Amberpet,Hyderabad found
data on. KTR Colony,Hyderabad found
data on. Narayanguda,Hyderabad found
data on. Alwal,Hyderabad found
data on. Upparpally, Hyderabad Expressway,Hyderabad found
data on. Nizampet,Hyderabad found
data on. Bollaram, Outer Ring Road,Hyderabad found
data on. Nallagandla, Serilingampally,Hyderabad found
data on. in Syed Ali Guda,Hyderabad found
data on. Mallepally, NH 7,Hyderabad found
data on. ECIL,Hyderabad found
data on. Patrika Nagar, Hitech City,Hyderabad found
data on. Ramanthapur, NH 2 2,Hyderabad found
data on. Chanda Nagar,Hyderabad found
data on. Himayath Nagar, NH 7,Hyderabad found
data on. Seri Lingampally,Hyderabad found
data on. Nallagandla, Serilingampally,Hyderabad found
data on. Himayath Nagar, NH 7,Hyderabad found
data on. Himayath Nagar, NH 7,Hyderabad found
data on. Chandrayanguttabalguda,Hyderabad found
data on. Sanath Nagar, NH 9,Hydera

data on. Amberpet,Hyderabad found
data on. Toli Chowki,Hyderabad found
data on. Kondapur,Hyderabad found
data on. Ghatkesar, NH 2 2,Hyderabad found
data on. Prashanth hills,Hyderabad found
data on. Kachiguda, NH 2 2,Hyderabad found
data on. Sri BALAJI CLASSIC BHAVANI NAGAR RD NO 5,Hyderabad found
data on. Khairatabad, NH 7,Hyderabad found
data on. Ashok Nagar, Himayath Nagar,Hyderabad found
data on. Kondapur,Hyderabad found
data on. Banjara Hills, NH 9,Hyderabad found
data on. Gachibowli,Hyderabad found
data on. Gachibowli,Hyderabad found
data on. Safilguda, Secunderabad,Hyderabad found
data on. BHEL,Hyderabad found
data on. Nawab Saheb Kunta,Hyderabad found
data on. Kondapur,Hyderabad found
data on. Quthbullapur, NH 7,Hyderabad found
data on. Nizampet,Hyderabad found
data on. Subhash Nagar, Secunderabad,Hyderabad found
data on. MLA Colony, Banjara Hills,Hyderabad found
data on. Narsingi, Outer Ring Road,Hyderabad found
data on. Hayathnagar, NH 9,Hyderabad found
data on. Mehdipatnam,Hy

data on. Dammaiguda,Hyderabad found
data on. Habsiguda, NH 2 2,Hyderabad found
data on. Gachibowli,Hyderabad found
data on. Miyapur, NH 9,Hyderabad found
data on. Uppal, NH 2 2,Hyderabad found
data on. Hayathnagar, NH 9,Hyderabad found
data on. Attapur,Hyderabad found
data on. Bandlaguda Jagir,Hyderabad found
data on. Amberpet,Hyderabad found
data on. RTC Cross Road,Hyderabad found
data on. Himayath Nagar, NH 7,Hyderabad found
data on. Manikonda, Outer Ring Road,Hyderabad found
data on. Kothapet,Hyderabad found
data on. Anand Nagar-Khairatabad, NH 7,Hyderabad found
data on. Kondapur,Hyderabad found
data on. Kapra,Hyderabad found
data on. Chanda Nagar,Hyderabad found
data on. Rock Town Colony,Hyderabad found
data on. Hayathnagar, NH 9,Hyderabad found
data on. Boduppal, NH 2 2,Hyderabad found
data on. Attapur,Hyderabad found
data on. Medipally,Hyderabad found
data on. Pragathi Nagar, Kukatpally,Hyderabad found
data on. Meerpet,Hyderabad found
data on. Anand Nagar-Khairatabad, NH 7,Hydera

data on. Yeshwanthpur,Hyderabad found
data on. Rajendra Nagar, Outer Ring Road,Hyderabad found
data on. Financial District, Nanakram Guda,Hyderabad found
data on. Gachibowli,Hyderabad found
data on. Yousufguda, NH 9,Hyderabad found
data on. Deepthisri nagar colony,Hyderabad found
data on. Rampally,Hyderabad found
data on. Pocharam, NH 2 2,Hyderabad found
data on. Quthbullapur, NH 7,Hyderabad found
data on. Old Bowenpally,Hyderabad found
data on. Kapra,Hyderabad found
data on. Financial District, Nanakram Guda,Hyderabad found
data on. Adikmet,Hyderabad found
data on. Shaikpet,Hyderabad found
data on. Kondapur,Hyderabad found
data on. Kondapur,Hyderabad found
data on. K P H B Phase 4,Hyderabad found
data on. Nallagandla, Serilingampally,Hyderabad found
data on. Madhapur,Hyderabad found
data on. Madhapur,Hyderabad found
data on. Balanagar,Hyderabad found
data on. Dwarakapuri, Punjagutta, NH 9,Hyderabad found
data on. Khairatabad, NH 7,Hyderabad found
data on. Old Nallakunta,Hyderabad foun

data on. Uppal, NH 2 2,Hyderabad found
data on. Madhapur,Hyderabad found
data on. Sainikpuri,Hyderabad found
data on. Nagole,Hyderabad found
data on. BHEL,Hyderabad found
data on. Netaji Nagar Colony, Langar Houz,Hyderabad found
data on. Jagadgiri Gutta,Hyderabad found
data on. Hyderguda,Hyderabad found
data on. Bolarum, Medchal Road,Hyderabad found
data on. Nallagandla, Serilingampally,Hyderabad found
data on. Basheer Bagh, NH 7,Hyderabad found
data on. Basheer Bagh, NH 7,Hyderabad found
data on. Jubilee Hills,Hyderabad found
data on. K P H B Phase 9,Hyderabad found
data on. Saket, Secunderabad,Hyderabad found
data on. Suraram,Hyderabad found
data on. Manikonda, Outer Ring Road,Hyderabad found
data on. Vinayaka Nagar,Hyderabad found
data on. BN Reddy Nagar,Hyderabad found
data on. Miyapur, NH 9,Hyderabad found
data on. Raj Bhawan Road,Hyderabad found
data on. Almasguda,Hyderabad found
data on. Almasguda,Hyderabad found
data on. Godavari Homes, Quthbullapur,Hyderabad found
data on. Gac

In [13]:
# Discard the source columns that have been replaced by derived ones
# (posting date, raw floor text, total-floors remainder, free-text locality)
House_Rent_df = House_Rent_df.drop(columns=['Posted On', 'Floor', "no_floors", "Area Locality"])

In [14]:
# Reset index to a fresh 0..n-1 range (old labels discarded): rows without suburb
# data were dropped above, and the 'id' column created below is derived from the index
House_Rent_df = House_Rent_df.reset_index(drop=True)

In [15]:
# Switch the remaining original headers to snake_case, then normalise the
# placeholder values '-' and 'I/D' to the string '0'
House_Rent_df = (
    House_Rent_df
    .rename(
        columns={
            "BHK": "bhk",
            "Rent": "rent",
            "Size": "size",
            "Area Type": "area_type",
            "City": "city",
            "Furnishing Status": "furnishing_status",
            "Tenant Preferred": "tenant_preferred",
            "Bathroom": "bathroom",
            "Point of Contact": "point_of_contact",
        }
    )
    .replace(['-', 'I/D'], '0')
)

In [16]:
# Add new column 'id' for each row, computed as the row's index label plus one
# (1-based when the index has just been reset to 0..n-1)
House_Rent_df['id'] = House_Rent_df.index+1

In [17]:
# Display the first rows of the transformed DataFrame
House_Rent_df.head()

Unnamed: 0,bhk,rent,size,area_type,city,furnishing_status,tenant_preferred,bathroom,point_of_contact,posted_on,floor_level,suburb,id
0,2,10000,1100,Super Area,Kolkata,Unfurnished,Bachelors/Family,2,Contact Owner,May,Ground,Bandel,1
1,2,20000,800,Super Area,Kolkata,Semi-Furnished,Bachelors/Family,1,Contact Owner,May,1,Kankurgachi,2
2,2,17000,1000,Super Area,Kolkata,Semi-Furnished,Bachelors/Family,1,Contact Owner,May,1,Sector II,3
3,2,10000,800,Super Area,Kolkata,Unfurnished,Bachelors/Family,1,Contact Owner,July,1,Dum Dum Park,4
4,2,7500,850,Carpet Area,Kolkata,Unfurnished,Bachelors,1,Contact Owner,May,1,South Dumdum,5


In [18]:
# Determine the number of distinct values in each column after the transformations.
House_Rent_df.nunique()

bhk                     6
rent                  243
size                  614
area_type               3
city                    6
furnishing_status       3
tenant_preferred        3
bathroom                8
point_of_contact        3
posted_on               4
floor_level            54
suburb               1851
id                   4739
dtype: int64

In [21]:
# Number of listings (non-null ids) per suburb
rental_grouped = House_Rent_df.groupby("suburb")["id"].count()

# Suburbs that appear on exactly one listing. This list is used to remove those
# listings from the data to ensure one-off suburbs do not skew the results.
to_drop = rental_grouped[rental_grouped.eq(1)].index.tolist()

# Display number of suburbs with only 1 property listed
len(to_drop)

1113

In [23]:
# Keep only the listings whose suburb is NOT in the single-listing list
cleaned_House_Rent_df = House_Rent_df.loc[~House_Rent_df['suburb'].isin(to_drop)]
cleaned_House_Rent_df.shape

(3626, 13)

In [24]:
# Renumber the filtered rows from 0 and regenerate 'id' as index + 1 so the ids
# are consecutive again after the single-listing suburbs were removed
cleaned_House_Rent_df = (
    cleaned_House_Rent_df
    .reset_index(drop=True)
    .assign(id=lambda frame: frame.index + 1)
)

In [25]:
# Determine the number of distinct values in each column of the cleaned data.
cleaned_House_Rent_df.nunique()

bhk                     6
rent                  222
size                  531
area_type               3
city                    6
furnishing_status       3
tenant_preferred        3
bathroom                8
point_of_contact        3
posted_on               4
floor_level            51
suburb                738
id                   3626
dtype: int64

In [26]:
# Write the cleaned result to Resources/transformed.csv, omitting the index column
cleaned_House_Rent_df.to_csv(path_or_buf='Resources/transformed.csv', index=False)