# Real estate report - Selection and Frequency

In [21]:
import pandas as pd
# Load the real estate dataset; the explicit separator is needed because the
# file is semicolon-delimited rather than comma-delimited.
df_realestate = pd.read_csv(
    'data/aluguel.csv',
    sep=';',
)
# Preview the first five rows (the default size of head) to confirm the load.
df_realestate.head(5)

Unnamed: 0,Tipo,Bairro,Quartos,Vagas,Suites,Area,Valor,Condominio,IPTU
0,Quitinete,Copacabana,1,0,0,40,1700.0,500.0,60.0
1,Casa,Jardim Botânico,2,0,1,100,7000.0,,
2,Conjunto Comercial/Sala,Barra da Tijuca,0,4,0,150,5200.0,4020.0,1111.0
3,Apartamento,Centro,1,0,0,15,800.0,390.0,20.0
4,Apartamento,Higienópolis,1,0,0,48,800.0,230.0,


## 1. How many apartments are in the database?

In [7]:
# A boolean mask on the Tipo column keeps only the rows listed as "Apartamento".
df_apartment = df_realestate[df_realestate['Tipo'] == "Apartamento"]
# The row count of the filtered frame is the number of apartments.
print("There are {} apartments in the database".format(df_apartment.shape[0]))

There are 19532 apartments in the database


## 2. How many houses (Casa, Casa de Condomínio, Casa de Vila) are in the database?

In [11]:

# All three house variants are counted together: the `in` operator inside the
# query expression keeps rows whose Tipo matches any of the listed values.
df_casa = df_realestate.query(
    'Tipo in ("Casa", "Casa de Condomínio", "Casa de Vila")'
)
print("There are {} houses in the database".format(len(df_casa)))

There are 2212 houses in the database


In [16]:
# another approach for same selection: a boolean mask built with Series.isin,
# which is True for every row whose Tipo equals one of the listed house types
casa_selection = df_realestate['Tipo'].isin(["Casa", "Casa de Condomínio", "Casa de Vila"])
# index the frame with the mask to keep only the matching rows
df_casa = df_realestate.loc[casa_selection]
df_casa

Unnamed: 0,Tipo,Bairro,Quartos,Vagas,Suites,Area,Valor,Condominio,IPTU
1,Casa,Jardim Botânico,2,0,1,100,7000.0,,
7,Casa de Condomínio,Barra da Tijuca,5,4,5,750,22000.0,,
8,Casa de Condomínio,Ramos,2,2,0,65,1000.0,,
18,Casa de Condomínio,Taquara,3,1,1,115,2000.0,,
22,Casa de Condomínio,Barra da Tijuca,4,3,2,466,7500.0,2695.0,
31,Casa,Campo Grande,4,1,2,400,12000.0,,
59,Casa de Condomínio,Barra da Tijuca,5,10,5,1600,25000.0,1600.0,
74,Casa,Méier,2,0,0,51,1500.0,50.0,
82,Casa,São Conrado,4,2,4,730,28000.0,2000.0,12000.0
85,Casa de Condomínio,Freguesia (Jacarepaguá),5,3,1,140,2500.0,1200.0,


## 3. How many properties have an Area between 60 and 100 meters (inclusive)?

In [24]:
# Series.between includes both endpoints by default, so areas of exactly 60
# and exactly 100 are part of the selection.
area_selection = df_realestate['Area'].between(60, 100)
df_area = df_realestate.loc[area_selection]
print("There are {} real estate between 60 and 100 meters in the database".format(len(df_area)))

There are 10187 houses in the database


## 4. Show properties with 4 bedrooms and rent below 2000.00

In [22]:
# Both conditions must hold for a row to be kept, so the two element-wise
# comparisons are combined with `&` (each one parenthesised because `&` binds
# tighter than the comparison operators).
bed_and_price_selection = (
    (df_realestate['Valor'] < 2000)
    & (df_realestate['Quartos'] == 4)
)
df_bed_and_price = df_realestate.loc[bed_and_price_selection]
df_bed_and_price

Unnamed: 0,Tipo,Bairro,Quartos,Vagas,Suites,Area,Valor,Condominio,IPTU
701,Apartamento,Recreio dos Bandeirantes,4,2,2,160,1900.0,830.0,
1465,Apartamento,Taquara,4,1,1,110,1900.0,,
2874,Casa,Campo Grande,4,1,4,100,1600.0,,
3075,Casa,Engenho de Dentro,4,3,0,120,1500.0,,
3218,Apartamento,Recreio dos Bandeirantes,4,2,2,125,1700.0,,90.0
3419,Casa de Vila,Méier,4,0,1,85,1600.0,,
5849,Casa,Campo Grande,4,1,0,140,1700.0,,
5852,Apartamento,Campo Grande,4,2,1,115,1900.0,500.0,
6456,Apartamento,Recreio dos Bandeirantes,4,2,1,105,1900.0,1492.0,205.0
7520,Apartamento,Cidade Nova,4,0,0,110,1300.0,,


In [23]:
# renaming columns to english
# An explicit old-name -> new-name mapping is used instead of assigning a
# positional list to `.columns`: every English label stays tied to the column
# it translates regardless of column order, and `rename` returns a new frame
# rather than mutating the one displayed by the previous cell. Re-running this
# cell is harmless because labels missing from the frame are ignored by default.
df_bed_and_price = df_bed_and_price.rename(columns={
    "Tipo": "Type",
    "Bairro": "Location",
    "Quartos": "Bedrooms",
    "Vagas": "Parking spots",
    "Suites": "Suite",
    "Area": "Area",
    "Valor": "Rent",
    "Condominio": "Condo fee",
    "IPTU": "City fee",
})
df_bed_and_price

Unnamed: 0,Type,Location,Bedrooms,Parking spots,Suite,Area,Rent,Condo fee,City fee
701,Apartamento,Recreio dos Bandeirantes,4,2,2,160,1900.0,830.0,
1465,Apartamento,Taquara,4,1,1,110,1900.0,,
2874,Casa,Campo Grande,4,1,4,100,1600.0,,
3075,Casa,Engenho de Dentro,4,3,0,120,1500.0,,
3218,Apartamento,Recreio dos Bandeirantes,4,2,2,125,1700.0,,90.0
3419,Casa de Vila,Méier,4,0,1,85,1600.0,,
5849,Casa,Campo Grande,4,1,0,140,1700.0,,
5852,Apartamento,Campo Grande,4,2,1,115,1900.0,500.0,
6456,Apartamento,Recreio dos Bandeirantes,4,2,1,105,1900.0,1492.0,205.0
7520,Apartamento,Cidade Nova,4,0,0,110,1300.0,,
