# San Francisco Rental Prices Dashboard

In this notebook, you will compile the visualizations from the previous analysis into functions that can be used for a Panel dashboard.

In [130]:
# imports
import panel as pn
pn.extension('plotly')
import plotly.express as px
import pandas as pd
import hvplot.pandas
import matplotlib.pyplot as plt
import os
import numpy as np
from pathlib import Path
from dotenv import load_dotenv

In [131]:
# Read the Mapbox API key
load_dotenv()
map_box_api = os.getenv("mapbox")
px.set_mapbox_access_token(map_box_api)

# Import Data

In [132]:
# Import the necessary CSVs to Pandas DataFrames
file_path = Path("Data/sfo_neighborhoods_census_data.csv")
sfo_data = pd.read_csv(file_path, index_col="year")
sfo_data.head()

Unnamed: 0_level_0,neighborhood,sale_price_sqr_foot,housing_units,gross_rent
year,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1
2010,Alamo Square,291.182945,372560,1239
2010,Anza Vista,267.932583,372560,1239
2010,Bayview,170.098665,372560,1239
2010,Buena Vista Park,347.394919,372560,1239
2010,Central Richmond,319.027623,372560,1239


In [133]:
new_sfo_data = sfo_data.reset_index('year')
new_sfo_data

Unnamed: 0,year,neighborhood,sale_price_sqr_foot,housing_units,gross_rent
0,2010,Alamo Square,291.182945,372560,1239
1,2010,Anza Vista,267.932583,372560,1239
2,2010,Bayview,170.098665,372560,1239
3,2010,Buena Vista Park,347.394919,372560,1239
4,2010,Central Richmond,319.027623,372560,1239
...,...,...,...,...,...
392,2016,Telegraph Hill,903.049771,384242,4390
393,2016,Twin Peaks,970.085470,384242,4390
394,2016,Van Ness/ Civic Center,552.602567,384242,4390
395,2016,Visitacion Valley,328.319007,384242,4390


- - -

## Panel Visualizations

In this section, you will copy the code for each plot type from your analysis notebook and place it into separate functions that Panel can use to create panes for the dashboard. 

These functions will convert the plot object to a Panel pane.

Be sure to include any DataFrame transformation/manipulation code required along with the plotting code.

Return a Panel pane object from each function that can be used to build the dashboard.

Note: Remove any `.show()` lines from the code. We want to return the plots instead of showing them. The Panel dashboard will then display the plots.

In [None]:
# Define Panel Visualization Functions
def housing_units_per_year():
housing_units_per_year= pd.DataFrame(
    {
        "year": np.random.randint(2010, 2016, 100),
        "housing_units": np.random.randint(372560, 385000, 100),
        "sale_price_sqr_foot": np.random.randint(100, 1500, 100),
    }
).sort_values(["year", "housing_units"])

housing_units_per_year_plot = px.scatter(
    new_sfo_data,
    x="year",
    y="housing_units",
    color="sale_price_sqr_foot",
    title="San Fran, housing_units",
)

pane = pn.pane.Plotly(housing_units_per_year_plot)
pane





def average_gross_rent():
    """Average Gross Rent in San Francisco Per Year."""
    
gross_rent= pd.DataFrame(
    {
        "year": np.random.randint(2010, 2016, 100),
        "gross_rent": np.random.randint(372560, 385000, 100),
        "sale_price_sqr_foot": np.random.randint(100, 1500, 100),
    }
).sort_values(["year", "gross_rent"])

gross_rent_plot = px.scatter(
    new_sfo_data,
    x="year",
    y="gross_rent",
    color="sale_price_sqr_foot",
    title="San Fran, gross_rent",
)

pane = pn.pane.Plotly(gross_rent_plot)
pane



def average_sales_price():
    """Average Sales Price Per Year."""

average_sales_price= pd.DataFrame(
    {
        "year": np.random.randint(2010, 2016, 100),
        "neighborhood": np.random.randint(372560, 385000, 100),
        "sale_price_sqr_foot": np.random.randint(100, 1500, 100),
    }
).sort_values(["year", "sale_price_sqr_foot"])

average_sales_price_plot = px.scatter(
    new_sfo_data,
    x="sale_price_sqr_foot",
    y="neighborhood",
    color="year",
    title="San Fran, sale_price_sqr_foot",
)

pane = pn.pane.Plotly(average_sales_price_plot)
pane    
   



def average_price_by_neighborhood():
    """Average Prices by Neighborhood."""
average_rent= pd.DataFrame(
    {
        "year": np.random.randint(2010, 2016, 100),
        "neighborhood": np.random.randint(372560, 385000, 100),
        "sale_price_sqr_foot": np.random.randint(100, 1500, 100),
    }
).sort_values(["year", "sale_price_sqr_foot"])

average_rent_plot = px.scatter(
    rental_plot_data1,
    x="year",
    y="gross_rent",
    color="neighborhood",
    title="San Fran, gross_rent",
)

pane = pn.pane.Plotly(average_rent_plot)
pane   
 



def top_most_expensive_neighborhoods():
most_expensive= pd.DataFrame(
    {
        "year": np.random.randint(2010, 2016, 100),
        "neighborhood": np.random.randint(372560, 385000, 100),
        "sale_price_sqr_foot": np.random.randint(100, 1500, 100),
    }
).sort_values(["year", "sale_price_sqr_foot"])

most_expensive_plot = px.scatter(
    top_10_reset,
    x="year",
    y="sale_price_sqr_foot",
    color="neighborhood",
    title="San Fran, sale_price_sqr_foot",
)

pane = pn.pane.Plotly(most_expensive_plot)
pane


def most_expensive_neighborhoods_rent_sales():
    """Comparison of Rent and Sales Prices of Most Expensive Neighborhoods."""   
    
    # YOUR CODE HERE!

    
    
def parallel_coordinates():
    """Parallel Coordinates Plot."""

parallel_cooridinates= pd.DataFrame(
    {
        "year": np.random.randint(2010, 2016, 100),
        "neighborhood": np.random.randint(372560, 385000, 100),
        "sale_price_sqr_foot": np.random.randint(100, 1500, 100),
    }
).sort_values(["year", "sale_price_sqr_foot"])

parallel_cooridinates_plot = px.scatter(
    merged_data,
    x="Lat",
    y="Lon",
    color="neighborhood",
    title="San Fran, neighborhood coordinates",
)

pane = pn.pane.Plotly(parallel_cooridinates_plot)
pane



def parallel_categories():
    """Parallel Categories Plot."""
    



def neighborhood_map():
    """Neighborhood Map."""

    # YOUR CODE HERE!


def sunburst():
    """Sunburst Plot."""
    
    # YOUR CODE HERE!


## Panel Dashboard

In this section, you will combine all of the plots into a single dashboard view using Panel. Be creative with your dashboard design!

In [158]:
# Create a Title for the Dashboard
column = pn.Column(
    '# San Francisco Real Estate Market Statistics')
column


# Create a tab layout for the dashboard
tabs = pn.Tabs(
    ("housing_units_per_year", housing_units_per_year_plot),
    ("gross_rent", gross_rent_plot),
    ("average_sales_price", average_sales_price_plot),
    ("average_rent", average_rent_plot),
    ("10_most_expensive", most_expensive_plot),
    ("parallel_cooridinates", parallel_cooridinates_plot)
    
)
tabs

# Create the dashboard
# YOUR CODE HERE!

## Serve the Panel Dashboard

In [None]:
# Serve the# dashboard
# YOUR CODE HERE!

# Debugging

Note: Some of the Plotly express plots may not render in the notebook through the panel functions.

However, you can test each plot by uncommenting the following code

In [149]:
#housing_units_per_year()
housing_units_per_year= pd.DataFrame(
    {
        "year": np.random.randint(2010, 2016, 100),
        "housing_units": np.random.randint(372560, 385000, 100),
        "sale_price_sqr_foot": np.random.randint(100, 1500, 100),
    }
).sort_values(["year", "housing_units"])

housing_units_per_year_plot = px.scatter(
    new_sfo_data,
    x="year",
    y="housing_units",
    color="sale_price_sqr_foot",
    title="San Fran, housing_units",
)

pane = pn.pane.Plotly(housing_units_per_year_plot)
pane



In [148]:
# average_gross_rent()
gross_rent= pd.DataFrame(
    {
        "year": np.random.randint(2010, 2016, 100),
        "gross_rent": np.random.randint(372560, 385000, 100),
        "sale_price_sqr_foot": np.random.randint(100, 1500, 100),
    }
).sort_values(["year", "gross_rent"])

gross_rent_plot = px.scatter(
    new_sfo_data,
    x="year",
    y="gross_rent",
    color="sale_price_sqr_foot",
    title="San Fran, gross_rent",
)

pane = pn.pane.Plotly(gross_rent_plot)
pane

In [136]:
# average_sales_price()
average_rent_df= sfo_data.groupby(["year","neighborhood"]).mean()
average_rent_df.head()

Unnamed: 0_level_0,Unnamed: 1_level_0,sale_price_sqr_foot,housing_units,gross_rent
year,neighborhood,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1
2010,Alamo Square,291.182945,372560,1239
2010,Anza Vista,267.932583,372560,1239
2010,Bayview,170.098665,372560,1239
2010,Buena Vista Park,347.394919,372560,1239
2010,Central Richmond,319.027623,372560,1239


In [137]:
# average_price_by_neighborhood()

In [138]:
average_sales_price= pd.DataFrame(
    {
        "year": np.random.randint(2010, 2016, 100),
        "neighborhood": np.random.randint(372560, 385000, 100),
        "sale_price_sqr_foot": np.random.randint(100, 1500, 100),
    }
).sort_values(["year", "sale_price_sqr_foot"])

average_sales_price_plot = px.scatter(
    plot_data1,
    x="year",
    y="sale_price_sqr_foot",
    color="neighborhood",
    title="San Fran, sale_price_sqr_foot",
)

pane = pn.pane.Plotly(average_sales_price_plot)
pane

In [139]:
avg_hood_cost = plot_data1.groupby(["year","neighborhood"]).mean()
avg_hood_cost.head()
avg_hood_cost_sorted= avg_hood_cost.sort_values(['sale_price_sqr_foot'], ascending=[False])
avg_hood_cost_sorted.head(10)
top_10 = avg_hood_cost_sorted.head(10)
top_10_reset = top_10.reset_index()
top_10_reset

Unnamed: 0,year,neighborhood,sale_price_sqr_foot
0,2015,Union Square District,2258.702832
1,2016,Presidio Heights,1465.968586
2,2016,Merced Heights,1416.666667
3,2013,Union Square District,1290.472107
4,2014,Miraloma Park,1267.766203
5,2016,Parnassus/Ashbury Heights,1207.997485
6,2016,Outer Richmond,1196.645437
7,2015,Marina,1132.837361
8,2014,South of Market,1119.838877
9,2015,Corona Heights,1100.791194


In [140]:
most_expensive= pd.DataFrame(
    {
        "year": np.random.randint(2010, 2016, 100),
        "neighborhood": np.random.randint(372560, 385000, 100),
        "sale_price_sqr_foot": np.random.randint(100, 1500, 100),
    }
).sort_values(["year", "sale_price_sqr_foot"])

most_expensive_plot = px.scatter(
    top_10_reset,
    x="year",
    y="sale_price_sqr_foot",
    color="neighborhood",
    title="San Fran, sale_price_sqr_foot",
)

pane = pn.pane.Plotly(most_expensive_plot)
pane

In [141]:
# neighborhood_map().show()

rental_plot_data= average_rent_df.drop(columns= ["sale_price_sqr_foot", "housing_units"])
rental_plot_data1= rental_plot_data.reset_index()
rental_plot_data1.head()

Unnamed: 0,year,neighborhood,gross_rent
0,2010,Alamo Square,1239
1,2010,Anza Vista,1239
2,2010,Bayview,1239
3,2010,Buena Vista Park,1239
4,2010,Central Richmond,1239


In [142]:
average_rent= pd.DataFrame(
    {
        "year": np.random.randint(2010, 2016, 100),
        "neighborhood": np.random.randint(372560, 385000, 100),
        "sale_price_sqr_foot": np.random.randint(100, 1500, 100),
    }
).sort_values(["year", "sale_price_sqr_foot"])

average_rent_plot = px.scatter(
    rental_plot_data1,
    x="year",
    y="gross_rent",
    color="neighborhood",
    title="San Fran, gross_rent",
)

pane = pn.pane.Plotly(average_rent_plot)
pane

In [143]:
file_path1 = Path("Data/neighborhoods_coordinates.csv")
sfo_data1 = pd.read_csv(file_path1)
sfo_data1.head()
average_rent_df1= average_rent_df.reset_index()
average_rent_df1
plot_data_graph = plot_data1.hvplot(title="Average price per sq ft by neighborhood",groupby="neighborhood",x="year",y="sale_price_sqr_foot")
plot_data_graph
row_of_bar = pn.Row(plot_data_graph)
row_of_bar.append(rental_plot_data1)
row_of_bar
merged_data= pd.concat([average_rent_df1,sfo_data1], axis="columns", join="inner")
merged_data

Unnamed: 0,year,neighborhood,sale_price_sqr_foot,housing_units,gross_rent,Neighborhood,Lat,Lon
0,2010,Alamo Square,291.182945,372560,1239,Alamo Square,37.791012,-122.402100
1,2010,Anza Vista,267.932583,372560,1239,Anza Vista,37.779598,-122.443451
2,2010,Bayview,170.098665,372560,1239,Bayview,37.734670,-122.401060
3,2010,Buena Vista Park,347.394919,372560,1239,Bayview Heights,37.728740,-122.410980
4,2010,Central Richmond,319.027623,372560,1239,Bernal Heights,37.728630,-122.443050
...,...,...,...,...,...,...,...,...
68,2011,Croker Amazon,145.853380,374507,1530,West Portal,37.740260,-122.463880
69,2011,Diamond Heights,382.352261,374507,1530,Western Addition,37.792980,-122.435790
70,2011,Downtown,234.281624,374507,1530,Westwood Highlands,37.734700,-122.456854
71,2011,Duboce Triangle,295.779378,374507,1530,Westwood Park,37.734150,-122.457000


In [144]:
parallel_cooridinates= pd.DataFrame(
    {
        "year": np.random.randint(2010, 2016, 100),
        "neighborhood": np.random.randint(372560, 385000, 100),
        "sale_price_sqr_foot": np.random.randint(100, 1500, 100),
    }
).sort_values(["year", "sale_price_sqr_foot"])

parallel_cooridinates_plot = px.scatter(
    merged_data,
    x="Lat",
    y="Lon",
    color="neighborhood",
    title="San Fran, neighborhood coordinates",
)

pane = pn.pane.Plotly(parallel_cooridinates_plot)
pane

In [160]:
average_rent_df1

Unnamed: 0,year,neighborhood,sale_price_sqr_foot,housing_units,gross_rent
0,2010,Alamo Square,291.182945,372560,1239
1,2010,Anza Vista,267.932583,372560,1239
2,2010,Bayview,170.098665,372560,1239
3,2010,Buena Vista Park,347.394919,372560,1239
4,2010,Central Richmond,319.027623,372560,1239
...,...,...,...,...,...
392,2016,Telegraph Hill,903.049771,384242,4390
393,2016,Twin Peaks,970.085470,384242,4390
394,2016,Van Ness/ Civic Center,552.602567,384242,4390
395,2016,Visitacion Valley,328.319007,384242,4390


In [167]:
# parallel_categories()

parallel_categories = px.parallel_categories(
        average_rent_df1,
        dimensions=["neighborhood", "sale_price_sqr_foot", "housing_units", "gross_rent"],
        color="year",
        color_continuous_scale=px.colors.sequential.Inferno,
        labels={
            "neighborhood": "Neighborhood",
            "sale_price_sqr_foot": "Sale_price_sqr_foot",
            "housing_units": "Housing_units",
            "gross_rent": "Gross_rent",
        },
        width=1200,
    )
pane = pn.pane.Plotly(parallel_categories)
pane

In [None]:
# parallel_coordinates()

In [None]:
# sunburst()

In [156]:
column = pn.Column(
    '# San Francisco Real Estate Market Statistics')
column

In [157]:
tabs = pn.Tabs(
    ("housing_units_per_year", housing_units_per_year_plot),
    ("gross_rent", gross_rent_plot),
    ("average_sales_price", average_sales_price_plot),
    ("average_rent", average_rent_plot),
    ("10_most_expensive", most_expensive_plot),
    ("parallel_cooridinates", parallel_cooridinates_plot)
    
)
tabs


In [154]:
row = pn.Row(housing_units_per_year_plot, gross_rent_plot, average_sales_price_plot, average_rent_plot, 
             most_expensive_plot, parallel_cooridinates_plot)
row