# San Francisco Rental Prices Dashboard

In this notebook, you will compile the visualizations from the previous analysis into functions that can be used for a Panel dashboard.

In [7]:
# imports
import panel as pn
pn.extension('plotly')
import plotly.express as px
import pandas as pd
import hvplot.pandas
import matplotlib.pyplot as plt
import os
from pathlib import Path
from dotenv import load_dotenv
from panel.interact import interact

In [2]:
# Pull environment variables from a .env file (if one is found), then
# register the Mapbox access token with Plotly Express for the map plot.
load_dotenv()
mapbox_token = os.environ.get("MAPBOX_API_KEY")
px.set_mapbox_access_token(mapbox_token)

# Import Data

In [3]:
# Load the two source CSV files into pandas DataFrames.
# Census data: the "year" column is used as the DataFrame index.
file_path = Path("Data/sfo_neighborhoods_census_data.csv")
sfo_data = pd.read_csv(file_path, index_col="year")

# Neighborhood coordinates: read with the default integer index.
# Note that `file_path` is reused and now points at the coordinates file.
file_path = Path("Data/neighborhoods_coordinates.csv")
df_neighborhood_locations = pd.read_csv(file_path)

- - -

## Panel Visualizations

In this section, you will copy the code for each plot type from your analysis notebook and place it into separate functions that Panel can use to create panes for the dashboard. 

These functions will convert the plot object to a Panel pane.

Be sure to include any DataFrame transformation/manipulation code required along with the plotting code.

Return a Panel pane object from each function that can be used to build the dashboard.

Note: Remove any `.show()` lines from the code. We want to return the plots instead of showing them. The Panel dashboard will then display the plots.

In [4]:
# Define Panel Visualization Functions
def housing_units_per_year():
    """Build a bar chart of the mean number of housing units per year.

    Reads the module-level ``sfo_data`` DataFrame, averages the
    ``housing_units`` column within each ``year`` group and draws the result
    as a bar chart.  The y-axis spans from one standard deviation below the
    smallest yearly mean to one standard deviation above the largest.

    Returns:
        matplotlib.axes.Axes: The axes holding the chart.  The parent figure
        is reachable through the axes' ``.figure`` attribute.
    """
    # Mean number of housing units for each year
    annual_units = sfo_data.groupby("year")["housing_units"].mean()
    au_min = annual_units.min()
    au_max = annual_units.max()
    au_std = annual_units.std()

    # Draw on a dedicated figure: Series.plot would otherwise reuse whatever
    # pyplot axes happen to be current when another figure is still open.
    fig, ax = plt.subplots()
    annual_units.plot.bar(
        ax=ax,
        ylim=[au_min - au_std, au_max + au_std],
        title="Housing Units in San Francisco from 2010 to 2016",
    )
    ax.set_xlabel("Year")
    ax.set_ylabel("Housing Units")

    # Close exactly this figure in pyplot; the Axes/Figure objects stay usable.
    plt.close(fig)

    return ax

def average_gross_rent():
    """Build a line chart of the average gross rent per year.

    Reads the module-level ``sfo_data`` DataFrame and averages the
    ``gross_rent`` column within each ``year`` group.

    Returns:
        matplotlib.axes.Axes: The axes holding the chart.  The parent figure
        is reachable through the axes' ``.figure`` attribute.
    """
    # Only the gross-rent column is needed here.  Selecting a single column
    # also avoids indexing the groupby with a tuple of names, which recent
    # pandas versions reject (a list is required for multiple columns).
    avg_gross_rent = sfo_data.groupby("year")["gross_rent"].mean()

    # Draw on a dedicated figure instead of relying on pyplot's current axes.
    fig, ax = plt.subplots()
    avg_gross_rent.plot(ax=ax, title="Average Gross Rent in San Francisco")
    ax.set_xlabel("Year")
    ax.set_ylabel("Average Gross Rent")

    # Close exactly this figure in pyplot; the Axes/Figure objects stay usable.
    plt.close(fig)

    return ax

def average_sales_price():
    """Build a line chart of the average sale price per square foot per year.

    Reads the module-level ``sfo_data`` DataFrame and averages the
    ``sale_price_sqr_foot`` column within each ``year`` group.

    Returns:
        matplotlib.axes.Axes: The axes holding the chart.  The parent figure
        is reachable through the axes' ``.figure`` attribute.
    """
    # Only the sale-price column is needed here.  Selecting a single column
    # also avoids indexing the groupby with a tuple of names, which recent
    # pandas versions reject (a list is required for multiple columns).
    avg_sale_price = sfo_data.groupby("year")["sale_price_sqr_foot"].mean()

    # Draw on a dedicated figure instead of relying on pyplot's current axes.
    fig, ax = plt.subplots()
    avg_sale_price.plot(
        ax=ax,
        title="Average Sale Price per Square Foot in San Francisco",
    )
    ax.set_xlabel("Year")
    ax.set_ylabel("Average Sale Price")

    # Close exactly this figure in pyplot; the Axes/Figure objects stay usable.
    plt.close(fig)

    return ax

def average_price_by_neighborhood(neighborhood):
    """Build a line plot of the yearly average sale price for one neighborhood.

    Reads the module-level ``sfo_data`` DataFrame, keeps the rows whose
    ``neighborhood`` column equals ``neighborhood`` and averages
    ``sale_price_sqr_foot`` within each ``year`` group.

    Args:
        neighborhood: Value to match against the ``neighborhood`` column; it
            is also interpolated into the plot title.

    Returns:
        The hvPlot line plot of average sale price per square foot by year.
    """
    # Filter first, then average per year.  The column is selected with a
    # list: indexing a groupby with a tuple of names is rejected by recent
    # pandas versions.
    nh_prices = (
        sfo_data.loc[sfo_data["neighborhood"] == neighborhood]
        .groupby("year")[["sale_price_sqr_foot"]]
        .mean()
        .reset_index()
    )

    # Plot against the year column explicitly; plotting the bare Series after
    # reset_index() would put meaningless integer row labels on the x-axis.
    avg_price_hvplot = nh_prices.hvplot.line(
        x="year",
        y="sale_price_sqr_foot",
        xlabel="Year",
        ylabel="Avg. Sale Price per Square Foot",
        title=f"Average Price per Sq Ft for {neighborhood}",
    )

    return avg_price_hvplot

def top_most_expensive_neighborhoods():
    """Bar plot of the ten neighborhoods with the highest mean sale price.

    Averages every column of the module-level ``sfo_data`` per neighborhood,
    orders the result by ``sale_price_sqr_foot`` from highest to lowest and
    plots the first ten rows with hvPlot.

    Returns:
        The hvPlot bar plot of the ten highest-priced neighborhoods.
    """
    # Per-neighborhood means, most expensive first, neighborhood as a column
    ranked_by_price = (
        sfo_data.groupby("neighborhood")
        .mean()
        .sort_values("sale_price_sqr_foot", ascending=False)
        .reset_index()
    )
    ten_priciest = ranked_by_price.head(10)

    # Bar chart of the ten highest average sale prices
    return ten_priciest.hvplot.bar(
        x="neighborhood",
        xlabel="Neighborhood",
        y="sale_price_sqr_foot",
        ylabel="Avg. Sale Price per Square Foot",
        title="Top 10 Expensive Neighborhoods in San Francisco",
        rot=90,
        height=500,
    )

def parallel_coordinates():
    """Parallel-coordinates plot of the ten highest-priced neighborhoods.

    Averages every column of the module-level ``sfo_data`` per neighborhood,
    orders the result by ``sale_price_sqr_foot`` from highest to lowest and
    passes the first ten rows to Plotly Express.  No ``dimensions`` are
    given, so Plotly Express chooses which columns to draw.

    Returns:
        The Plotly Express parallel-coordinates figure, colored by
        ``sale_price_sqr_foot``.
    """
    # Per-neighborhood means, most expensive first, neighborhood as a column
    ranked_by_price = (
        sfo_data.groupby("neighborhood")
        .mean()
        .sort_values("sale_price_sqr_foot", ascending=False)
        .reset_index()
    )
    ten_priciest = ranked_by_price.head(10)

    # Lines are colored by the average sale price per square foot
    return px.parallel_coordinates(
        ten_priciest,
        color="sale_price_sqr_foot",
        color_continuous_scale=px.colors.diverging.Portland,
    )

def parallel_categories():
    """Parallel-categories plot of the ten highest-priced neighborhoods.

    Averages every column of the module-level ``sfo_data`` per neighborhood,
    orders the result by ``sale_price_sqr_foot`` from highest to lowest and
    passes the first ten rows to Plotly Express.  No ``dimensions`` are
    given, so Plotly Express chooses which columns to draw.

    Returns:
        The Plotly Express parallel-categories figure, colored by
        ``sale_price_sqr_foot``.
    """
    # Per-neighborhood means, most expensive first, neighborhood as a column
    ranked_by_price = (
        sfo_data.groupby("neighborhood")
        .mean()
        .sort_values("sale_price_sqr_foot", ascending=False)
        .reset_index()
    )
    ten_priciest = ranked_by_price.head(10)

    # Ribbons are colored by the average sale price per square foot
    return px.parallel_categories(
        ten_priciest,
        color="sale_price_sqr_foot",
        color_continuous_scale=px.colors.diverging.Spectral,
    )

def neighborhood_map():
    """Build a Mapbox scatter map of average prices per neighborhood.

    Averages every column of the module-level ``sfo_data`` per neighborhood,
    places those averages side by side with ``df_neighborhood_locations`` and
    plots one marker per row: marker size follows ``sale_price_sqr_foot`` and
    marker color follows ``gross_rent``.

    Returns:
        The Plotly Express scatter-mapbox figure.
    """
    # Mean values for each neighborhood, with the neighborhood as a column
    avg_value_nh = sfo_data.groupby("neighborhood").mean().reset_index()

    # Put the coordinates and the averages side by side.
    # NOTE(review): concat aligns the two frames by row position (their
    # integer index), not by neighborhood name.  This presumably relies on
    # both frames listing the same neighborhoods in the same order - confirm,
    # or switch to a key-based merge once the coordinate file's name column
    # is verified.
    avg_value_nh_loc = pd.concat(
        [df_neighborhood_locations, avg_value_nh],
        axis="columns",
        join="inner",
    ).drop(columns="neighborhood")

    # Scatter mapbox: marker size = sale price per sq ft, color = gross rent
    map_plot = px.scatter_mapbox(
        avg_value_nh_loc,
        lat="Lat",
        lon="Lon",
        size="sale_price_sqr_foot",
        color="gross_rent",
        zoom=11,
        color_continuous_scale=px.colors.cyclical.IceFire,
    )

    return map_plot


## Panel Dashboard

In this section, you will combine all of the plots into a single dashboard view using Panel. Be creative with your dashboard design!

In [5]:
# Welcome Tab: introductory text followed by the neighborhood map
welcome = pn.Column(
    """This dashboard presents a visual analysis of historical prices of house units, 
    sale price per square foot and gross rent in San Francisco, CA from 2010 to 2016. 
    You can navigate through the tabs above to explore more details about the evolution
    of the real estate market on The Golden City across these years.""",
    neighborhood_map()
)

# Yearly Market Analysis Tab: the three matplotlib charts side by side.
# Each function returns an Axes, so its parent Figure is handed to Panel.
yearly_analysis = pn.Row(
    housing_units_per_year().figure,
    average_gross_rent().figure,
    average_sales_price().figure
)

# Neighborhood Analysis Tab: a neighborhood selector driving the per-year
# price plot, stacked above the top-10 bar chart.
neighborhoods = sfo_data.groupby("neighborhood").count().index.tolist()
widget = interact(average_price_by_neighborhood, neighborhood = neighborhoods)
nh_analysis = pn.Column(
        widget,
        top_most_expensive_neighborhoods()
)

# Parallel Plots Analysis Tab.
# The plot functions must be *called* so the column receives the figures,
# consistent with every other tab (previously the function objects themselves
# were passed to pn.Column).
parallels = pn.Column(
    parallel_coordinates(),
    parallel_categories()
)

# Assemble the tabs in display order
plot_as_tab = pn.Tabs(
    ("Welcome", welcome),
    ("Yearly Market Analysis", yearly_analysis),
    ("Neighborhood Analysis", nh_analysis),
    ("Parallel Plots Analysis", parallels)
)

## Serve the Panel Dashboard

In [8]:
# Flag the tabbed dashboard as servable (see Panel's `servable()` docs).
# As the last expression in the cell, its return value is what the notebook displays.
plot_as_tab.servable()