# San Francisco Rental Prices Dashboard

In this notebook, you will compile the visualizations from the previous analysis into functions that can be used for a Panel dashboard.

In [28]:
# imports
import panel as pn
pn.extension('plotly')
import plotly.express as px
import pandas as pd
import hvplot.pandas
import matplotlib.pyplot as plt
import os
from pathlib import Path
from dotenv import load_dotenv

In [29]:
# Read the Mapbox API key
load_dotenv()
map_box_api = os.getenv("mapbox")
px.set_mapbox_access_token(map_box_api)

# Import Data

In [30]:
# Import the necessary CSVs to Pandas DataFrames
file_path = Path("Data/sfo_neighborhoods_census_data.csv")
sfo_data = pd.read_csv(file_path, index_col = "year")

# check for NA values
number_of_na = sfo_data.isna().sum().sum()
print(f"Number of NA values in the SFO Census DataFrame: {number_of_na}")

# check for null values
number_of_nulls = sfo_data.isnull().sum().sum()
print(f"Number of NULL values in the SFO Census DataFrame: {number_of_nulls}")

# Dropping NA and NULL values
sfo_data.dropna(inplace = True)

number_of_na = sfo_data.isna().sum().sum()
print(f"Number of NA values after drop function is applied: {number_of_na}")

# Check for NULL values after drop function
number_of_nulls = sfo_data.isnull().sum().sum()
print(f"Number of NULL values after drop function is applied: {number_of_nulls}")

Number of NA values in the SFO Census DataFrame: 5
Number of NULL values in the SFO Census DataFrame: 5
Number of NA values after drop function is applied: 0
Number of NULL values after drop function is applied: 0


In [31]:
# Load in neighborhoods coordinates data and setup a DataFrame
file_path = Path("Data/neighborhoods_coordinates.csv")

coordinate_data_df = pd.read_csv(file_path)
coordinate_data_df.columns = ["neighborhood", "lat", "lon"]
coordiante_data_df = coordinate_data_df.set_index("neighborhood")

# checking for NA values
number_of_na_coordiante_data = coordinate_data_df.isna().sum().sum()
print(f"Number of NA values in the coordinate data: {number_of_na_coordiante_data}")

# checking for NULL values
number_of_nulls_coordinate_data = coordinate_data_df.isnull().sum().sum()
print(f"Number of NULL values in the coordinate data: {number_of_nulls_coordinate_data}")

Number of NA values in the coordinate data: 0
Number of NULL values in the coordinate data: 0


# Global DataFrames (used in multiple graphs)

In [35]:
# Create global DataFrames to improve code preformance these DF's are used in multiple graphs to plot the data

# group by year and neighborhood and create a DataFrame with all of the mean values
means = sfo_data.groupby(["year", "neighborhood"]).mean()
means_df = pd.DataFrame(means)

# make a dataframe for sales price per neighborhood, housing units and gross rent for each neighborhood (mean)
mean_values_neighborhood = sfo_data.groupby(["neighborhood"]).mean()
mean_values_neighborhood_df = pd.DataFrame(mean_values_neighborhood)

# filter out the 10 most expensive neighborhoods for sales price per sq ft
top_10_mean_sale_price_of_neighborhood_df = mean_values_neighborhood_df.nlargest(10, "sale_price_sqr_foot")

# reset the index for the top 10 neighborhoods per sq foot dataframe
top_10__mean_sale_price_of_neighborhood_no_index_df = top_10_mean_sale_price_of_neighborhood_df.reset_index()

# list the top 10 neighborhoods
top_ten_ = top_10_mean_sale_price_of_neighborhood_df["neighborhood"].tolist()

# reset and create a dataframe from the original DF (sfo_data) without an index
sfo_data_no_index = sfo_data.reset_index()

# selecting a subject containing the top 10 neighborhood names from (sfo_data_no_index)
yearly_change_of_rent_and_price_top_10_no_index = sfo_data_no_index[sfo_data_no_index["neighborhood"].isin(top_10_neighborhoods)]

# setting the index of the top 10 neighborhood data with yearly variation included in the neighborhoods
yearly_change_of_rent_and_price_top_10 = yearly_change_of_rent_and_price_top_10_n_index.set_index(["neighborhood"])

# join the average values with the neighborhood locations
combined_sfo_df = pd.concat([mean_values_neighborhood_df, coordinate_data_df], axis = "columns", join = "inner")
combined_sfo_df.head()

# remove the index of the combined dataframe
combined_sfo_no_index = combined_sfo_df.reset_index()

# print and view the dataframe
combined_sfo_no_index.head()

KeyError: 'neighborhood'

## Panel Visualizations

In this section, you will copy the code for each plot type from your analysis notebook and place it into separate functions that Panel can use to create panes for the dashboard. 

These functions will convert the plot object to a Panel pane.

Be sure to include any DataFrame transformation/manipulation code required along with the plotting code.

Return a Panel pane object from each function that can be used to build the dashboard.

Note: Remove any `.show()` lines from the code. We want to return the plots instead of showing them. The Panel dashboard will then display the plots.

In [None]:
# Define Panel Visualization Functions
def housing_units_per_year():
    """Housing Units Per Year."""
    
    average_housing_units_per_year = sfo_data["housing_units"].groupby(["year"]).mean()
    average_housing_units_per_year_df = pd.DataFrame(average_housing_units_per_year)
    average_housing_units_per_year_df.head()

    average_housing_units_per_year_df.hvplot.bar
        (xlabel = "Year", 
         ylabel = "Average Housing Units", 
         ylim = (370000, 385000), 
         title = "Average Annual Housing Unit Occupation in San Francisco\n"
    )
    return housing_units_per_year_plot
        
        
def average_gross_rent():
    """Average Gross Rent in San Francisco Per Year."""
    
    # YOUR CODE HERE!



def average_sales_price():
    """Average Sales Price Per Year."""
    
    # YOUR CODE HERE!



def average_price_by_neighborhood():
    """Average Prices by Neighborhood."""
    
    # YOUR CODE HERE!



def top_most_expensive_neighborhoods():
    """Top 10 Most Expensive Neighborhoods."""

    # YOUR CODE HERE!


def most_expensive_neighborhoods_rent_sales():
    """Comparison of Rent and Sales Prices of Most Expensive Neighborhoods."""   
    
    # YOUR CODE HERE!

    
    
def parallel_coordinates():
    """Parallel Coordinates Plot."""

    # YOUR CODE HERE!



def parallel_categories():
    """Parallel Categories Plot."""
    
    # YOUR CODE HERE!



def neighborhood_map():
    """Neighborhood Map."""

    # YOUR CODE HERE!


def sunburst():
    """Sunburst Plot."""
    
    # YOUR CODE HERE!


## Panel Dashboard

In this section, you will combine all of the plots into a single dashboard view using Panel. Be creative with your dashboard design!

In [None]:
# Create a Title for the Dashboard
occupation_rent_column = pn.Column(
    "##"
)

# Create a tab layout for the dashboard
# YOUR CODE HERE!


# Create the dashboard
# YOUR CODE HERE!

## Serve the Panel Dashboard

In [None]:
# Serve the# dashboard
# YOUR CODE HERE!

# Debugging

Note: Some of the Plotly express plots may not render in the notebook through the panel functions.

However, you can test each plot by uncommenting the following code

In [None]:
# housing_units_per_year()

In [None]:
# average_gross_rent()

In [None]:
# average_sales_price()

In [None]:
# average_price_by_neighborhood()

In [None]:
# top_most_expensive_neighborhoods()

In [None]:
# most_expensive_neighborhoods_rent_sales()

In [None]:
# neighborhood_map().show()

In [None]:
# parallel_categories()

In [None]:
# parallel_coordinates()

In [None]:
# sunburst()