In [None]:
# Spatial Distribution of San Francisco's City-Owned Parks and Recreation Spaces
# Prepared by Elizabeth Owen (Individual Project)
# The purpose of this analysis is to visualize where access to recreation space exists (and does not exist) in San Francisco

In [2]:
# First, import the libraries we need to load and visualize our data:

# for general data wrangling tasks
import pandas as pd

# to read and visualize spatial data
import geopandas as gpd

# to provide basemaps 
import contextily as ctx

# to give more power to your figures (plots)
import matplotlib.pyplot as plt

In [3]:
# Read the Recreation and Parks properties GeoJSON into `parks`
parks = gpd.read_file(filename='SF_Recreation and Parks Properties.geojson')

In [None]:
# Dataset dimensions as a (row count, column count) tuple
(len(parks.index), len(parks.columns))

In [None]:
# Preview the first five rows of the table
parks.head(n=5)

In [None]:
# Let's visualize the dataset with a quick-look map of every feature.
# figsize is given in inches, so (100, 100) asks for a canvas thousands of pixels
# wide that is slow to render and bloats the saved notebook; 12 x 12 is ample here.
parks.plot(figsize=(12, 12))

In [None]:
# Remove the county data row (the record at index label 0).
# errors='ignore' keeps this cell safe to re-run: once label 0 is gone, a plain
# drop([0]) raises KeyError on the second execution.
parks = parks.drop(index=[0], errors='ignore')

In [None]:
# Re-inspect the leading five rows of the table
parks.head(n=5)

In [None]:
# Now we can visualize the cleaned up data: draw the layer as a map
# (a table preview here would not show the spatial result). figsize is in inches.
parks.plot(figsize=(12, 12))

In [None]:
# Summary statistics for the property-type column
parks.loc[:, 'propertytype'].describe()

In [None]:
# Number of records per property type, most frequent first
parks['propertytype'].value_counts(sort=True, ascending=False)

In [None]:
# Keep the per-type tallies in a variable so they can be reused in later cells
parks_count = parks.loc[:, 'propertytype'].value_counts()
parks_count

In [None]:
# Turn the per-type tallies into a two-column DataFrame for plotting.
# Column names are pinned explicitly because a bare reset_index() yields
# ('index', 'propertytype') on pandas < 2.0 but ('propertytype', 'count') on
# pandas >= 2.0, which breaks the x='index' / y='propertytype' plots in this notebook.
#   'index'        -> property type label
#   'propertytype' -> number of properties of that type
# Rebuilding from `parks` (instead of reshaping parks_count in place) also makes
# the cell give the same result every time it is run.
parks_count = (
    parks['propertytype']
    .value_counts()
    .rename_axis('index')
    .reset_index(name='propertytype')
)
parks_count

In [None]:
# Scatter plot of the 'index' column (x) against the 'propertytype' column (y)
parks_count.plot(kind='scatter', x='index', y='propertytype', alpha=0.9)

In [None]:
# Bar chart of the number of properties per property type.
# The plotted columns are named 'index' and 'propertytype', which would otherwise
# appear verbatim as the x-axis label and legend entry even though the bars show
# counts per type; label the axes explicitly and drop the legend.
ax = parks_count.plot.bar(
    x='index',
    y='propertytype',
    legend=False,
    title='City of SF Parks and Rec Spaces',
)
ax.set_xlabel('Property type')
ax.set_ylabel('Number of properties');

In [None]:
# Map the properties coloured by property type, with a legend.
# - propertytype is treated as a category label elsewhere in this notebook
#   (value_counts / bar chart), so it is drawn with categorical=True.
#   scheme='NaturalBreaks' is a numeric classifier and is not meant for label
#   columns -- NOTE(review): confirm the column holds text labels.
# - figsize is in inches; (200, 200) requested an enormous canvas, so use a
#   size that renders quickly.
parks.plot(figsize=(12, 12),
           column='propertytype',
           categorical=True,
           legend=True)
