In [2]:
%matplotlib notebook

# Dependencies
from matplotlib import pyplot as plt
from scipy import stats
import numpy as np
import pandas as pd
import import_ipynb
import matplotlib.patches as mpatches

In [3]:
# Read the Google Maps results CSV, then build a copy without the Lat/Lng columns
google_maps_df = pd.read_csv("Google_resources/Output/googlemaps_final2.csv")
coordinate_columns = ["Lat", "Lng"]
public_transportation_df = google_maps_df.drop(coordinate_columns, axis=1)
public_transportation_df

Unnamed: 0,CITY,STATE,bus_station,train_station,transit_station,subway_station,airport,taxi_stand
0,New York,NY,60,22,60,60,38,11
1,Los Angeles,CA,60,5,60,14,35,4
2,Chicago,IL,60,22,60,60,17,2
3,Houston,TX,60,1,60,0,45,0
4,Phoenix,AZ,60,4,60,0,34,1
5,Philadelphia,PA,60,40,60,49,29,0
6,San Antonio,TX,60,1,60,0,13,1
7,San Diego,CA,60,4,60,0,23,0
8,Dallas,TX,60,3,60,0,26,1
9,San Jose,CA,60,6,60,0,21,3


In [4]:
# Calculate sum of transportation services and add to prior df
#
# Only the explicit service-count columns are summed. A bare DataFrame.sum(axis=1)
# would also sweep in the CITY/STATE text columns (a TypeError on pandas >= 2.0,
# where non-numeric columns are no longer dropped silently) and, if this cell is
# run a second time, the previously added total itself.
transportation_columns = [
    "bus_station",
    "train_station",
    "transit_station",
    "subway_station",
    "airport",
    "taxi_stand",
]
sum_public_transportation = public_transportation_df[transportation_columns].sum(axis=1)

# Kept as a one-column frame under its original name for anything that still uses it
sum_public_transportation_df = sum_public_transportation.to_frame()
sum_public_transportation_df.columns = ["sum of public transportation"]

# assign() aligns on the index and overwrites the total column when it already
# exists, so re-running the cell cannot create duplicated "_x"/"_y" columns the
# way an index-on-index merge would.
public_transportation_df = public_transportation_df.assign(
    **{"sum of public transportation": sum_public_transportation}
)
public_transportation_df

Unnamed: 0,CITY,STATE,bus_station,train_station,transit_station,subway_station,airport,taxi_stand,sum of public transportation
0,New York,NY,60,22,60,60,38,11,251
1,Los Angeles,CA,60,5,60,14,35,4,178
2,Chicago,IL,60,22,60,60,17,2,221
3,Houston,TX,60,1,60,0,45,0,166
4,Phoenix,AZ,60,4,60,0,34,1,159
5,Philadelphia,PA,60,40,60,49,29,0,238
6,San Antonio,TX,60,1,60,0,13,1,135
7,San Diego,CA,60,4,60,0,23,0,147
8,Dallas,TX,60,3,60,0,26,1,150
9,San Jose,CA,60,6,60,0,21,3,150


In [12]:
# Bar chart of the summed transportation counts, one bar per city
fig = plt.figure("Public Transportation by City")
ax = fig.gca()
ax.set_title("Public Transportation by City")

# One bar position per DataFrame row, with a tick placed under every bar
x_axis = np.arange(public_transportation_df.shape[0])
tick_locations = list(x_axis)
ax.bar(
    x_axis,
    public_transportation_df["sum of public transportation"],
    color="red",
    alpha=0.5,
    align="center",
)

# Label each tick with its city name, rotated so the names do not overlap
ax.set_xticks(tick_locations)
ax.set_xticklabels(public_transportation_df["CITY"], rotation="vertical", fontsize=7)
ax.set_xlabel("Cities")
ax.set_ylabel("Sum of Public Transportation")

# Adjust the layout before writing the PNG, then display the figure
fig.tight_layout()
plt.savefig("Matplotlib_resources/transportationbycitybar.png")
plt.show()

<IPython.core.display.Javascript object>

In [11]:
# Bar chart of the train_station count for each city
fig = plt.figure("Number of Train Stations by City")
ax = fig.gca()
ax.set_title("Number of Train Stations by City")

# One bar position per DataFrame row, with a tick placed under every bar
x_axis = np.arange(public_transportation_df.shape[0])
tick_locations = list(x_axis)
ax.bar(
    x_axis,
    public_transportation_df["train_station"],
    color="blue",
    alpha=0.5,
    align="center",
)

# Label each tick with its city name, rotated so the names do not overlap
ax.set_xticks(tick_locations)
ax.set_xticklabels(public_transportation_df["CITY"], rotation="vertical", fontsize=7)
ax.set_xlabel("Cities")
ax.set_ylabel("Number of Train Stations")

# Adjust the layout before writing the PNG, then display the figure
fig.tight_layout()
plt.savefig("Matplotlib_resources/trainsbar.png")
plt.show()

<IPython.core.display.Javascript object>

In [10]:
# Plot bar graph of subway stations by city
plt.figure("Number of Subway Stations by City")
plt.title("Number of Subway Stations by City")

# One bar position per DataFrame row, with a tick placed under every bar
x_axis = np.arange(len(public_transportation_df))
tick_locations = list(x_axis)
plt.bar(x_axis, public_transportation_df["subway_station"], color="green", alpha=0.5, align="center")
plt.xticks(tick_locations, public_transportation_df["CITY"], rotation="vertical", fontsize=7)
plt.xlabel("Cities")
plt.ylabel("Number of Subway Stations")

# tight_layout() was missing only in this chart; without it the vertical city
# labels can be cut off at the bottom of the saved PNG.
plt.tight_layout()
plt.savefig("Matplotlib_resources/subwaybar.png")
plt.show()

<IPython.core.display.Javascript object>

In [13]:
# Bar chart of the airport count for each city
fig = plt.figure("Number of Airports by City")
ax = fig.gca()
ax.set_title("Number of Airports by City")

# One bar position per DataFrame row, with a tick placed under every bar
x_axis = np.arange(public_transportation_df.shape[0])
tick_locations = list(x_axis)
ax.bar(
    x_axis,
    public_transportation_df["airport"],
    color="purple",
    alpha=0.5,
    align="center",
)

# Label each tick with its city name, rotated so the names do not overlap
ax.set_xticks(tick_locations)
ax.set_xticklabels(public_transportation_df["CITY"], rotation="vertical", fontsize=7)
ax.set_xlabel("Cities")
ax.set_ylabel("Number of Airports")

# Adjust the layout before writing the PNG, then display the figure
fig.tight_layout()
plt.savefig("Matplotlib_resources/airportbar.png")
plt.show()

<IPython.core.display.Javascript object>

In [14]:
# Plot bar graph of taxi stands by city
plt.figure("Number of Taxi Stands by City")
plt.title("Number of Taxi Stands by City")

# One bar position per DataFrame row, with a tick placed under every bar
x_axis = np.arange(len(public_transportation_df))
tick_locations = list(x_axis)
plt.bar(x_axis, public_transportation_df["taxi_stand"], color="gray", alpha=0.5, align="center")

# fontsize=7 matches the other per-city bar charts in this notebook; this chart
# previously fell back to the default tick label size.
plt.xticks(tick_locations, public_transportation_df["CITY"], rotation="vertical", fontsize=7)
plt.xlabel("Cities")
plt.ylabel("Number of Taxi Stands")

# Adjust the layout before writing the PNG, then display the figure
plt.tight_layout()
plt.savefig("Matplotlib_resources/taxibar.png")
plt.show()

<IPython.core.display.Javascript object>