## Read the part 2 data from CSV

In [4]:
!conda install -c conda-forge geopy --yes # uncomment this line if you haven't completed the Foursquare API lab

Solving environment: done


  current version: 4.5.11
  latest version: 4.8.2

Please update conda by running

    $ conda update -n base -c defaults conda



## Package Plan ##

  environment location: /home/jupyterlab/conda/envs/python

  added / updated specs: 
    - geopy


The following packages will be downloaded:

    package                    |            build
    ---------------------------|-----------------
    certifi-2019.11.28         |           py36_0         149 KB  conda-forge
    scikit-learn-0.20.1        |   py36h22eb022_0         5.7 MB
    liblapack-3.8.0            |      11_openblas          10 KB  conda-forge
    numpy-1.18.1               |   py36h95a1406_0         5.2 MB  conda-forge
    liblapacke-3.8.0           |      11_openblas          10 KB  conda-forge
    geographiclib-1.50         |             py_0          34 KB  conda-forge
    libopenblas-0.3.6          |       h5a2b251_2         7.7 MB
    scipy-1.4.1                |   py36h921218d_0        

In [5]:
import pandas as pd
import numpy as np

In [6]:
from geopy.geocoders import Nominatim # convert an address into latitude and longitude values

import requests # library to handle requests
from pandas.io.json import json_normalize # tranform JSON file into a pandas dataframe

# Matplotlib and associated plotting modules
import matplotlib.cm as cm
import matplotlib.colors as colors

# import k-means from clustering stage
from sklearn.cluster import KMeans

#!conda install -c conda-forge folium=0.5.0 --yes # uncomment this line if you haven't completed the Foursquare API lab
import folium # map rendering library

print('Libraries imported.')

Libraries imported.


In [7]:
# Load the table from the CSV file (the "part 2" data named in the heading above).
df = pd.read_csv("week3-2.csv")

In [8]:
df

Unnamed: 0,PostalCode,Borough,Neighbourhood,Latitude,Longitude
0,M3A,North York,Parkwoods,43.753259,-79.329656
1,M4A,North York,Victoria Village,43.725882,-79.315572
2,M5A,Downtown Toronto,Harbourfront,43.654260,-79.360636
3,M6A,North York,"Lawrence Heights,Lawrence Manor,Lawrence Heigh...",43.718518,-79.464763
4,M7A,Downtown Toronto,Queen's Park,43.662301,-79.389494
...,...,...,...,...,...
98,M8X,Etobicoke,"The Kingsway,Montgomery Road,Old Mill North,Th...",43.653654,-79.506944
99,M4Y,Downtown Toronto,Church and Wellesley,43.665860,-79.383160
100,M7Y,East Toronto,Business Reply Mail Processing Centre 969 Eastern,43.662744,-79.321558
101,M8Y,Etobicoke,"Humber Bay,King's Mill Park,Kingsway Park Sout...",43.636258,-79.498509


## Explore Downtown Toronto

In [9]:
# Keep only the Downtown Toronto rows and renumber them from 0.
df_dt = df.loc[df["Borough"] == "Downtown Toronto"].reset_index(drop=True)
df_dt

Unnamed: 0,PostalCode,Borough,Neighbourhood,Latitude,Longitude
0,M5A,Downtown Toronto,Harbourfront,43.65426,-79.360636
1,M7A,Downtown Toronto,Queen's Park,43.662301,-79.389494
2,M5B,Downtown Toronto,"Ryerson,Garden District,Ryerson,Garden Distric...",43.657162,-79.378937
3,M5C,Downtown Toronto,St. James Town,43.651494,-79.375418
4,M5E,Downtown Toronto,Berczy Park,43.644771,-79.373306
5,M5G,Downtown Toronto,Central Bay Street,43.657952,-79.387383
6,M6G,Downtown Toronto,Christie,43.669542,-79.422564
7,M5H,Downtown Toronto,"Adelaide,King,Richmond,Adelaide,King,Richmond,...",43.650571,-79.384568
8,M5J,Downtown Toronto,"Harbourfront East,Toronto Islands,Union Statio...",43.640816,-79.381752
9,M5K,Downtown Toronto,"Design Exchange,Toronto Dominion Centre,Design...",43.647177,-79.381576


## Map of the neighborhoods in Downtown Toronto

In [10]:
address = 'Downtown Toronto'

# Resolve the address to coordinates with the Nominatim geocoder.
geolocator = Nominatim(user_agent="dt_explorer")
location = geolocator.geocode(address)
if location is None:
    # geocode() yields None when nothing matches; fail with a clear message
    # instead of an AttributeError on the attribute lookups below.
    raise ValueError('Could not geocode address: {!r}'.format(address))
latitude = location.latitude
longitude = location.longitude
print('The geograpical coordinate of Downtown Toronto are {}, {}.'.format(latitude, longitude))

The geograpical coordinate of Downtown Toronto are 43.6541737, -79.38081164513409.


In [11]:
# create map of Downtown Toronto using latitude and longitude values
map_dt = folium.Map(location=[latitude, longitude], zoom_start=11)

# add markers to map: one circle per row of df_dt, with the postal code as popup text
for lat, lng, label in zip(df_dt['Latitude'], df_dt['Longitude'], df_dt['PostalCode']):
    label = folium.Popup(label, parse_html=True)
    # NOTE(review): parse_html is passed to CircleMarker here as well as to
    # Popup above -- confirm that CircleMarker actually uses this argument.
    folium.CircleMarker(
        [lat, lng],
        radius=5,
        popup=label,
        color='blue',
        fill=True,
        fill_color='#3186cc',
        fill_opacity=0.7,
        parse_html=False).add_to(map_dt)  
    
# last expression of the cell, so the map is displayed as the cell output
map_dt

## Foursquare API credentials

In [45]:
import os

# Foursquare API credentials. Real values are read from the environment so
# they never have to be saved in the notebook; the 'deleted' placeholder is
# kept as the fallback so the cell still runs when the variables are unset.
CLIENT_ID = os.environ.get('FOURSQUARE_CLIENT_ID', 'deleted') # your Foursquare ID
CLIENT_SECRET = os.environ.get('FOURSQUARE_CLIENT_SECRET', 'deleted') # your Foursquare Secret
VERSION = '20200212' # Foursquare API version

print('Your credentails:')
print('CLIENT_ID: ' + CLIENT_ID)
# Do not echo the secret into the saved cell output; print a mask of the
# same length instead.
print('CLIENT_SECRET:' + '*' * len(CLIENT_SECRET))

Your credentails:
CLIENT_ID: deleted
CLIENT_SECRET:deleted


## loop through all neighborhoods (PostalCodes)

#### Useful functions, taken from the example Jupyter notebook

In [13]:
def get_category_type(row):
    """Return the name of the first category of a venue record.

    Parameters
    ----------
    row : mapping-like (e.g. a pandas Series or a dict)
        Must provide the category list under the key 'categories' or,
        failing that, under 'venue.categories'.

    Returns
    -------
    The 'name' entry of the first category, or None when the category
    list is empty.

    Raises
    ------
    KeyError
        If neither 'categories' nor 'venue.categories' is present.
    """
    try:
        categories_list = row['categories']
    except KeyError:
        # Only a missing key triggers the fallback; any other error is a real
        # problem and must not be silently swallowed.
        categories_list = row['venue.categories']

    if len(categories_list) == 0:
        return None
    return categories_list[0]['name']

In [14]:
def getNearbyVenues(names, latitudes, longitudes, radius=500, limit=None):
    """Query the Foursquare 'explore' endpoint once per location and collect the venues.

    Parameters
    ----------
    names, latitudes, longitudes : iterables of equal length
        Label and coordinates of each location; they are walked in parallel.
    radius : value substituted into the `radius` query parameter (default 500).
    limit : value substituted into the `limit` query parameter. When None
        (the default) the notebook-level LIMIT is used, as before.

    Returns
    -------
    pandas.DataFrame
        One row per returned venue with the columns 'PostalCode',
        'Neighborhood Latitude', 'Neighborhood Longitude', 'Venue',
        'Venue Latitude', 'Venue Longitude', 'Venue Category'.
        The frame is empty (but has these columns) when no venue is returned.

    Raises
    ------
    requests.HTTPError
        If a request comes back with an HTTP error status.

    Notes
    -----
    Reads the notebook-level CLIENT_ID, CLIENT_SECRET and VERSION.
    """
    if limit is None:
        limit = LIMIT  # looked up at call time, so the defining cell must have run

    column_names = ['PostalCode',
                    'Neighborhood Latitude',
                    'Neighborhood Longitude',
                    'Venue',
                    'Venue Latitude',
                    'Venue Longitude',
                    'Venue Category']

    rows = []
    for name, lat, lng in zip(names, latitudes, longitudes):

        # create the API request URL
        url = 'https://api.foursquare.com/v2/venues/explore?&client_id={}&client_secret={}&v={}&ll={},{}&radius={}&limit={}'.format(
            CLIENT_ID,
            CLIENT_SECRET,
            VERSION,
            lat,
            lng,
            radius,
            limit)

        # make the GET request; surface HTTP failures directly rather than as a
        # KeyError on a response body that lacks the expected structure
        response = requests.get(url)
        response.raise_for_status()
        results = response.json()["response"]['groups'][0]['items']

        # keep only the relevant information for each nearby venue
        for item in results:
            venue = item['venue']
            categories = venue.get('categories') or []
            rows.append((
                name,
                lat,
                lng,
                venue['name'],
                venue['location']['lat'],
                venue['location']['lng'],
                # a venue without any category gets None instead of raising IndexError
                categories[0]['name'] if categories else None))

    # passing the column names to the constructor also works when `rows` is empty
    nearby_venues = pd.DataFrame(rows, columns=column_names)

    return(nearby_venues)

In [15]:
# Request settings used for this call.
LIMIT = 100 # limit of number of venues returned by Foursquare API
radius = 500 # define radius

# Take the first row of df_dt (label 0) as the sample location.
neighborhood_name = df_dt.loc[0, 'PostalCode'] # postal code, used as the neighborhood name
neighborhood_latitude = df_dt.loc[0, 'Latitude'] # neighborhood latitude value
neighborhood_longitude = df_dt.loc[0, 'Longitude'] # neighborhood longitude value

print('Latitude and longitude values of {} are {}, {}.'.format(
    neighborhood_name, neighborhood_latitude, neighborhood_longitude))

# create URL
url = 'https://api.foursquare.com/v2/venues/explore?&client_id={}&client_secret={}&v={}&ll={},{}&radius={}&limit={}'.format(
    CLIENT_ID, CLIENT_SECRET, VERSION,
    neighborhood_latitude, neighborhood_longitude,
    radius, LIMIT)

# fetch the JSON response and keep the items of its first group
results = requests.get(url).json()
venues = results['response']['groups'][0]['items']


Latitude and longitude values of M5A are 43.6542599, -79.3606359.


In [16]:
    
# columns to keep from the flattened JSON
filtered_columns = ['venue.name', 'venue.categories', 'venue.location.lat', 'venue.location.lng']

# flatten JSON and keep only those columns
nearby_venues = json_normalize(venues).loc[:, filtered_columns]

# replace each row's category list with the name of its first category
nearby_venues['venue.categories'] = nearby_venues.apply(get_category_type, axis=1)

# clean columns: keep only the part after the last dot of each label
nearby_venues.columns = [label.rsplit(".", 1)[-1] for label in nearby_venues.columns]


# collect the venues around every row of df_dt
dt_venues = getNearbyVenues(df_dt['PostalCode'], df_dt['Latitude'], df_dt['Longitude'])


In [17]:
dt_venues

Unnamed: 0,PostalCode,Neighborhood Latitude,Neighborhood Longitude,Venue,Venue Latitude,Venue Longitude,Venue Category
0,M5A,43.65426,-79.360636,Roselle Desserts,43.653447,-79.362017,Bakery
1,M5A,43.65426,-79.360636,Tandem Coffee,43.653559,-79.361809,Coffee Shop
2,M5A,43.65426,-79.360636,Cooper Koo Family YMCA,43.653191,-79.357947,Gym / Fitness Center
3,M5A,43.65426,-79.360636,Body Blitz Spa East,43.654735,-79.359874,Spa
4,M5A,43.65426,-79.360636,Morning Glory Cafe,43.653947,-79.361149,Breakfast Spot
...,...,...,...,...,...,...,...
1301,M4Y,43.66586,-79.383160,Noah's Natural Foods,43.668532,-79.385885,Food & Drink Shop
1302,M4Y,43.66586,-79.383160,Flash,43.664319,-79.380190,Strip Club
1303,M4Y,43.66586,-79.383160,Croissant Tree,43.669575,-79.382331,Coffee Shop
1304,M4Y,43.66586,-79.383160,Currie Hall,43.664801,-79.379565,Dance Studio


In [18]:
dt_venues.groupby('PostalCode').count()

Unnamed: 0_level_0,Neighborhood Latitude,Neighborhood Longitude,Venue,Venue Latitude,Venue Longitude,Venue Category
PostalCode,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1
M4W,4,4,4,4,4,4
M4X,44,44,44,44,44,44
M4Y,83,83,83,83,83,83
M5A,47,47,47,47,47,47
M5B,100,100,100,100,100,100
M5C,100,100,100,100,100,100
M5E,56,56,56,56,56,56
M5G,85,85,85,85,85,85
M5H,100,100,100,100,100,100
M5J,100,100,100,100,100,100


In [19]:
print('There are {} uniques categories in Downtown Toronto.'.format(len(dt_venues['Venue Category'].unique())))

There are 200 uniques categories in Downtown Toronto.


## Analyze venues in Downtown Toronto

In [20]:
# one hot encoding
dt_onehot = pd.get_dummies(dt_venues[['Venue Category']], prefix="", prefix_sep="")

# add neighborhood column back to dataframe
dt_onehot['PostalCode'] = dt_venues['PostalCode'] 

# move neighborhood column to the first column
fixed_columns = [dt_onehot.columns[-1]] + list(dt_onehot.columns[:-1])
dt_onehot = dt_onehot[fixed_columns]

dt_onehot.head()

Unnamed: 0,PostalCode,Afghan Restaurant,Airport,Airport Food Court,Airport Lounge,Airport Service,Airport Terminal,American Restaurant,Antique Shop,Aquarium,...,Toy / Game Store,Trail,Train Station,Vegetarian / Vegan Restaurant,Video Game Store,Vietnamese Restaurant,Wine Bar,Wings Joint,Women's Store,Yoga Studio
0,M5A,0,0,0,0,0,0,0,0,0,...,0,0,0,0,0,0,0,0,0,0
1,M5A,0,0,0,0,0,0,0,0,0,...,0,0,0,0,0,0,0,0,0,0
2,M5A,0,0,0,0,0,0,0,0,0,...,0,0,0,0,0,0,0,0,0,0
3,M5A,0,0,0,0,0,0,0,0,0,...,0,0,0,0,0,0,0,0,0,0
4,M5A,0,0,0,0,0,0,0,0,0,...,0,0,0,0,0,0,0,0,0,0


In [21]:
dt_onehot.shape

(1306, 201)

In [22]:
# Average the one-hot indicator columns within each PostalCode; each value is
# then the share of that postal code's venues belonging to the category.
dt_grouped = dt_onehot.groupby('PostalCode').mean().reset_index()
dt_grouped

Unnamed: 0,PostalCode,Afghan Restaurant,Airport,Airport Food Court,Airport Lounge,Airport Service,Airport Terminal,American Restaurant,Antique Shop,Aquarium,...,Toy / Game Store,Trail,Train Station,Vegetarian / Vegan Restaurant,Video Game Store,Vietnamese Restaurant,Wine Bar,Wings Joint,Women's Store,Yoga Studio
0,M4W,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,...,0.0,0.25,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
1,M4X,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,...,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
2,M4Y,0.012048,0.0,0.0,0.0,0.0,0.0,0.012048,0.0,0.0,...,0.0,0.0,0.0,0.0,0.0,0.012048,0.0,0.012048,0.0,0.012048
3,M5A,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.021277,0.0,...,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.021277
4,M5B,0.0,0.0,0.0,0.0,0.0,0.0,0.01,0.0,0.0,...,0.01,0.0,0.0,0.0,0.01,0.01,0.01,0.0,0.0,0.0
5,M5C,0.0,0.0,0.0,0.0,0.0,0.0,0.03,0.0,0.0,...,0.0,0.0,0.0,0.01,0.0,0.0,0.01,0.0,0.0,0.0
6,M5E,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,...,0.0,0.0,0.0,0.017857,0.0,0.0,0.0,0.0,0.0,0.0
7,M5G,0.0,0.0,0.0,0.0,0.0,0.0,0.011765,0.0,0.0,...,0.0,0.0,0.0,0.011765,0.0,0.0,0.011765,0.0,0.0,0.011765
8,M5H,0.0,0.0,0.0,0.0,0.0,0.0,0.02,0.0,0.0,...,0.0,0.0,0.0,0.02,0.0,0.0,0.01,0.0,0.01,0.0
9,M5J,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.05,...,0.0,0.0,0.01,0.01,0.0,0.0,0.01,0.0,0.0,0.0


## Top 5 in each PostalCode Neighbourhood

In [23]:
num_top_venues = 5

# Print, for every postal code, its most frequent venue categories.
for hood in dt_grouped['PostalCode']:
    print("----"+hood+"----")
    # turn the single matching row into a two-column (venue, freq) table
    freq_table = dt_grouped.loc[dt_grouped['PostalCode'] == hood].T.reset_index()
    freq_table.columns = ['venue', 'freq']
    # drop the first entry (the PostalCode itself), then rank by rounded frequency
    ranked = (
        freq_table.iloc[1:]
        .astype({'freq': float})
        .round({'freq': 2})
        .sort_values('freq', ascending=False)
        .reset_index(drop=True)
    )
    print(ranked.head(num_top_venues))
    print('\n')

----M4W----
               venue  freq
0               Park  0.50
1         Playground  0.25
2              Trail  0.25
3  Afghan Restaurant  0.00
4       Neighborhood  0.00


----M4X----
                venue  freq
0                Café  0.07
1         Coffee Shop  0.07
2         Pizza Place  0.05
3              Bakery  0.05
4  Italian Restaurant  0.05


----M4Y----
                 venue  freq
0          Coffee Shop  0.07
1              Gay Bar  0.05
2     Sushi Restaurant  0.05
3  Japanese Restaurant  0.05
4           Restaurant  0.04


----M5A----
         venue  freq
0  Coffee Shop  0.17
1         Café  0.06
2          Pub  0.06
3       Bakery  0.06
4         Park  0.06


----M5B----
                 venue  freq
0          Coffee Shop  0.09
1       Clothing Store  0.07
2       Cosmetics Shop  0.03
3                 Café  0.03
4  Japanese Restaurant  0.03


----M5C----
                venue  freq
0                Café  0.06
1         Coffee Shop  0.05
2          Restaurant  0.05
3 

## Put the data into a pandas DataFrame

### top 10 most common venues in the neighborhoods of Downtown Toronto

In [24]:
def return_most_common_venues(row, num_top_venues):
    """Return the labels of the largest values in `row`, skipping its first entry.

    The first element of `row` is ignored; the remaining entries are ordered
    from largest to smallest and the index labels of the first
    `num_top_venues` of them are returned as an array.
    """
    ranked = row.iloc[1:].sort_values(ascending=False)
    top_labels = ranked.index.values
    return top_labels[:num_top_venues]

In [25]:
num_top_venues = 10

indicators = ['st', 'nd', 'rd']


def _ordinal_label(rank):
    """Return `rank` followed by its English ordinal suffix (1st, 2nd, 3rd, 4th, 11th, 21st, ...)."""
    last_two = rank % 100
    # 11, 12 and 13 take 'th' even though they end in 1, 2 and 3
    if last_two % 10 in (1, 2, 3) and last_two not in (11, 12, 13):
        suffix = indicators[last_two % 10 - 1]
    else:
        suffix = 'th'
    return '{}{}'.format(rank, suffix)


# create columns according to number of top venues
columns = ['PostalCode'] + [
    '{} Most Common Venue'.format(_ordinal_label(rank))
    for rank in range(1, num_top_venues + 1)
]

# create a new dataframe
neighborhoods_venues_sorted = pd.DataFrame(columns=columns)
neighborhoods_venues_sorted['PostalCode'] = dt_grouped['PostalCode']

# fill every row with the top categories of the matching dt_grouped row
for ind in np.arange(dt_grouped.shape[0]):
    neighborhoods_venues_sorted.iloc[ind, 1:] = return_most_common_venues(dt_grouped.iloc[ind, :], num_top_venues)

neighborhoods_venues_sorted.head()

Unnamed: 0,PostalCode,1st Most Common Venue,2nd Most Common Venue,3rd Most Common Venue,4th Most Common Venue,5th Most Common Venue,6th Most Common Venue,7th Most Common Venue,8th Most Common Venue,9th Most Common Venue,10th Most Common Venue
0,M4W,Park,Playground,Trail,Deli / Bodega,Eastern European Restaurant,Dumpling Restaurant,Donut Shop,Doner Restaurant,Dog Run,Discount Store
1,M4X,Coffee Shop,Café,Italian Restaurant,Bakery,Pizza Place,Pub,Restaurant,Breakfast Spot,Jewelry Store,Sandwich Place
2,M4Y,Coffee Shop,Gay Bar,Sushi Restaurant,Japanese Restaurant,Restaurant,Gastropub,Fast Food Restaurant,Pub,Gym,Dance Studio
3,M5A,Coffee Shop,Park,Pub,Café,Bakery,Theater,Breakfast Spot,Restaurant,Mexican Restaurant,Event Space
4,M5B,Coffee Shop,Clothing Store,Japanese Restaurant,Café,Cosmetics Shop,Electronics Store,Lingerie Store,Italian Restaurant,Middle Eastern Restaurant,Ice Cream Shop


## Clustering Analysis

In [27]:
# set number of clusters
kclusters = 5

# Drop the PostalCode column before clustering. The `columns=` keyword replaces
# the positional axis argument (`drop('PostalCode', 1)`), which newer pandas
# releases no longer accept.
dt_grouped_clustering = dt_grouped.drop(columns='PostalCode')

# run k-means clustering
kmeans = KMeans(n_clusters=kclusters, random_state=0).fit(dt_grouped_clustering)

# check cluster labels generated for each row in the dataframe
kmeans.labels_[0:10] 

array([2, 1, 1, 4, 1, 1, 1, 4, 1, 1], dtype=int32)

In [28]:
# add clustering labels
# DataFrame.insert raises if the column already exists, so overwrite it in
# place when this cell is run a second time.
if 'Cluster Labels' in neighborhoods_venues_sorted.columns:
    neighborhoods_venues_sorted['Cluster Labels'] = kmeans.labels_
else:
    neighborhoods_venues_sorted.insert(0, 'Cluster Labels', kmeans.labels_)

# join the cluster labels and top venues onto df_dt (matched on PostalCode) so
# every row also carries its latitude/longitude
dt_merged = df_dt.join(neighborhoods_venues_sorted.set_index('PostalCode'), on='PostalCode')

dt_merged.head() # check the last columns!

Unnamed: 0,PostalCode,Borough,Neighbourhood,Latitude,Longitude,Cluster Labels,1st Most Common Venue,2nd Most Common Venue,3rd Most Common Venue,4th Most Common Venue,5th Most Common Venue,6th Most Common Venue,7th Most Common Venue,8th Most Common Venue,9th Most Common Venue,10th Most Common Venue
0,M5A,Downtown Toronto,Harbourfront,43.65426,-79.360636,4,Coffee Shop,Park,Pub,Café,Bakery,Theater,Breakfast Spot,Restaurant,Mexican Restaurant,Event Space
1,M7A,Downtown Toronto,Queen's Park,43.662301,-79.389494,4,Coffee Shop,Gym,Park,Yoga Studio,College Auditorium,Sandwich Place,Salad Place,Restaurant,Burger Joint,Portuguese Restaurant
2,M5B,Downtown Toronto,"Ryerson,Garden District,Ryerson,Garden Distric...",43.657162,-79.378937,1,Coffee Shop,Clothing Store,Japanese Restaurant,Café,Cosmetics Shop,Electronics Store,Lingerie Store,Italian Restaurant,Middle Eastern Restaurant,Ice Cream Shop
3,M5C,Downtown Toronto,St. James Town,43.651494,-79.375418,1,Café,Restaurant,Coffee Shop,Italian Restaurant,Cocktail Bar,Hotel,Breakfast Spot,Beer Bar,Bakery,Clothing Store
4,M5E,Downtown Toronto,Berczy Park,43.644771,-79.373306,1,Coffee Shop,Bakery,Beer Bar,Café,Steakhouse,Farmers Market,Cheese Shop,Cocktail Bar,Seafood Restaurant,Basketball Stadium


## Visualize the results

In [30]:
# create map
map_clusters = folium.Map(location=[latitude, longitude], zoom_start=11)

# set color scheme for the clusters: one hex color per cluster, taken at
# evenly spaced positions of the rainbow colormap
x = np.arange(kclusters)
# NOTE(review): only len(ys) (equal to kclusters) is used below; the values
# stored in x and ys are not read anywhere else in this cell.
ys = [i + x + (i*x)**2 for i in range(kclusters)]
colors_array = cm.rainbow(np.linspace(0, 1, len(ys)))
rainbow = [colors.rgb2hex(i) for i in colors_array]

# add markers to the map
# NOTE(review): markers_colors is created here but nothing in this cell appends to it.
markers_colors = []
for lat, lon, poi, cluster in zip(dt_merged['Latitude'], dt_merged['Longitude'], dt_merged['Neighbourhood'], dt_merged['Cluster Labels']):
    label = folium.Popup(str(poi) + ' Cluster ' + str(cluster), parse_html=True)
    # The color lookup is shifted by one (cluster-1), so cluster label 0
    # resolves to rainbow[-1], i.e. the last color in the list.
    folium.CircleMarker(
        [lat, lon],
        radius=5,
        popup=label,
        color=rainbow[cluster-1],
        fill=True,
        fill_color=rainbow[cluster-1],
        fill_opacity=0.7).add_to(map_clusters)
       
# last expression of the cell, so the map is displayed as the cell output
map_clusters

In [40]:
dt_merged.loc[dt_merged['Cluster Labels'] == 0, dt_merged.columns[[2] + list(range(5, dt_merged.shape[1]))]]

Unnamed: 0,Neighbourhood,Cluster Labels,1st Most Common Venue,2nd Most Common Venue,3rd Most Common Venue,4th Most Common Venue,5th Most Common Venue,6th Most Common Venue,7th Most Common Venue,8th Most Common Venue,9th Most Common Venue,10th Most Common Venue
6,Christie,0,Grocery Store,Café,Coffee Shop,Park,Candy Store,Diner,Gas Station,Athletics & Sports,Nightclub,Baby Store


In [41]:
dt_merged.loc[dt_merged['Cluster Labels'] == 1, dt_merged.columns[[2] + list(range(5, dt_merged.shape[1]))]]

Unnamed: 0,Neighbourhood,Cluster Labels,1st Most Common Venue,2nd Most Common Venue,3rd Most Common Venue,4th Most Common Venue,5th Most Common Venue,6th Most Common Venue,7th Most Common Venue,8th Most Common Venue,9th Most Common Venue,10th Most Common Venue
2,"Ryerson,Garden District,Ryerson,Garden Distric...",1,Coffee Shop,Clothing Store,Japanese Restaurant,Café,Cosmetics Shop,Electronics Store,Lingerie Store,Italian Restaurant,Middle Eastern Restaurant,Ice Cream Shop
3,St. James Town,1,Café,Restaurant,Coffee Shop,Italian Restaurant,Cocktail Bar,Hotel,Breakfast Spot,Beer Bar,Bakery,Clothing Store
4,Berczy Park,1,Coffee Shop,Bakery,Beer Bar,Café,Steakhouse,Farmers Market,Cheese Shop,Cocktail Bar,Seafood Restaurant,Basketball Stadium
7,"Adelaide,King,Richmond,Adelaide,King,Richmond,...",1,Coffee Shop,Bar,Steakhouse,Café,Thai Restaurant,Burger Joint,Bakery,Restaurant,Cosmetics Shop,Asian Restaurant
8,"Harbourfront East,Toronto Islands,Union Statio...",1,Coffee Shop,Aquarium,Café,Hotel,Italian Restaurant,Sporting Goods Shop,Scenic Lookout,Fried Chicken Joint,Brewery,Restaurant
9,"Design Exchange,Toronto Dominion Centre,Design...",1,Coffee Shop,Café,Hotel,Restaurant,Italian Restaurant,Bar,Steakhouse,Deli / Bodega,Seafood Restaurant,Gastropub
10,"Commerce Court,Victoria Hotel,Commerce Court,V...",1,Coffee Shop,Café,Hotel,Restaurant,Italian Restaurant,Gym,Deli / Bodega,Gastropub,American Restaurant,Seafood Restaurant
11,"Harbord,University of Toronto,Harbord,Universi...",1,Café,Restaurant,Bookstore,Japanese Restaurant,Bar,Bakery,Chinese Restaurant,Sandwich Place,Pub,Poutine Place
12,"Chinatown,Grange Park,Kensington Market,Chinat...",1,Bar,Café,Dumpling Restaurant,Vietnamese Restaurant,Coffee Shop,Vegetarian / Vegan Restaurant,Mexican Restaurant,Bakery,Chinese Restaurant,Farmers Market
15,Stn A PO Boxes 25 The Esplanade,1,Coffee Shop,Café,Hotel,Restaurant,Seafood Restaurant,Beer Bar,Japanese Restaurant,Italian Restaurant,Lounge,Bakery


In [42]:
dt_merged.loc[dt_merged['Cluster Labels'] == 2, dt_merged.columns[[2] + list(range(5, dt_merged.shape[1]))]]

Unnamed: 0,Neighbourhood,Cluster Labels,1st Most Common Venue,2nd Most Common Venue,3rd Most Common Venue,4th Most Common Venue,5th Most Common Venue,6th Most Common Venue,7th Most Common Venue,8th Most Common Venue,9th Most Common Venue,10th Most Common Venue
14,Rosedale,2,Park,Playground,Trail,Deli / Bodega,Eastern European Restaurant,Dumpling Restaurant,Donut Shop,Doner Restaurant,Dog Run,Discount Store


In [43]:
dt_merged.loc[dt_merged['Cluster Labels'] == 3, dt_merged.columns[[2] + list(range(5, dt_merged.shape[1]))]]

Unnamed: 0,Neighbourhood,Cluster Labels,1st Most Common Venue,2nd Most Common Venue,3rd Most Common Venue,4th Most Common Venue,5th Most Common Venue,6th Most Common Venue,7th Most Common Venue,8th Most Common Venue,9th Most Common Venue,10th Most Common Venue
13,"CN Tower,Bathurst Quay,Island airport,Harbourf...",3,Airport Lounge,Airport Service,Airport Terminal,Harbor / Marina,Sculpture Garden,Boat or Ferry,Rental Car Location,Bar,Boutique,Airport


In [44]:
dt_merged.loc[dt_merged['Cluster Labels'] == 4, dt_merged.columns[[2] + list(range(5, dt_merged.shape[1]))]]

Unnamed: 0,Neighbourhood,Cluster Labels,1st Most Common Venue,2nd Most Common Venue,3rd Most Common Venue,4th Most Common Venue,5th Most Common Venue,6th Most Common Venue,7th Most Common Venue,8th Most Common Venue,9th Most Common Venue,10th Most Common Venue
0,Harbourfront,4,Coffee Shop,Park,Pub,Café,Bakery,Theater,Breakfast Spot,Restaurant,Mexican Restaurant,Event Space
1,Queen's Park,4,Coffee Shop,Gym,Park,Yoga Studio,College Auditorium,Sandwich Place,Salad Place,Restaurant,Burger Joint,Portuguese Restaurant
5,Central Bay Street,4,Coffee Shop,Café,Italian Restaurant,Sandwich Place,Juice Bar,Burger Joint,Ice Cream Shop,Japanese Restaurant,Chinese Restaurant,Department Store
