# In this notebook, I have worked on North York, East York and York data

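#### Only the first 5 neighbourhoods of each borough are used (East York and York have exactly 5; North York has 24 and is truncated to its first 5), so with 5 clusters each cluster contains only one neighbourhood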

In [195]:
import pandas as pd # library for data analysis
import numpy as np


## Scraping using the pandas library

In [196]:
#data=pd.read_html("https://en.wikipedia.org/wiki/List_of_postal_codes_of_Canada:_M")
#datas=data[0]
#data1=pd.DataFrame(datas)
#data1.head()

#### Scraping a web page is not always permitted. Let's check that the request at least succeeds by looking at the status code.

In [197]:
# Download the Wikipedia page of "M" postal codes; `response` is reused by the
# BeautifulSoup parsing cell further down.
import requests # library to handle requests
url="https://en.wikipedia.org/wiki/List_of_postal_codes_of_Canada:_M"
response=requests.get(url)
# A 200 here only means the HTTP request succeeded.
print(response.status_code) 

200


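#### The status code is 200, so the page was retrieved successfully. Note that 200 only indicates a successful HTTP response; whether scraping is permitted is governed by the site's terms of use and robots.txt.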

## Scraping using the BeautifulSoup library

In [198]:
# Parse the first "wikitable" on the downloaded page into the DataFrame `df`.
from io import StringIO  # stdlib; lets pandas read the HTML as a buffer
from bs4 import BeautifulSoup # library to parse HTML documents
soup=BeautifulSoup(response.text,'html.parser')
t=soup.find('table',{'class':"wikitable"})
# soup.find returns None when nothing matches; fail with a clear message
# instead of letting read_html try to parse the string "None".
if t is None:
    raise ValueError('No table with class "wikitable" found in the downloaded page')
# Passing a literal HTML string to read_html is deprecated in recent pandas,
# so wrap it in a StringIO buffer.
t1=pd.read_html(StringIO(str(t)))
df=pd.DataFrame(t1[0])
# Display options are global: they affect every later cell that shows a frame.
pd.set_option('display.max_columns', None)
pd.set_option('display.max_rows', None)
df.head()

Unnamed: 0,Postal Code,Borough,Neighbourhood
0,M1A,Not assigned,Not assigned
1,M2A,Not assigned,Not assigned
2,M3A,North York,Parkwoods
3,M4A,North York,Victoria Village
4,M5A,Downtown Toronto,"Regent Park, Harbourfront"


In [199]:
# Rename the neighbourhood column in place; later cells refer to 'Neighbourhood_Name'.
df.rename(columns={'Neighbourhood':'Neighbourhood_Name'},inplace=True)

In [200]:
# Count rows per borough, including the 'Not assigned' placeholder value.
df['Borough'].value_counts()

Not assigned        77
North York          24
Downtown Toronto    19
Scarborough         17
Etobicoke           12
Central Toronto      9
West Toronto         6
East York            5
York                 5
East Toronto         5
Mississauga          1
Name: Borough, dtype: int64

In [201]:
# Most frequent neighbourhood labels; .head() limits the display to the top five.
df['Neighbourhood_Name'].value_counts().head()

Not assigned                     77
Downsview                         4
Don Mills                         2
High Park, The Junction South     1
The Danforth West, Riverdale      1
Name: Neighbourhood_Name, dtype: int64

In [202]:
# Index labels of the rows whose borough is the 'Not assigned' placeholder.
index_numbers=df[df['Borough']=='Not assigned'].index

In [203]:
# Select the 'Not assigned' rows for inspection.
# index_numbers holds index *labels*, so use label-based .loc; positional
# .iloc only gives the same rows while the index is the default 0..n-1 range.
n=df.loc[index_numbers]
n

Unnamed: 0,Postal Code,Borough,Neighbourhood_Name
0,M1A,Not assigned,Not assigned
1,M2A,Not assigned,Not assigned
7,M8A,Not assigned,Not assigned
10,M2B,Not assigned,Not assigned
15,M7B,Not assigned,Not assigned
16,M8B,Not assigned,Not assigned
19,M2C,Not assigned,Not assigned
24,M7C,Not assigned,Not assigned
25,M8C,Not assigned,Not assigned
28,M2E,Not assigned,Not assigned


In [204]:
# Check which neighbourhood values occur among the 'Not assigned' borough rows.
n['Neighbourhood_Name'].value_counts()

Not assigned    77
Name: Neighbourhood_Name, dtype: int64

In [205]:
# Remove the 'Not assigned' rows in place.
# NOTE: not idempotent - index_numbers refers to labels of the original index,
# so this cell should only be run once per fresh `df`.
df.drop(index_numbers,inplace=True)
df.head()

Unnamed: 0,Postal Code,Borough,Neighbourhood_Name
2,M3A,North York,Parkwoods
3,M4A,North York,Victoria Village
4,M5A,Downtown Toronto,"Regent Park, Harbourfront"
5,M6A,North York,"Lawrence Manor, Lawrence Heights"
6,M7A,Downtown Toronto,"Queen's Park, Ontario Provincial Government"


## DataFrame after cleaning 

In [206]:
# Replace the gapped index left by the drop with consecutive integers 0..len(df)-1.
df.index=np.arange(0,len(df))
df.head()

Unnamed: 0,Postal Code,Borough,Neighbourhood_Name
0,M3A,North York,Parkwoods
1,M4A,North York,Victoria Village
2,M5A,Downtown Toronto,"Regent Park, Harbourfront"
3,M6A,North York,"Lawrence Manor, Lawrence Heights"
4,M7A,Downtown Toronto,"Queen's Park, Ontario Provincial Government"


In [207]:
# (rows, columns) of the cleaned frame.
df.shape

(103, 3)

In [210]:
!pip install geopy # installing geopy



In [212]:
# Geocode the city; `latitude` / `longitude` are later used to centre the map.
from geopy.geocoders import Nominatim # convert an address into latitude and longitude values
address='Toronto'
geolocator=Nominatim(user_agent='t_explorer')
location=geolocator.geocode(address)
# geocode() yields None when the address cannot be resolved; stop with a clear
# error instead of an AttributeError on the attribute access below.
if location is None:
    raise ValueError('Could not geocode address: {}'.format(address))
latitude=location.latitude
longitude = location.longitude
print('The geograpical coordinate of Toronto are {}, {}.'.format(latitude, longitude))

The geograpical coordinate of Toronto are 43.6534817, -79.3839347.


## Extracting data through the link

In [213]:
# Download the postal-code -> latitude/longitude CSV and load it into ll_data.
import io
url="https://cocl.us/Geospatial_data"
geo_response=requests.get(url)
# Fail fast on an HTTP error so an error page is never parsed as CSV.
geo_response.raise_for_status()
# `response` is rebound to the CSV text (it previously held the Wikipedia response).
response=geo_response.text
ll_data=pd.read_csv(io.StringIO(response))
ll_data.head()

Unnamed: 0,Postal Code,Latitude,Longitude
0,M1B,43.806686,-79.194353
1,M1C,43.784535,-79.160497
2,M1E,43.763573,-79.188711
3,M1G,43.770992,-79.216917
4,M1H,43.773136,-79.239476


## Merging df with ll_data on Postal Code to build toronto_df

In [214]:
# Join the cleaned postal-code table with the coordinates on 'Postal Code'.
# pd.merge defaults to an inner join, so rows without a match on either side are dropped.
toronto_df=pd.merge(df,ll_data,on='Postal Code')
toronto_df.head()

Unnamed: 0,Postal Code,Borough,Neighbourhood_Name,Latitude,Longitude
0,M3A,North York,Parkwoods,43.753259,-79.329656
1,M4A,North York,Victoria Village,43.725882,-79.315572
2,M5A,Downtown Toronto,"Regent Park, Harbourfront",43.65426,-79.360636
3,M6A,North York,"Lawrence Manor, Lawrence Heights",43.718518,-79.464763
4,M7A,Downtown Toronto,"Queen's Park, Ontario Provincial Government",43.662301,-79.389494


In [215]:
# Report the number of distinct boroughs and the number of rows in toronto_df
# (each row is counted as one neighbourhood entry).
print("There are {} boroughs and {} neighbourhoods".format(len(toronto_df['Borough'].unique()),toronto_df.shape[0]))

There are 10 boroughs and 103 neighbourhoods


In [217]:
def data(b, limit=5):
    """Return the rows of ``toronto_df`` that belong to one borough.

    Parameters
    ----------
    b : str
        Borough name to match exactly against the 'Borough' column.
    limit : int or None, default 5
        Maximum number of rows to return, counted from the top. The default
        keeps the original behaviour (first five rows only). Pass ``None`` to
        get every row of the borough.

    Returns
    -------
    pandas.DataFrame
        The matching rows with a fresh 0..n-1 index.

    Notes
    -----
    Reads the notebook-level ``toronto_df``. With the default limit a borough
    with more than five rows (North York has 24) is silently truncated.
    """
    # Distinct local name: the original reused `data`, shadowing the function.
    borough_rows = toronto_df[toronto_df['Borough'] == b].reset_index(drop=True)
    if limit is None:
        return borough_rows
    return borough_rows.head(limit)

# Working on North York data

In [218]:
# North York subset; data() returns only the first five rows of the borough.
NY_data=data('North York')
NY_data

Unnamed: 0,Postal Code,Borough,Neighbourhood_Name,Latitude,Longitude
0,M3A,North York,Parkwoods,43.753259,-79.329656
1,M4A,North York,Victoria Village,43.725882,-79.315572
2,M6A,North York,"Lawrence Manor, Lawrence Heights",43.718518,-79.464763
3,M3B,North York,Don Mills,43.745906,-79.352188
4,M6B,North York,Glencairn,43.709577,-79.445073


In [122]:
# Look up the coordinates of the first North York neighbourhood.
neigh=NY_data.loc[0,'Neighbourhood_Name']
# Boolean mask of the rows carrying that neighbourhood name.
n=(NY_data['Neighbourhood_Name']==neigh)
# .values gives arrays; element [0] is used below and in the Foursquare request.
neigh_lat = NY_data.loc[n,'Latitude'].values
neigh_long = NY_data.loc[n,'Longitude'].values
print('The latitude & longitude of {} are : {} & {}'.format(neigh,neigh_lat[0],neigh_long[0]))

The latitude & longitude of Parkwoods are : 43.7532586 & -79.3296565


#### Information to access FourSquare API

In [302]:
# Foursquare API settings.
# Credentials are read from environment variables so real keys never have to
# be written into the notebook; the original placeholders remain the fallback.
import os
CLIENT_ID = os.environ.get('FOURSQUARE_CLIENT_ID', 'ID') # your Foursquare ID
CLIENT_SECRET = os.environ.get('FOURSQUARE_CLIENT_SECRET', 'SECRET') # your Foursquare Secret
VERSION = os.environ.get('FOURSQUARE_API_VERSION', 'VERSION') # Foursquare API version
LIMIT = 100 # A default Foursquare API limit value
RADIUS = 1000 # search radius passed as the `radius` query parameter
print('Your credentails:')
print('CLIENT_ID: ' + CLIENT_ID)
# Mask the secret: cell outputs are saved with the notebook and would leak it.
print('CLIENT_SECRET:' + '*' * len(CLIENT_SECRET))

Your credentails:
CLIENT_ID: ID
CLIENT_SECRET:SECRET


## Getting venues in North York using FourSquare

In [220]:
# Query the Foursquare "explore" endpoint around the first neighbourhood's
# coordinates and keep the decoded JSON payload in `results`.
explore_template = 'https://api.foursquare.com/v2/venues/explore?/&client_id={}&client_secret={}&v={}&ll={},{}&radius={}&limit={}'
url = explore_template.format(
    CLIENT_ID,
    CLIENT_SECRET,
    VERSION,
    neigh_lat[0],
    neigh_long[0],
    RADIUS,
    LIMIT,
)
results = requests.get(url).json()
results

{'meta': {'code': 200, 'requestId': '6010e493f1d69f48c78b13c9'},
 'response': {'suggestedFilters': {'header': 'Tap to show:',
   'filters': [{'name': 'Open now', 'key': 'openNow'}]},
  'headerLocation': 'Parkwoods - Donalda',
  'headerFullLocation': 'Parkwoods - Donalda, Toronto',
  'headerLocationGranularity': 'neighborhood',
  'totalResults': 29,
  'suggestedBounds': {'ne': {'lat': 43.762258609000014,
    'lng': -79.31721997969855},
   'sw': {'lat': 43.74425859099999, 'lng': -79.34209302030145}},
  'groups': [{'type': 'Recommended Places',
    'name': 'recommended',
    'items': [{'reasons': {'count': 0,
       'items': [{'summary': 'This spot is popular',
         'type': 'general',
         'reasonName': 'globalInteractionReason'}]},
      'venue': {'id': '4b8991cbf964a520814232e3',
       'name': "Allwyn's Bakery",
       'location': {'address': '81 Underhill drive',
        'lat': 43.75984035203157,
        'lng': -79.32471879917513,
        'labeledLatLngs': [{'label': 'display'

In [221]:
# Flatten the Foursquare items of the first result group into a DataFrame.
# pandas.io.json.json_normalize is deprecated (it triggers the warning shown
# under this cell); pd.json_normalize is the supported entry point. The bare
# name is kept bound in case other cells call it.
json_normalize = pd.json_normalize # tranform JSON file into a pandas dataframe
Parkwoods_venues_list = results['response']['groups'][0]['items']
Parkwoods_venues = json_normalize(Parkwoods_venues_list)
required_columns = ['venue.name','venue.categories','venue.location.lat','venue.location.lng']
Parkwoods_venues = Parkwoods_venues.loc[:,required_columns]
# Raw category lists, one per venue; consumed by the category-extraction cell.
v = Parkwoods_venues['venue.categories'].values
# NOTE(review): the last label says 'Parkwoods_' while the others say 'PVenue_';
# left unchanged because other cells may select the column by this name.
Parkwoods_venues.columns = ['PVenue_Name','Category','PVenue_Latitude','Parkwoods_Longitude']
Parkwoods_venues.head()


  This is separate from the ipykernel package so we can avoid doing imports until


Unnamed: 0,PVenue_Name,Category,PVenue_Latitude,Parkwoods_Longitude
0,Allwyn's Bakery,"[{'id': '4bf58dd8d48988d144941735', 'name': 'C...",43.75984,-79.324719
1,Tim Hortons,"[{'id': '4bf58dd8d48988d16d941735', 'name': 'C...",43.760668,-79.326368
2,Brookbanks Park,"[{'id': '4bf58dd8d48988d163941735', 'name': 'P...",43.751976,-79.33214
3,Bruno's valu-mart,"[{'id': '4bf58dd8d48988d118951735', 'name': 'G...",43.746143,-79.32463
4,High Street Fish & Chips,"[{'id': '4edd64a0c7ddd24ca188df1a', 'name': 'F...",43.74526,-79.324949


In [222]:
# Extract the name of the first category of every venue.
# A venue with an empty category list gets None instead of raising IndexError.
venue_category_names = [cats[0]['name'] if len(cats) > 0 else None for cats in v]
for c in venue_category_names:
    print(c)
# Assign the whole column at once rather than one .loc write per row.
Parkwoods_venues['PVenue_Category'] = venue_category_names

Caribbean Restaurant
Café
Park
Grocery Store
Fish & Chips Shop
Fast Food Restaurant
Pharmacy
Supermarket
Pharmacy
Pizza Place
Food & Drink Shop
Intersection
Bus Stop
Bus Stop
Park
Train Station
Discount Store
Laundry Service
ATM
Chinese Restaurant
Coffee Shop
Convenience Store
Shopping Mall
Skating Rink
Tennis Court
Park
Cosmetics Shop
Shop & Service
Shopping Mall


In [223]:
# Preview the frame with the newly added 'PVenue_Category' column.
Parkwoods_venues.head()

Unnamed: 0,PVenue_Name,Category,PVenue_Latitude,Parkwoods_Longitude,PVenue_Category
0,Allwyn's Bakery,"[{'id': '4bf58dd8d48988d144941735', 'name': 'C...",43.75984,-79.324719,Caribbean Restaurant
1,Tim Hortons,"[{'id': '4bf58dd8d48988d16d941735', 'name': 'C...",43.760668,-79.326368,Café
2,Brookbanks Park,"[{'id': '4bf58dd8d48988d163941735', 'name': 'P...",43.751976,-79.33214,Park
3,Bruno's valu-mart,"[{'id': '4bf58dd8d48988d118951735', 'name': 'G...",43.746143,-79.32463,Grocery Store
4,High Street Fish & Chips,"[{'id': '4edd64a0c7ddd24ca188df1a', 'name': 'F...",43.74526,-79.324949,Fish & Chips Shop


#### Venues of Parkwoods

In [224]:
# Drop the raw 'Category' list column in place now that the name has been extracted.
# NOTE: re-running this cell raises because the column is already gone.
Parkwoods_venues.drop(['Category'],inplace=True,axis=1)
Parkwoods_venues.head()

Unnamed: 0,PVenue_Name,PVenue_Latitude,Parkwoods_Longitude,PVenue_Category
0,Allwyn's Bakery,43.75984,-79.324719,Caribbean Restaurant
1,Tim Hortons,43.760668,-79.326368,Café
2,Brookbanks Park,43.751976,-79.33214,Park
3,Bruno's valu-mart,43.746143,-79.32463,Grocery Store
4,High Street Fish & Chips,43.74526,-79.324949,Fish & Chips Shop


## Getting venues of all the neighbourhoods in North York

In [225]:
def neigh_explore(borough_data):
    """Fetch Foursquare venues around every neighbourhood of a borough.

    Parameters
    ----------
    borough_data : pandas.DataFrame
        Must provide the columns 'Borough', 'Neighbourhood_Name', 'Latitude'
        and 'Longitude'; one row per neighbourhood.

    Returns
    -------
    pandas.DataFrame
        One row per venue with the columns Neighbourhood_Name,
        Neighbourhood_Lat, Neighbourhood_Lng, Venue_Name, Venue_Category,
        Venue_Lat and Venue_Lng. The frame is empty (but has these columns)
        when no venue is returned.

    Raises
    ------
    requests.HTTPError
        If the API answers with an HTTP error status.

    Notes
    -----
    Uses the notebook-level CLIENT_ID, CLIENT_SECRET, VERSION, RADIUS and
    LIMIT settings and performs one HTTP request per row.
    """
    venue_columns = ['Neighbourhood_Name','Neighbourhood_Lat','Neighbourhood_Lng',
                     'Venue_Name','Venue_Category','Venue_Lat','Venue_Lng']
    if len(borough_data) > 0:
        print('The below dataframe contains venues of the neighbourhoods in {}'.format(borough_data['Borough'].iloc[0]))

    explore_url = 'https://api.foursquare.com/v2/venues/explore'
    venue_rows = []
    # Take each row's own coordinates. The original looked them up through a
    # name mask, so rows sharing a neighbourhood name all reused the
    # coordinates of the first match.
    for borough_neigh, neigh_lat_value, neigh_lng_value in zip(borough_data['Neighbourhood_Name'],
                                                               borough_data['Latitude'],
                                                               borough_data['Longitude']):
        query = {
            'client_id': CLIENT_ID,
            'client_secret': CLIENT_SECRET,
            'v': VERSION,
            'll': '{},{}'.format(neigh_lat_value, neigh_lng_value),
            'radius': RADIUS,
            'limit': LIMIT,
        }
        reply = requests.get(explore_url, params=query)
        # Surface HTTP failures directly instead of a KeyError on the payload.
        reply.raise_for_status()
        groups = reply.json()['response'].get('groups', [])
        items = groups[0]['items'] if groups else []
        for item in items:
            venue = item['venue']
            # Some venues may carry no category; record None rather than crash.
            categories = venue.get('categories') or []
            category_name = categories[0]['name'] if categories else None
            venue_rows.append((borough_neigh, neigh_lat_value, neigh_lng_value,
                               venue['name'],
                               category_name,
                               venue['location']['lat'],
                               venue['location']['lng']))

    # Passing columns= keeps the schema even when venue_rows is empty.
    nearby_venues = pd.DataFrame(venue_rows, columns=venue_columns)
    return(nearby_venues)

In [226]:
# Collect the venues for the North York subset (one API request per row of NY_data).
NORTHYORK_NEIGH_VENUES=neigh_explore(NY_data)
NORTHYORK_NEIGH_VENUES.head()

The below dataframe contains venues of the neighbourhoods in North York


Unnamed: 0,Neighbourhood_Name,Neighbourhood_Lat,Neighbourhood_Lng,Venue_Name,Venue_Category,Venue_Lat,Venue_Lng
0,Parkwoods,43.753259,-79.329656,Allwyn's Bakery,Caribbean Restaurant,43.75984,-79.324719
1,Parkwoods,43.753259,-79.329656,Tim Hortons,Café,43.760668,-79.326368
2,Parkwoods,43.753259,-79.329656,Brookbanks Park,Park,43.751976,-79.33214
3,Parkwoods,43.753259,-79.329656,Bruno's valu-mart,Grocery Store,43.746143,-79.32463
4,Parkwoods,43.753259,-79.329656,High Street Fish & Chips,Fish & Chips Shop,43.74526,-79.324949


## One Hot encoding Venue Category

In [227]:
def onehot(neigh_venues_df):
    """One-hot encode 'Venue_Category', keeping the neighbourhood name first.

    Parameters
    ----------
    neigh_venues_df : pandas.DataFrame
        Needs the columns 'Venue_Category' and 'Neighbourhood_Name'.

    Returns
    -------
    pandas.DataFrame
        'Neighbourhood_Name' followed by one indicator column per category.
    """
    encoded = pd.get_dummies(neigh_venues_df[['Venue_Category']], prefix="", prefix_sep="")
    encoded['Neighbourhood_Name'] = neigh_venues_df['Neighbourhood_Name']
    # Rotate the last column to the front of the column order.
    ordered = list(encoded.columns)
    ordered.insert(0, ordered.pop())
    return encoded[ordered]
    

In [228]:
# One indicator column per venue category, one row per venue.
NORTHYORK_NEIGH_VENUES_ONEHOT = onehot(NORTHYORK_NEIGH_VENUES)
NORTHYORK_NEIGH_VENUES_ONEHOT.head()


Unnamed: 0,Neighbourhood_Name,ATM,Accessories Store,Asian Restaurant,Athletics & Sports,Bakery,Bank,Bar,Boutique,Bowling Alley,Breakfast Spot,Burger Joint,Bus Stop,Cafeteria,Café,Caribbean Restaurant,Cheese Shop,Chinese Restaurant,Clothing Store,Coffee Shop,Convenience Store,Cosmetics Shop,Dessert Shop,Diner,Discount Store,Electronics Store,Event Space,Fast Food Restaurant,Fireworks Store,Fish & Chips Shop,Flower Shop,Food & Drink Shop,Fried Chicken Joint,Furniture / Home Store,Gas Station,Golf Course,Greek Restaurant,Grocery Store,Gym,Gym / Fitness Center,Hockey Arena,Ice Cream Shop,Intersection,Italian Restaurant,Japanese Restaurant,Korean Restaurant,Latin American Restaurant,Laundry Service,Liquor Store,Lounge,Mediterranean Restaurant,Men's Store,Miscellaneous Shop,Mobile Phone Shop,Paper / Office Supplies Store,Park,Pet Store,Pharmacy,Photography Lab,Pizza Place,Playground,Portuguese Restaurant,Pub,Restaurant,Salad Place,Sandwich Place,Seafood Restaurant,Shop & Service,Shopping Mall,Skating Rink,Sporting Goods Shop,Supermarket,Sushi Restaurant,Tennis Court,Thai Restaurant,Train Station,Video Game Store,Vietnamese Restaurant,Women's Store
0,Parkwoods,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0
1,Parkwoods,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0
2,Parkwoods,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0
3,Parkwoods,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0
4,Parkwoods,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0


## Grouping on Neighbourhoods

In [229]:
def group(neigh_onehot_df):
    """Average the one-hot columns per neighbourhood.

    Returns a frame with one row per 'Neighbourhood_Name' whose remaining
    columns hold the mean of each indicator column for that neighbourhood.
    """
    per_neighbourhood = neigh_onehot_df.groupby('Neighbourhood_Name')
    averaged = per_neighbourhood.mean()
    return averaged.reset_index()

In [230]:
# Mean of each category indicator per neighbourhood, i.e. the category frequencies.
NORTHYORK_NEIGH_VENUES_GROUP = group(NORTHYORK_NEIGH_VENUES_ONEHOT)
NORTHYORK_NEIGH_VENUES_GROUP.head()

Unnamed: 0,Neighbourhood_Name,ATM,Accessories Store,Asian Restaurant,Athletics & Sports,Bakery,Bank,Bar,Boutique,Bowling Alley,Breakfast Spot,Burger Joint,Bus Stop,Cafeteria,Café,Caribbean Restaurant,Cheese Shop,Chinese Restaurant,Clothing Store,Coffee Shop,Convenience Store,Cosmetics Shop,Dessert Shop,Diner,Discount Store,Electronics Store,Event Space,Fast Food Restaurant,Fireworks Store,Fish & Chips Shop,Flower Shop,Food & Drink Shop,Fried Chicken Joint,Furniture / Home Store,Gas Station,Golf Course,Greek Restaurant,Grocery Store,Gym,Gym / Fitness Center,Hockey Arena,Ice Cream Shop,Intersection,Italian Restaurant,Japanese Restaurant,Korean Restaurant,Latin American Restaurant,Laundry Service,Liquor Store,Lounge,Mediterranean Restaurant,Men's Store,Miscellaneous Shop,Mobile Phone Shop,Paper / Office Supplies Store,Park,Pet Store,Pharmacy,Photography Lab,Pizza Place,Playground,Portuguese Restaurant,Pub,Restaurant,Salad Place,Sandwich Place,Seafood Restaurant,Shop & Service,Shopping Mall,Skating Rink,Sporting Goods Shop,Supermarket,Sushi Restaurant,Tennis Court,Thai Restaurant,Train Station,Video Game Store,Vietnamese Restaurant,Women's Store
0,Don Mills,0.0,0.0,0.033333,0.0,0.0,0.033333,0.033333,0.0,0.0,0.033333,0.066667,0.0,0.033333,0.033333,0.033333,0.0,0.0,0.0,0.133333,0.0,0.0,0.0,0.033333,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.033333,0.0,0.033333,0.0,0.0,0.0,0.0,0.0,0.1,0.0,0.0,0.0,0.033333,0.0,0.0,0.0,0.0,0.033333,0.033333,0.0,0.0,0.0,0.0,0.066667,0.0,0.0,0.0,0.033333,0.033333,0.033333,0.0,0.0,0.0,0.0,0.0,0.033333,0.0,0.0,0.033333,0.0,0.033333,0.0,0.0
1,Glencairn,0.0,0.0,0.0,0.0,0.032258,0.032258,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.064516,0.032258,0.0,0.0,0.0,0.0,0.032258,0.0,0.096774,0.0,0.0,0.032258,0.0,0.0,0.0,0.064516,0.0,0.0,0.129032,0.032258,0.0,0.0,0.032258,0.0,0.032258,0.032258,0.0,0.032258,0.0,0.0,0.0,0.032258,0.0,0.0,0.0,0.0,0.064516,0.032258,0.032258,0.032258,0.064516,0.032258,0.0,0.032258,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
2,"Lawrence Manor, Lawrence Heights",0.0,0.019608,0.0,0.039216,0.0,0.019608,0.0,0.019608,0.019608,0.0,0.0,0.0,0.0,0.0,0.0,0.019608,0.0,0.098039,0.058824,0.0,0.0,0.039216,0.0,0.019608,0.0,0.019608,0.058824,0.019608,0.0,0.0,0.0,0.039216,0.058824,0.0,0.0,0.019608,0.019608,0.0,0.019608,0.0,0.0,0.0,0.019608,0.0,0.019608,0.0,0.0,0.0,0.0,0.0,0.019608,0.019608,0.0,0.019608,0.019608,0.019608,0.0,0.0,0.0,0.019608,0.0,0.0,0.058824,0.0,0.019608,0.019608,0.0,0.0,0.0,0.0,0.0,0.039216,0.0,0.0,0.0,0.0,0.058824,0.039216
3,Parkwoods,0.034483,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.068966,0.0,0.034483,0.034483,0.0,0.034483,0.0,0.034483,0.034483,0.034483,0.0,0.0,0.034483,0.0,0.0,0.034483,0.0,0.034483,0.0,0.034483,0.0,0.0,0.0,0.0,0.0,0.034483,0.0,0.0,0.0,0.0,0.034483,0.0,0.0,0.0,0.0,0.034483,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.103448,0.0,0.068966,0.0,0.034483,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.034483,0.068966,0.034483,0.0,0.034483,0.0,0.034483,0.0,0.034483,0.0,0.0,0.0
4,Victoria Village,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.2,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.1,0.0,0.0,0.0,0.1,0.1,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.1,0.0,0.1,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.1,0.0,0.1,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.1,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0


In [265]:
def display_top_venues(group_df, top_venues=5):
    """Print the most frequent venue categories of every neighbourhood.

    Parameters
    ----------
    group_df : pandas.DataFrame
        'Neighbourhood_Name' must be the first column; every other column is
        a numeric frequency for one venue category.
    top_venues : int, default 5
        Number of categories printed per neighbourhood (previously a
        hard-coded constant inside the function).

    Returns
    -------
    None
        The function only prints; it does not return the tables.
    """
    for name in group_df['Neighbourhood_Name']:
        print("----"+name+"----")
        # Transpose the neighbourhood's row so categories become rows.
        temp = group_df[group_df['Neighbourhood_Name'] == name].T.reset_index()
        temp.columns = ['venue','freq']
        # Skip the first row, which holds the neighbourhood name itself.
        temp = temp.iloc[1:].copy()
        temp['freq'] = temp['freq'].astype(float)
        temp = temp.round({'freq': 2})
        print(temp.sort_values('freq', ascending=False).reset_index(drop=True).head(top_venues))
        print('\n')
    return

    

In [266]:
# display_top_venues only prints and returns None, so this variable is bound to None.
NORTHYORK_NEIGH_TOP_VENUES = display_top_venues(NORTHYORK_NEIGH_VENUES_GROUP)

----Don Mills----
                 venue  freq
0          Coffee Shop  0.13
1  Japanese Restaurant  0.10
2          Pizza Place  0.07
3         Burger Joint  0.07
4                Diner  0.03


----Glencairn----
                  venue  freq
0         Grocery Store  0.13
1  Fast Food Restaurant  0.10
2                  Park  0.06
3           Pizza Place  0.06
4           Gas Station  0.06


----Lawrence Manor, Lawrence Heights----
                   venue  freq
0         Clothing Store  0.10
1   Fast Food Restaurant  0.06
2  Vietnamese Restaurant  0.06
3             Restaurant  0.06
4            Coffee Shop  0.06


----Parkwoods----
           venue  freq
0           Park  0.10
1       Pharmacy  0.07
2       Bus Stop  0.07
3  Shopping Mall  0.07
4            ATM  0.03


----Victoria Village----
                   venue  freq
0            Coffee Shop   0.2
1           Hockey Arena   0.1
2    Sporting Goods Shop   0.1
3  Portuguese Restaurant   0.1
4            Men's Store   0.1




In [234]:
def top_venues_df(row,top_venues):
    """Return the labels of the ``top_venues`` largest entries of ``row``.

    The first element of ``row`` (the neighbourhood name) is ignored; the
    remaining values are ranked in descending order and the index labels of
    the leading entries are returned as an array.
    """
    ranked = row.iloc[1:].sort_values(ascending=False)
    return ranked.index.values[:top_venues]

In [235]:
def df(group_df, top_venues=10):
    """Build a table of the most common venue categories per neighbourhood.

    Parameters
    ----------
    group_df : pandas.DataFrame
        'Neighbourhood_Name' first, then one frequency column per category.
    top_venues : int, default 10
        Number of ranked category columns to produce (previously a
        hard-coded constant inside the function).

    Returns
    -------
    pandas.DataFrame
        'Neighbourhood_Name' plus the columns '1th Most Common Venue' ...
        '<top_venues>th Most Common Venue'. The 'th' suffix is kept for every
        rank so existing column names stay unchanged.

    Notes
    -----
    Defining this function rebinds the notebook-level name ``df``, which
    earlier cells use for the postal-code DataFrame.
    """
    columns = ['Neighbourhood_Name']
    columns.extend('{}th Most Common Venue'.format(rank) for rank in range(1, top_venues + 1))
    neigh_sorted = pd.DataFrame(columns=columns)
    neigh_sorted['Neighbourhood_Name'] = group_df['Neighbourhood_Name']
    for r in range(group_df.shape[0]):
        ranked = list(top_venues_df(group_df.iloc[r,:], top_venues))
        # Fewer categories than requested ranks: pad with NaN so the row
        # assignment does not fail on a length mismatch.
        ranked.extend([np.nan] * (top_venues - len(ranked)))
        neigh_sorted.iloc[r,1:] = ranked
    return neigh_sorted

#### DataFrame of top 10 venues in various neighbourhoods

In [236]:
# Rank the venue categories of each North York neighbourhood (top 10 per row).
NORTHYORK_NEIGH_VENUES_SORTED = df(NORTHYORK_NEIGH_VENUES_GROUP)
NORTHYORK_NEIGH_VENUES_SORTED.head()

Unnamed: 0,Neighbourhood_Name,1th Most Common Venue,2th Most Common Venue,3th Most Common Venue,4th Most Common Venue,5th Most Common Venue,6th Most Common Venue,7th Most Common Venue,8th Most Common Venue,9th Most Common Venue,10th Most Common Venue
0,Don Mills,Coffee Shop,Japanese Restaurant,Pizza Place,Burger Joint,Caribbean Restaurant,Sandwich Place,Diner,Mobile Phone Shop,Paper / Office Supplies Store,Café
1,Glencairn,Grocery Store,Fast Food Restaurant,Park,Coffee Shop,Pizza Place,Gas Station,Gym,Ice Cream Shop,Electronics Store,Italian Restaurant
2,"Lawrence Manor, Lawrence Heights",Clothing Store,Vietnamese Restaurant,Coffee Shop,Furniture / Home Store,Fast Food Restaurant,Restaurant,Women's Store,Athletics & Sports,Sushi Restaurant,Dessert Shop
3,Parkwoods,Park,Bus Stop,Pharmacy,Shopping Mall,ATM,Caribbean Restaurant,Chinese Restaurant,Coffee Shop,Convenience Store,Cosmetics Shop
4,Victoria Village,Coffee Shop,Gym / Fitness Center,Sporting Goods Shop,Hockey Arena,Lounge,Men's Store,Pizza Place,Portuguese Restaurant,Golf Course,Boutique


## Clustering and generating labels

In [237]:
def cluster(group_df,k):
    """Cluster neighbourhoods on their category frequencies with k-means.

    Parameters
    ----------
    group_df : pandas.DataFrame
        Contains 'Neighbourhood_Name' plus numeric frequency columns.
    k : int
        Number of clusters requested.

    Returns
    -------
    The ``labels_`` of the fitted model, one label per row of ``group_df``.
    """
    # NOTE(review): KMeans is not imported in any cell visible here;
    # presumably `from sklearn.cluster import KMeans` ran earlier - confirm.
    # Use the columns= keyword: the positional axis argument of
    # DataFrame.drop is no longer accepted by pandas 2.x.
    neigh_clustering = group_df.drop(columns='Neighbourhood_Name')
    # The fitted model stays local; only its labels are returned.
    kmeans = KMeans(n_clusters=k, random_state=0).fit(neigh_clustering)
    print("Generated labels")
    return kmeans.labels_

In [238]:
# Fit k-means with 5 clusters; the returned labels are displayed but not
# assigned to a variable in this cell.
cluster(NORTHYORK_NEIGH_VENUES_GROUP,5)

Generated labels


array([2, 1, 3, 4, 0])

## Adding the cluster labels and top venues to the borough dataframe (which holds the latitude and longitude columns)

In [239]:
def merge(borough_df,neigh_sorted,cluster_labels=None):
    """Attach cluster labels and ranked venues to the borough rows.

    Parameters
    ----------
    borough_df : pandas.DataFrame
        Borough rows containing a 'Neighbourhood_Name' column.
    neigh_sorted : pandas.DataFrame
        Ranked-venue table with a 'Neighbourhood_Name' column. It is not
        modified.
    cluster_labels : sequence, optional
        One label per row of ``neigh_sorted``, in the same order. When
        omitted, the labels are read from a notebook-level ``kmeans`` object,
        as the original code did.

    Returns
    -------
    pandas.DataFrame
        ``borough_df`` joined with 'Cluster_Labels' and the ranked-venue
        columns on 'Neighbourhood_Name'.
    """
    if cluster_labels is None:
        # Backward-compatible fallback: depends on a global `kmeans` that
        # must already exist in the notebook namespace.
        cluster_labels = kmeans.labels_
    # drop() returns a new frame, so the caller's table is left untouched and
    # re-running the cell no longer fails on an already present label column.
    labelled = neigh_sorted.drop(columns='Cluster_Labels', errors='ignore')
    labelled.insert(0,'Cluster_Labels',cluster_labels)
    neigh_merged = borough_df.join(labelled.set_index('Neighbourhood_Name'), on='Neighbourhood_Name')
    return neigh_merged

In [240]:
# Join labels and ranked venues onto the North York rows.
# merge() reads `kmeans.labels_` from the notebook namespace, so a fitted
# `kmeans` object must exist there before this cell runs.
NORTHYORK_NEIGH_MERGED = merge(NY_data,NORTHYORK_NEIGH_VENUES_SORTED)
NORTHYORK_NEIGH_MERGED.head()

Unnamed: 0,Postal Code,Borough,Neighbourhood_Name,Latitude,Longitude,Cluster_Labels,1th Most Common Venue,2th Most Common Venue,3th Most Common Venue,4th Most Common Venue,5th Most Common Venue,6th Most Common Venue,7th Most Common Venue,8th Most Common Venue,9th Most Common Venue,10th Most Common Venue
0,M3A,North York,Parkwoods,43.753259,-79.329656,4,Park,Bus Stop,Pharmacy,Shopping Mall,ATM,Caribbean Restaurant,Chinese Restaurant,Coffee Shop,Convenience Store,Cosmetics Shop
1,M4A,North York,Victoria Village,43.725882,-79.315572,0,Coffee Shop,Gym / Fitness Center,Sporting Goods Shop,Hockey Arena,Lounge,Men's Store,Pizza Place,Portuguese Restaurant,Golf Course,Boutique
2,M6A,North York,"Lawrence Manor, Lawrence Heights",43.718518,-79.464763,3,Clothing Store,Vietnamese Restaurant,Coffee Shop,Furniture / Home Store,Fast Food Restaurant,Restaurant,Women's Store,Athletics & Sports,Sushi Restaurant,Dessert Shop
3,M3B,North York,Don Mills,43.745906,-79.352188,2,Coffee Shop,Japanese Restaurant,Pizza Place,Burger Joint,Caribbean Restaurant,Sandwich Place,Diner,Mobile Phone Shop,Paper / Office Supplies Store,Café
4,M6B,North York,Glencairn,43.709577,-79.445073,1,Grocery Store,Fast Food Restaurant,Park,Coffee Shop,Pizza Place,Gas Station,Gym,Ice Cream Shop,Electronics Store,Italian Restaurant


In [241]:
#!pip install folium # to install folium 
import folium # map rendering library
import matplotlib.cm as cm
import matplotlib.colors as colors

In [242]:
def map(neigh_merge,k,center=None):
    """Draw the neighbourhoods of one borough on a folium map, coloured by cluster.

    Note: this function shadows Python's built-in ``map``; the name is kept
    because the notebook's cells call it.

    Parameters
    ----------
    neigh_merge : pandas.DataFrame
        Needs 'Latitude', 'Longitude', 'Neighbourhood_Name' and
        'Cluster_Labels' columns.
    k : int
        Number of clusters; one palette colour is generated per cluster id
        0..k-1.
    center : sequence of two floats, optional
        [lat, lon] to centre the map on. When omitted, the notebook-level
        globals ``latitude`` and ``longitude`` are used, as before.

    Returns
    -------
    folium.Map
        Map with one circle marker per row of ``neigh_merge``.
    """
    if center is None:
        # Backward-compatible fallback to the globals set in an earlier cell.
        center = [latitude, longitude]
    map_clusters = folium.Map(location=center, zoom_start=11)

    # One evenly spaced rainbow colour per cluster id.
    palette = [colors.rgb2hex(rgba) for rgba in cm.rainbow(np.linspace(0, 1, k))]
    unlabelled_colour = '#808080'

    # add markers to the map
    for lat, lon, poi, cluster in zip(neigh_merge['Latitude'], neigh_merge['Longitude'], neigh_merge['Neighbourhood_Name'],neigh_merge['Cluster_Labels']):
        if pd.isna(cluster):
            # A neighbourhood with no match in the join has no label; draw it
            # in grey instead of failing on the palette lookup.
            cluster_text, marker_colour = str(cluster), unlabelled_colour
        else:
            # The label column becomes float as soon as one row is unlabelled,
            # and a float cannot index a list, hence the cast. Labels are
            # 0-based, so they index the palette directly (the former
            # `cluster-1` made cluster 0 wrap round to the last colour).
            cluster_id = int(cluster)
            cluster_text, marker_colour = str(cluster_id), palette[cluster_id]

        label = folium.Popup(str(poi) + ' Cluster ' + cluster_text, parse_html=True)
        folium.CircleMarker(
          [lat, lon],
          radius=5,
          popup=label,
          color=marker_colour,
          fill=True,
          fill_color=marker_colour,
          fill_opacity=0.7).add_to(map_clusters)

    return map_clusters

In [243]:
map(NORTHYORK_NEIGH_MERGED,5)

## Examining Clusters

In [244]:
# Rows of cluster 0. Column 2 is Neighbourhood_Name and columns 6 onward are the ranked
# venue columns, so Postal Code, Borough, the coordinates and Cluster_Labels are left out.
NORTHYORK_NEIGH_MERGED.loc[NORTHYORK_NEIGH_MERGED['Cluster_Labels'] == 0, NORTHYORK_NEIGH_MERGED.columns[[2] + list(range(6, NORTHYORK_NEIGH_MERGED.shape[1]))]]

Unnamed: 0,Neighbourhood_Name,1th Most Common Venue,2th Most Common Venue,3th Most Common Venue,4th Most Common Venue,5th Most Common Venue,6th Most Common Venue,7th Most Common Venue,8th Most Common Venue,9th Most Common Venue,10th Most Common Venue
1,Victoria Village,Coffee Shop,Gym / Fitness Center,Sporting Goods Shop,Hockey Arena,Lounge,Men's Store,Pizza Place,Portuguese Restaurant,Golf Course,Boutique


In [245]:
NORTHYORK_NEIGH_MERGED.loc[NORTHYORK_NEIGH_MERGED['Cluster_Labels'] == 1, NORTHYORK_NEIGH_MERGED.columns[[2] + list(range(6, NORTHYORK_NEIGH_MERGED.shape[1]))]]

Unnamed: 0,Neighbourhood_Name,1th Most Common Venue,2th Most Common Venue,3th Most Common Venue,4th Most Common Venue,5th Most Common Venue,6th Most Common Venue,7th Most Common Venue,8th Most Common Venue,9th Most Common Venue,10th Most Common Venue
4,Glencairn,Grocery Store,Fast Food Restaurant,Park,Coffee Shop,Pizza Place,Gas Station,Gym,Ice Cream Shop,Electronics Store,Italian Restaurant


In [246]:
NORTHYORK_NEIGH_MERGED.loc[NORTHYORK_NEIGH_MERGED['Cluster_Labels'] == 2, NORTHYORK_NEIGH_MERGED.columns[[2] + list(range(6, NORTHYORK_NEIGH_MERGED.shape[1]))]]

Unnamed: 0,Neighbourhood_Name,1th Most Common Venue,2th Most Common Venue,3th Most Common Venue,4th Most Common Venue,5th Most Common Venue,6th Most Common Venue,7th Most Common Venue,8th Most Common Venue,9th Most Common Venue,10th Most Common Venue
3,Don Mills,Coffee Shop,Japanese Restaurant,Pizza Place,Burger Joint,Caribbean Restaurant,Sandwich Place,Diner,Mobile Phone Shop,Paper / Office Supplies Store,Café


In [247]:
NORTHYORK_NEIGH_MERGED.loc[NORTHYORK_NEIGH_MERGED['Cluster_Labels'] == 3, NORTHYORK_NEIGH_MERGED.columns[[2] + list(range(6, NORTHYORK_NEIGH_MERGED.shape[1]))]]

Unnamed: 0,Neighbourhood_Name,1th Most Common Venue,2th Most Common Venue,3th Most Common Venue,4th Most Common Venue,5th Most Common Venue,6th Most Common Venue,7th Most Common Venue,8th Most Common Venue,9th Most Common Venue,10th Most Common Venue
2,"Lawrence Manor, Lawrence Heights",Clothing Store,Vietnamese Restaurant,Coffee Shop,Furniture / Home Store,Fast Food Restaurant,Restaurant,Women's Store,Athletics & Sports,Sushi Restaurant,Dessert Shop


In [248]:
NORTHYORK_NEIGH_MERGED.loc[NORTHYORK_NEIGH_MERGED['Cluster_Labels'] == 4, NORTHYORK_NEIGH_MERGED.columns[[2] + list(range(6, NORTHYORK_NEIGH_MERGED.shape[1]))]]

Unnamed: 0,Neighbourhood_Name,1th Most Common Venue,2th Most Common Venue,3th Most Common Venue,4th Most Common Venue,5th Most Common Venue,6th Most Common Venue,7th Most Common Venue,8th Most Common Venue,9th Most Common Venue,10th Most Common Venue
0,Parkwoods,Park,Bus Stop,Pharmacy,Shopping Mall,ATM,Caribbean Restaurant,Chinese Restaurant,Coffee Shop,Convenience Store,Cosmetics Shop


In [250]:
toronto_df['Borough'].unique()

array(['North York', 'Downtown Toronto', 'Etobicoke', 'Scarborough',
       'East York', 'York', 'East Toronto', 'West Toronto',
       'Central Toronto', 'Mississauga'], dtype=object)

# Working on East York

In [251]:
EY_data=data('East York')
EY_data

Unnamed: 0,Postal Code,Borough,Neighbourhood_Name,Latitude,Longitude
0,M4B,East York,"Parkview Hill, Woodbine Gardens",43.706397,-79.309937
1,M4C,East York,Woodbine Heights,43.695344,-79.318389
2,M4G,East York,Leaside,43.70906,-79.363452
3,M4H,East York,Thorncliffe Park,43.705369,-79.349372
4,M4J,East York,"East Toronto, Broadview North (Old East York)",43.685347,-79.338106


In [252]:
EASTYORK_NEIGH_VENUES=neigh_explore(EY_data)
EASTYORK_NEIGH_VENUES.head()

The below dataframe contains venues of the neighbourhoods in East York


Unnamed: 0,Neighbourhood_Name,Neighbourhood_Lat,Neighbourhood_Lng,Venue_Name,Venue_Category,Venue_Lat,Venue_Lng
0,"Parkview Hill, Woodbine Gardens",43.706397,-79.309937,Jawny Bakers,Gastropub,43.705783,-79.312913
1,"Parkview Hill, Woodbine Gardens",43.706397,-79.309937,Toronto Climbing Academy,Rock Climbing Spot,43.709362,-79.315006
2,"Parkview Hill, Woodbine Gardens",43.706397,-79.309937,East York Gymnastics,Gym / Fitness Center,43.710654,-79.309279
3,"Parkview Hill, Woodbine Gardens",43.706397,-79.309937,Muddy York Brewing Co.,Brewery,43.712362,-79.312019
4,"Parkview Hill, Woodbine Gardens",43.706397,-79.309937,Peek Freans Cookie Outlet,Bakery,43.71326,-79.308063


In [253]:
EASTYORK_NEIGH_VENUES_ONEHOT = onehot(EASTYORK_NEIGH_VENUES)
EASTYORK_NEIGH_VENUES_ONEHOT.head()

Unnamed: 0,Neighbourhood_Name,Afghan Restaurant,American Restaurant,Asian Restaurant,Athletics & Sports,Auto Dealership,BBQ Joint,Bagel Shop,Bakery,Bank,Bar,Beer Bar,Beer Store,Bike Shop,Bookstore,Breakfast Spot,Brewery,Bridge,Burger Joint,Burrito Place,Bus Line,Bus Station,Bus Stop,Business Service,Café,Cheese Shop,Chinese Restaurant,Coffee Shop,Construction & Landscaping,Convenience Store,Curling Ice,Department Store,Dessert Shop,Dim Sum Restaurant,Diner,Discount Store,Donut Shop,Electronics Store,Ethiopian Restaurant,Farmers Market,Fast Food Restaurant,Fish & Chips Shop,Flea Market,Flower Shop,Frame Store,Fried Chicken Joint,Furniture / Home Store,Gas Station,Gastropub,Gourmet Shop,Greek Restaurant,Grocery Store,Gym,Gym / Fitness Center,Hostel,Hotel,Ice Cream Shop,Indian Restaurant,Intersection,Italian Restaurant,Japanese Restaurant,Karaoke Bar,Liquor Store,Metro Station,Mexican Restaurant,Middle Eastern Restaurant,Mobile Phone Shop,Nail Salon,Paper / Office Supplies Store,Park,Pastry Shop,Performing Arts Venue,Pet Store,Pharmacy,Pizza Place,Pool,Pub,Ramen Restaurant,Rental Car Location,Restaurant,Rock Climbing Spot,Sandwich Place,Shopping Mall,Skating Rink,Smoothie Shop,Soccer Stadium,Souvlaki Shop,Spa,Sporting Goods Shop,Sports Bar,Supermarket,Sushi Restaurant,Thai Restaurant,Turkish Restaurant,Vietnamese Restaurant,Warehouse Store,Wine Shop,Yoga Studio
0,"Parkview Hill, Woodbine Gardens",0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0
1,"Parkview Hill, Woodbine Gardens",0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0
2,"Parkview Hill, Woodbine Gardens",0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0
3,"Parkview Hill, Woodbine Gardens",0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0
4,"Parkview Hill, Woodbine Gardens",0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0


In [269]:
EASTYORK_NEIGH_VENUES_GROUP = group(EASTYORK_NEIGH_VENUES_ONEHOT)
EASTYORK_NEIGH_VENUES_GROUP.head()

Unnamed: 0,Neighbourhood_Name,Afghan Restaurant,American Restaurant,Asian Restaurant,Athletics & Sports,Auto Dealership,BBQ Joint,Bagel Shop,Bakery,Bank,Bar,Beer Bar,Beer Store,Bike Shop,Bookstore,Breakfast Spot,Brewery,Bridge,Burger Joint,Burrito Place,Bus Line,Bus Station,Bus Stop,Business Service,Café,Cheese Shop,Chinese Restaurant,Coffee Shop,Construction & Landscaping,Convenience Store,Curling Ice,Department Store,Dessert Shop,Dim Sum Restaurant,Diner,Discount Store,Donut Shop,Electronics Store,Ethiopian Restaurant,Farmers Market,Fast Food Restaurant,Fish & Chips Shop,Flea Market,Flower Shop,Frame Store,Fried Chicken Joint,Furniture / Home Store,Gas Station,Gastropub,Gourmet Shop,Greek Restaurant,Grocery Store,Gym,Gym / Fitness Center,Hostel,Hotel,Ice Cream Shop,Indian Restaurant,Intersection,Italian Restaurant,Japanese Restaurant,Karaoke Bar,Liquor Store,Metro Station,Mexican Restaurant,Middle Eastern Restaurant,Mobile Phone Shop,Nail Salon,Paper / Office Supplies Store,Park,Pastry Shop,Performing Arts Venue,Pet Store,Pharmacy,Pizza Place,Pool,Pub,Ramen Restaurant,Rental Car Location,Restaurant,Rock Climbing Spot,Sandwich Place,Shopping Mall,Skating Rink,Smoothie Shop,Soccer Stadium,Souvlaki Shop,Spa,Sporting Goods Shop,Sports Bar,Supermarket,Sushi Restaurant,Thai Restaurant,Turkish Restaurant,Vietnamese Restaurant,Warehouse Store,Wine Shop,Yoga Studio
0,"East Toronto, Broadview North (Old East York)",0.0,0.021053,0.010526,0.0,0.0,0.010526,0.0,0.021053,0.021053,0.010526,0.031579,0.010526,0.0,0.010526,0.021053,0.0,0.0,0.010526,0.010526,0.010526,0.010526,0.0,0.010526,0.073684,0.010526,0.010526,0.073684,0.0,0.021053,0.0,0.0,0.010526,0.010526,0.010526,0.010526,0.010526,0.0,0.031579,0.010526,0.031579,0.010526,0.0,0.010526,0.010526,0.0,0.0,0.0,0.021053,0.010526,0.063158,0.010526,0.010526,0.0,0.010526,0.0,0.0,0.010526,0.0,0.010526,0.0,0.010526,0.0,0.010526,0.010526,0.010526,0.0,0.010526,0.0,0.010526,0.010526,0.010526,0.010526,0.021053,0.031579,0.0,0.010526,0.010526,0.010526,0.010526,0.0,0.021053,0.0,0.0,0.0,0.0,0.010526,0.010526,0.0,0.010526,0.0,0.0,0.010526,0.010526,0.010526,0.0,0.010526,0.0
1,Leaside,0.0,0.0,0.0,0.0,0.016393,0.016393,0.016393,0.016393,0.032787,0.0,0.0,0.016393,0.016393,0.0,0.016393,0.032787,0.0,0.032787,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.065574,0.0,0.016393,0.016393,0.032787,0.016393,0.0,0.0,0.0,0.0,0.04918,0.0,0.0,0.0,0.016393,0.0,0.0,0.0,0.0,0.04918,0.0,0.0,0.0,0.0,0.04918,0.0,0.0,0.0,0.0,0.0,0.016393,0.016393,0.016393,0.016393,0.0,0.016393,0.0,0.016393,0.016393,0.016393,0.0,0.016393,0.0,0.0,0.016393,0.016393,0.0,0.016393,0.016393,0.0,0.0,0.016393,0.032787,0.0,0.032787,0.016393,0.016393,0.016393,0.0,0.0,0.0,0.065574,0.032787,0.016393,0.016393,0.0,0.0,0.0,0.0,0.0,0.0
2,"Parkview Hill, Woodbine Gardens",0.0,0.0,0.0,0.052632,0.0,0.0,0.0,0.052632,0.052632,0.0,0.0,0.0,0.0,0.0,0.0,0.105263,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.052632,0.052632,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.052632,0.0,0.052632,0.0,0.0,0.0,0.0,0.0,0.052632,0.0,0.0,0.0,0.0,0.052632,0.0,0.0,0.0,0.0,0.052632,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.052632,0.052632,0.157895,0.0,0.0,0.0,0.0,0.0,0.052632,0.0,0.0,0.0,0.0,0.052632,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
3,Thorncliffe Park,0.040816,0.0,0.0,0.020408,0.0,0.020408,0.0,0.0,0.020408,0.0,0.0,0.020408,0.0,0.0,0.0,0.040816,0.020408,0.040816,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.102041,0.0,0.0,0.0,0.0,0.020408,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.020408,0.0,0.0,0.0,0.0,0.020408,0.020408,0.020408,0.0,0.0,0.0,0.061224,0.020408,0.0,0.0,0.020408,0.0,0.061224,0.0,0.020408,0.0,0.0,0.0,0.0,0.0,0.040816,0.0,0.0,0.0,0.020408,0.0,0.020408,0.0,0.020408,0.040816,0.0,0.0,0.0,0.0,0.020408,0.0,0.020408,0.040816,0.020408,0.020408,0.0,0.0,0.0,0.0,0.0,0.040816,0.0,0.0,0.040816,0.0,0.020408,0.0,0.020408
4,Woodbine Heights,0.0,0.0,0.0,0.076923,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.038462,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.038462,0.0,0.076923,0.0,0.0,0.115385,0.0,0.038462,0.038462,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.038462,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.038462,0.0,0.0,0.0,0.0,0.0,0.038462,0.0,0.0,0.0,0.0,0.0,0.0,0.076923,0.038462,0.0,0.0,0.0,0.076923,0.0,0.038462,0.0,0.0,0.0,0.0,0.076923,0.0,0.076923,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.076923,0.0,0.0,0.0,0.0,0.0


In [267]:
EASTYORK_NEIGH_TOP_VENUES = display_top_venues(EASTYORK_NEIGH_VENUES_GROUP)

----East Toronto, Broadview North (Old East York)----
                  venue  freq
0                  Café  0.07
1           Coffee Shop  0.07
2      Greek Restaurant  0.06
3           Pizza Place  0.03
4  Ethiopian Restaurant  0.03


----Leaside----
                    venue  freq
0             Coffee Shop  0.07
1     Sporting Goods Shop  0.07
2       Electronics Store  0.05
3           Grocery Store  0.05
4  Furniture / Home Store  0.05


----Parkview Hill, Woodbine Gardens----
          venue  freq
0   Pizza Place  0.16
1       Brewery  0.11
2   Coffee Shop  0.05
3  Intersection  0.05
4     Gastropub  0.05


----Thorncliffe Park----
               venue  freq
0        Coffee Shop  0.10
1      Grocery Store  0.06
2  Indian Restaurant  0.06
3        Pizza Place  0.04
4       Burger Joint  0.04


----Woodbine Heights----
             venue  freq
0      Coffee Shop  0.12
1  Thai Restaurant  0.08
2     Skating Rink  0.08
3      Pizza Place  0.08
4             Park  0.08




In [270]:
# NOTE(review): `df` is called here as a function, but the top of the notebook binds the
# same name `df` to the scraped postal-code DataFrame. Whichever assignment ran last wins,
# so this cell depends on cell execution order -- TODO: give the helper its own name.
EASTYORK_NEIGH_VENUES_SORTED = df(EASTYORK_NEIGH_VENUES_GROUP)
EASTYORK_NEIGH_VENUES_SORTED.head()

Unnamed: 0,Neighbourhood_Name,1th Most Common Venue,2th Most Common Venue,3th Most Common Venue,4th Most Common Venue,5th Most Common Venue,6th Most Common Venue,7th Most Common Venue,8th Most Common Venue,9th Most Common Venue,10th Most Common Venue
0,"East Toronto, Broadview North (Old East York)",Café,Coffee Shop,Greek Restaurant,Ethiopian Restaurant,Fast Food Restaurant,Pizza Place,Beer Bar,American Restaurant,Bakery,Bank
1,Leaside,Coffee Shop,Sporting Goods Shop,Grocery Store,Electronics Store,Furniture / Home Store,Sandwich Place,Burger Joint,Sports Bar,Department Store,Brewery
2,"Parkview Hill, Woodbine Gardens",Pizza Place,Brewery,Coffee Shop,Bank,Rock Climbing Spot,Pharmacy,Pet Store,Soccer Stadium,Gym / Fitness Center,Intersection
3,Thorncliffe Park,Coffee Shop,Indian Restaurant,Grocery Store,Afghan Restaurant,Middle Eastern Restaurant,Pizza Place,Turkish Restaurant,Supermarket,Brewery,Burger Joint
4,Woodbine Heights,Coffee Shop,Sandwich Place,Skating Rink,Park,Pizza Place,Café,Thai Restaurant,Athletics & Sports,Convenience Store,Bus Stop


In [271]:
cluster(EASTYORK_NEIGH_VENUES_GROUP,5)

Generated labels


array([3, 1, 2, 4, 0])

In [273]:
# NOTE(review): merge() takes its labels from the global `kmeans`, not from the cluster()
# call above. Read in the grouped-table row order, the Cluster_Labels shown below are
# [2, 1, 3, 4, 0] -- the array printed for North York -- not the [3, 1, 2, 4, 0] printed
# for East York, so the global looks stale. TODO: confirm where cluster() keeps its model.
EASTYORK_NEIGH_MERGED = merge(EY_data,EASTYORK_NEIGH_VENUES_SORTED)
EASTYORK_NEIGH_MERGED.head()

Unnamed: 0,Postal Code,Borough,Neighbourhood_Name,Latitude,Longitude,Cluster_Labels,1th Most Common Venue,2th Most Common Venue,3th Most Common Venue,4th Most Common Venue,5th Most Common Venue,6th Most Common Venue,7th Most Common Venue,8th Most Common Venue,9th Most Common Venue,10th Most Common Venue
0,M4B,East York,"Parkview Hill, Woodbine Gardens",43.706397,-79.309937,3,Pizza Place,Brewery,Coffee Shop,Bank,Rock Climbing Spot,Pharmacy,Pet Store,Soccer Stadium,Gym / Fitness Center,Intersection
1,M4C,East York,Woodbine Heights,43.695344,-79.318389,0,Coffee Shop,Sandwich Place,Skating Rink,Park,Pizza Place,Café,Thai Restaurant,Athletics & Sports,Convenience Store,Bus Stop
2,M4G,East York,Leaside,43.70906,-79.363452,1,Coffee Shop,Sporting Goods Shop,Grocery Store,Electronics Store,Furniture / Home Store,Sandwich Place,Burger Joint,Sports Bar,Department Store,Brewery
3,M4H,East York,Thorncliffe Park,43.705369,-79.349372,4,Coffee Shop,Indian Restaurant,Grocery Store,Afghan Restaurant,Middle Eastern Restaurant,Pizza Place,Turkish Restaurant,Supermarket,Brewery,Burger Joint
4,M4J,East York,"East Toronto, Broadview North (Old East York)",43.685347,-79.338106,2,Café,Coffee Shop,Greek Restaurant,Ethiopian Restaurant,Fast Food Restaurant,Pizza Place,Beer Bar,American Restaurant,Bakery,Bank


In [276]:
map(EASTYORK_NEIGH_MERGED,5)

In [277]:
EASTYORK_NEIGH_MERGED.loc[EASTYORK_NEIGH_MERGED['Cluster_Labels'] == 0, EASTYORK_NEIGH_MERGED.columns[[2] + list(range(6, EASTYORK_NEIGH_MERGED.shape[1]))]]

Unnamed: 0,Neighbourhood_Name,1th Most Common Venue,2th Most Common Venue,3th Most Common Venue,4th Most Common Venue,5th Most Common Venue,6th Most Common Venue,7th Most Common Venue,8th Most Common Venue,9th Most Common Venue,10th Most Common Venue
1,Woodbine Heights,Coffee Shop,Sandwich Place,Skating Rink,Park,Pizza Place,Café,Thai Restaurant,Athletics & Sports,Convenience Store,Bus Stop


In [278]:
EASTYORK_NEIGH_MERGED.loc[EASTYORK_NEIGH_MERGED['Cluster_Labels'] == 1, EASTYORK_NEIGH_MERGED.columns[[2] + list(range(6, EASTYORK_NEIGH_MERGED.shape[1]))]]

Unnamed: 0,Neighbourhood_Name,1th Most Common Venue,2th Most Common Venue,3th Most Common Venue,4th Most Common Venue,5th Most Common Venue,6th Most Common Venue,7th Most Common Venue,8th Most Common Venue,9th Most Common Venue,10th Most Common Venue
2,Leaside,Coffee Shop,Sporting Goods Shop,Grocery Store,Electronics Store,Furniture / Home Store,Sandwich Place,Burger Joint,Sports Bar,Department Store,Brewery


In [279]:
EASTYORK_NEIGH_MERGED.loc[EASTYORK_NEIGH_MERGED['Cluster_Labels'] == 2, EASTYORK_NEIGH_MERGED.columns[[2] + list(range(6, EASTYORK_NEIGH_MERGED.shape[1]))]]

Unnamed: 0,Neighbourhood_Name,1th Most Common Venue,2th Most Common Venue,3th Most Common Venue,4th Most Common Venue,5th Most Common Venue,6th Most Common Venue,7th Most Common Venue,8th Most Common Venue,9th Most Common Venue,10th Most Common Venue
4,"East Toronto, Broadview North (Old East York)",Café,Coffee Shop,Greek Restaurant,Ethiopian Restaurant,Fast Food Restaurant,Pizza Place,Beer Bar,American Restaurant,Bakery,Bank


In [280]:
EASTYORK_NEIGH_MERGED.loc[EASTYORK_NEIGH_MERGED['Cluster_Labels'] == 3, EASTYORK_NEIGH_MERGED.columns[[2] + list(range(6, EASTYORK_NEIGH_MERGED.shape[1]))]]

Unnamed: 0,Neighbourhood_Name,1th Most Common Venue,2th Most Common Venue,3th Most Common Venue,4th Most Common Venue,5th Most Common Venue,6th Most Common Venue,7th Most Common Venue,8th Most Common Venue,9th Most Common Venue,10th Most Common Venue
0,"Parkview Hill, Woodbine Gardens",Pizza Place,Brewery,Coffee Shop,Bank,Rock Climbing Spot,Pharmacy,Pet Store,Soccer Stadium,Gym / Fitness Center,Intersection


In [281]:
EASTYORK_NEIGH_MERGED.loc[EASTYORK_NEIGH_MERGED['Cluster_Labels'] == 4, EASTYORK_NEIGH_MERGED.columns[[2] + list(range(6, EASTYORK_NEIGH_MERGED.shape[1]))]]

Unnamed: 0,Neighbourhood_Name,1th Most Common Venue,2th Most Common Venue,3th Most Common Venue,4th Most Common Venue,5th Most Common Venue,6th Most Common Venue,7th Most Common Venue,8th Most Common Venue,9th Most Common Venue,10th Most Common Venue
3,Thorncliffe Park,Coffee Shop,Indian Restaurant,Grocery Store,Afghan Restaurant,Middle Eastern Restaurant,Pizza Place,Turkish Restaurant,Supermarket,Brewery,Burger Joint


In [282]:
# NOTE(review): clustering with k=5 yields labels 0-4 only (see "Generated labels" above),
# so no row has Cluster_Labels == 5 and this selection is always empty.
EASTYORK_NEIGH_MERGED.loc[EASTYORK_NEIGH_MERGED['Cluster_Labels'] == 5, EASTYORK_NEIGH_MERGED.columns[[2] + list(range(6, EASTYORK_NEIGH_MERGED.shape[1]))]]

Unnamed: 0,Neighbourhood_Name,1th Most Common Venue,2th Most Common Venue,3th Most Common Venue,4th Most Common Venue,5th Most Common Venue,6th Most Common Venue,7th Most Common Venue,8th Most Common Venue,9th Most Common Venue,10th Most Common Venue


# Working on York data

In [284]:
Y_data=data('York')
Y_data

Unnamed: 0,Postal Code,Borough,Neighbourhood_Name,Latitude,Longitude
0,M6C,York,Humewood-Cedarvale,43.693781,-79.428191
1,M6E,York,Caledonia-Fairbanks,43.689026,-79.453512
2,M6M,York,"Del Ray, Mount Dennis, Keelsdale and Silverthorn",43.691116,-79.476013
3,M6N,York,"Runnymede, The Junction North",43.673185,-79.487262
4,M9N,York,Weston,43.706876,-79.518188


In [286]:
YORK_NEIGH_VENUES=neigh_explore(Y_data)
YORK_NEIGH_VENUES.head()

The below dataframe contains venues of the neighbourhoods in York


Unnamed: 0,Neighbourhood_Name,Neighbourhood_Lat,Neighbourhood_Lng,Venue_Name,Venue_Category,Venue_Lat,Venue_Lng
0,Humewood-Cedarvale,43.693781,-79.428191,Cedarvale Park,Field,43.692535,-79.428705
1,Humewood-Cedarvale,43.693781,-79.428191,Cedarvale Ravine,Trail,43.690188,-79.426106
2,Humewood-Cedarvale,43.693781,-79.428191,Starbucks,Coffee Shop,43.700598,-79.427433
3,Humewood-Cedarvale,43.693781,-79.428191,Jerusalem Restaurant,Middle Eastern Restaurant,43.700241,-79.428957
4,Humewood-Cedarvale,43.693781,-79.428191,St. Urbain Bagel,Bagel Shop,43.700646,-79.427059


In [287]:
YORK_NEIGH_VENUES_ONEHOT = onehot(YORK_NEIGH_VENUES)
YORK_NEIGH_VENUES_ONEHOT.head()

Unnamed: 0,Neighbourhood_Name,Asian Restaurant,Athletics & Sports,BBQ Joint,Bagel Shop,Bakery,Bank,Bar,Beer Store,Breakfast Spot,Brewery,Burger Joint,Bus Line,Bus Stop,Café,Coffee Shop,Convenience Store,Cosmetics Shop,Dance Studio,Deli / Bodega,Dessert Shop,Diner,Discount Store,Dive Bar,Falafel Restaurant,Fast Food Restaurant,Field,Food Truck,Fried Chicken Joint,Furniture / Home Store,Gas Station,Gastropub,Grocery Store,Gym,Gym / Fitness Center,Hockey Arena,Indian Restaurant,Intersection,Italian Restaurant,Japanese Restaurant,Jewelry Store,Korean Restaurant,Liquor Store,Metro Station,Mexican Restaurant,Middle Eastern Restaurant,Optical Shop,Park,Pharmacy,Pizza Place,Playground,Portuguese Restaurant,Restaurant,Sandwich Place,Shopping Mall,Skating Rink,Soccer Field,Soccer Stadium,Supermarket,Thai Restaurant,Trail,Train Station,Video Game Store,Video Store,Vietnamese Restaurant,Wine Shop,Women's Store
0,Humewood-Cedarvale,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0
1,Humewood-Cedarvale,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0
2,Humewood-Cedarvale,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0
3,Humewood-Cedarvale,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0
4,Humewood-Cedarvale,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0


In [288]:
YORK_NEIGH_VENUES_GROUP = group(YORK_NEIGH_VENUES_ONEHOT)
YORK_NEIGH_VENUES_GROUP.head()

Unnamed: 0,Neighbourhood_Name,Asian Restaurant,Athletics & Sports,BBQ Joint,Bagel Shop,Bakery,Bank,Bar,Beer Store,Breakfast Spot,Brewery,Burger Joint,Bus Line,Bus Stop,Café,Coffee Shop,Convenience Store,Cosmetics Shop,Dance Studio,Deli / Bodega,Dessert Shop,Diner,Discount Store,Dive Bar,Falafel Restaurant,Fast Food Restaurant,Field,Food Truck,Fried Chicken Joint,Furniture / Home Store,Gas Station,Gastropub,Grocery Store,Gym,Gym / Fitness Center,Hockey Arena,Indian Restaurant,Intersection,Italian Restaurant,Japanese Restaurant,Jewelry Store,Korean Restaurant,Liquor Store,Metro Station,Mexican Restaurant,Middle Eastern Restaurant,Optical Shop,Park,Pharmacy,Pizza Place,Playground,Portuguese Restaurant,Restaurant,Sandwich Place,Shopping Mall,Skating Rink,Soccer Field,Soccer Stadium,Supermarket,Thai Restaurant,Trail,Train Station,Video Game Store,Video Store,Vietnamese Restaurant,Wine Shop,Women's Store
0,Caledonia-Fairbanks,0.0,0.0,0.0,0.0,0.043478,0.043478,0.0,0.0,0.0,0.0,0.0,0.043478,0.086957,0.0,0.043478,0.0,0.043478,0.0,0.0,0.0,0.0,0.043478,0.0,0.043478,0.043478,0.0,0.043478,0.0,0.0,0.0,0.0,0.043478,0.043478,0.0,0.0,0.0,0.0,0.0,0.043478,0.0,0.0,0.0,0.0,0.043478,0.0,0.0,0.086957,0.086957,0.086957,0.0,0.043478,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.043478
1,"Del Ray, Mount Dennis, Keelsdale and Silverthorn",0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.066667,0.0,0.066667,0.0,0.0,0.066667,0.0,0.0,0.0,0.2,0.066667,0.0,0.133333,0.0,0.0,0.0,0.0,0.0,0.066667,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.066667,0.0,0.0,0.066667,0.066667,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.066667,0.0,0.066667,0.0
2,Humewood-Cedarvale,0.0,0.0,0.0,0.037037,0.0,0.037037,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.074074,0.074074,0.0,0.037037,0.037037,0.0,0.0,0.0,0.0,0.0,0.0,0.037037,0.0,0.0,0.0,0.0,0.037037,0.074074,0.0,0.0,0.037037,0.0,0.037037,0.037037,0.0,0.0,0.037037,0.0,0.037037,0.0,0.037037,0.037037,0.037037,0.037037,0.111111,0.0,0.0,0.0,0.037037,0.0,0.0,0.0,0.037037,0.0,0.0,0.037037,0.0,0.0,0.0,0.0,0.0,0.0
3,"Runnymede, The Junction North",0.022222,0.044444,0.022222,0.0,0.0,0.0,0.022222,0.044444,0.0,0.066667,0.022222,0.044444,0.0,0.022222,0.111111,0.044444,0.0,0.022222,0.0,0.0,0.0,0.022222,0.022222,0.0,0.022222,0.0,0.0,0.022222,0.022222,0.044444,0.0,0.0,0.0,0.022222,0.0,0.022222,0.0,0.0,0.0,0.0,0.0,0.022222,0.0,0.0,0.0,0.0,0.044444,0.022222,0.066667,0.0,0.0,0.0,0.044444,0.0,0.022222,0.0,0.0,0.022222,0.022222,0.0,0.0,0.022222,0.0,0.022222,0.0,0.0
4,Weston,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.071429,0.0,0.0,0.0,0.0,0.0,0.071429,0.0,0.0,0.0,0.0,0.0,0.071429,0.071429,0.0,0.0,0.0,0.0,0.0,0.071429,0.071429,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.071429,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.071429,0.071429,0.0,0.0,0.071429,0.0,0.0,0.071429,0.071429,0.0,0.0,0.0,0.0,0.142857,0.0,0.0,0.0,0.0,0.0


In [289]:
YORK_NEIGH_TOP_VENUES = display_top_venues(YORK_NEIGH_VENUES_GROUP)

----Caledonia-Fairbanks----
           venue  freq
0           Park  0.09
1       Pharmacy  0.09
2    Pizza Place  0.09
3       Bus Stop  0.09
4  Women's Store  0.04


----Del Ray, Mount Dennis, Keelsdale and Silverthorn----
                    venue  freq
0  Furniture / Home Store  0.20
1           Grocery Store  0.13
2             Gas Station  0.07
3            Dessert Shop  0.07
4              Playground  0.07


----Humewood-Cedarvale----
               venue  freq
0        Pizza Place  0.11
1  Convenience Store  0.07
2        Coffee Shop  0.07
3      Grocery Store  0.07
4  Korean Restaurant  0.04


----Runnymede, The Junction North----
         venue  freq
0  Coffee Shop  0.11
1      Brewery  0.07
2  Pizza Place  0.07
3     Bus Line  0.04
4         Park  0.04


----Weston----
                    venue  freq
0           Train Station  0.14
1     Fried Chicken Joint  0.07
2  Furniture / Home Store  0.07
3                   Diner  0.07
4                Pharmacy  0.07




In [290]:
# NOTE(review): `df` is called here as a function, but the top of the notebook binds the
# same name `df` to the scraped postal-code DataFrame. Whichever assignment ran last wins,
# so this cell depends on cell execution order -- TODO: give the helper its own name.
YORK_NEIGH_VENUES_SORTED = df(YORK_NEIGH_VENUES_GROUP)
YORK_NEIGH_VENUES_SORTED.head()

Unnamed: 0,Neighbourhood_Name,1th Most Common Venue,2th Most Common Venue,3th Most Common Venue,4th Most Common Venue,5th Most Common Venue,6th Most Common Venue,7th Most Common Venue,8th Most Common Venue,9th Most Common Venue,10th Most Common Venue
0,Caledonia-Fairbanks,Pharmacy,Park,Bus Stop,Pizza Place,Fast Food Restaurant,Mexican Restaurant,Japanese Restaurant,Grocery Store,Food Truck,Women's Store
1,"Del Ray, Mount Dennis, Keelsdale and Silverthorn",Furniture / Home Store,Grocery Store,Gas Station,Shopping Mall,Dessert Shop,Playground,Discount Store,Sandwich Place,Italian Restaurant,Fast Food Restaurant
2,Humewood-Cedarvale,Pizza Place,Grocery Store,Convenience Store,Coffee Shop,Optical Shop,Gastropub,Deli / Bodega,Hockey Arena,Dance Studio,Intersection
3,"Runnymede, The Junction North",Coffee Shop,Pizza Place,Brewery,Park,Athletics & Sports,Gas Station,Beer Store,Sandwich Place,Bus Line,Convenience Store
4,Weston,Train Station,Pharmacy,Skating Rink,Discount Store,Diner,Jewelry Store,Coffee Shop,Furniture / Home Store,Pizza Place,Restaurant


In [291]:
cluster(YORK_NEIGH_VENUES_GROUP,5)

Generated labels


array([3, 1, 4, 2, 0])

In [292]:
# NOTE(review): merge() takes its labels from the global `kmeans`, not from the cluster()
# call above. Read in the grouped-table row order, the Cluster_Labels shown below are
# [2, 1, 3, 4, 0] -- the array printed for North York -- not the [3, 1, 4, 2, 0] printed
# for York, so the global looks stale. TODO: confirm where cluster() keeps its model.
YORK_NEIGH_MERGED = merge(Y_data,YORK_NEIGH_VENUES_SORTED)
YORK_NEIGH_MERGED.head()

Unnamed: 0,Postal Code,Borough,Neighbourhood_Name,Latitude,Longitude,Cluster_Labels,1th Most Common Venue,2th Most Common Venue,3th Most Common Venue,4th Most Common Venue,5th Most Common Venue,6th Most Common Venue,7th Most Common Venue,8th Most Common Venue,9th Most Common Venue,10th Most Common Venue
0,M6C,York,Humewood-Cedarvale,43.693781,-79.428191,3,Pizza Place,Grocery Store,Convenience Store,Coffee Shop,Optical Shop,Gastropub,Deli / Bodega,Hockey Arena,Dance Studio,Intersection
1,M6E,York,Caledonia-Fairbanks,43.689026,-79.453512,2,Pharmacy,Park,Bus Stop,Pizza Place,Fast Food Restaurant,Mexican Restaurant,Japanese Restaurant,Grocery Store,Food Truck,Women's Store
2,M6M,York,"Del Ray, Mount Dennis, Keelsdale and Silverthorn",43.691116,-79.476013,1,Furniture / Home Store,Grocery Store,Gas Station,Shopping Mall,Dessert Shop,Playground,Discount Store,Sandwich Place,Italian Restaurant,Fast Food Restaurant
3,M6N,York,"Runnymede, The Junction North",43.673185,-79.487262,4,Coffee Shop,Pizza Place,Brewery,Park,Athletics & Sports,Gas Station,Beer Store,Sandwich Place,Bus Line,Convenience Store
4,M9N,York,Weston,43.706876,-79.518188,0,Train Station,Pharmacy,Skating Rink,Discount Store,Diner,Jewelry Store,Coffee Shop,Furniture / Home Store,Pizza Place,Restaurant


In [301]:
map(YORK_NEIGH_MERGED,5)

In [294]:
YORK_NEIGH_MERGED.loc[YORK_NEIGH_MERGED['Cluster_Labels'] == 0, YORK_NEIGH_MERGED.columns[[2] + list(range(6, YORK_NEIGH_MERGED.shape[1]))]]

Unnamed: 0,Neighbourhood_Name,1th Most Common Venue,2th Most Common Venue,3th Most Common Venue,4th Most Common Venue,5th Most Common Venue,6th Most Common Venue,7th Most Common Venue,8th Most Common Venue,9th Most Common Venue,10th Most Common Venue
4,Weston,Train Station,Pharmacy,Skating Rink,Discount Store,Diner,Jewelry Store,Coffee Shop,Furniture / Home Store,Pizza Place,Restaurant


In [295]:
YORK_NEIGH_MERGED.loc[YORK_NEIGH_MERGED['Cluster_Labels'] == 1, YORK_NEIGH_MERGED.columns[[2] + list(range(6, YORK_NEIGH_MERGED.shape[1]))]]

Unnamed: 0,Neighbourhood_Name,1th Most Common Venue,2th Most Common Venue,3th Most Common Venue,4th Most Common Venue,5th Most Common Venue,6th Most Common Venue,7th Most Common Venue,8th Most Common Venue,9th Most Common Venue,10th Most Common Venue
2,"Del Ray, Mount Dennis, Keelsdale and Silverthorn",Furniture / Home Store,Grocery Store,Gas Station,Shopping Mall,Dessert Shop,Playground,Discount Store,Sandwich Place,Italian Restaurant,Fast Food Restaurant


In [296]:
YORK_NEIGH_MERGED.loc[YORK_NEIGH_MERGED['Cluster_Labels'] == 2, YORK_NEIGH_MERGED.columns[[2] + list(range(6, YORK_NEIGH_MERGED.shape[1]))]]

Unnamed: 0,Neighbourhood_Name,1th Most Common Venue,2th Most Common Venue,3th Most Common Venue,4th Most Common Venue,5th Most Common Venue,6th Most Common Venue,7th Most Common Venue,8th Most Common Venue,9th Most Common Venue,10th Most Common Venue
1,Caledonia-Fairbanks,Pharmacy,Park,Bus Stop,Pizza Place,Fast Food Restaurant,Mexican Restaurant,Japanese Restaurant,Grocery Store,Food Truck,Women's Store


In [297]:
YORK_NEIGH_MERGED.loc[YORK_NEIGH_MERGED['Cluster_Labels'] == 3, YORK_NEIGH_MERGED.columns[[2] + list(range(6, YORK_NEIGH_MERGED.shape[1]))]]

Unnamed: 0,Neighbourhood_Name,1th Most Common Venue,2th Most Common Venue,3th Most Common Venue,4th Most Common Venue,5th Most Common Venue,6th Most Common Venue,7th Most Common Venue,8th Most Common Venue,9th Most Common Venue,10th Most Common Venue
0,Humewood-Cedarvale,Pizza Place,Grocery Store,Convenience Store,Coffee Shop,Optical Shop,Gastropub,Deli / Bodega,Hockey Arena,Dance Studio,Intersection


In [298]:
YORK_NEIGH_MERGED.loc[YORK_NEIGH_MERGED['Cluster_Labels'] == 4, YORK_NEIGH_MERGED.columns[[2] + list(range(6, YORK_NEIGH_MERGED.shape[1]))]]

Unnamed: 0,Neighbourhood_Name,1th Most Common Venue,2th Most Common Venue,3th Most Common Venue,4th Most Common Venue,5th Most Common Venue,6th Most Common Venue,7th Most Common Venue,8th Most Common Venue,9th Most Common Venue,10th Most Common Venue
3,"Runnymede, The Junction North",Coffee Shop,Pizza Place,Brewery,Park,Athletics & Sports,Gas Station,Beer Store,Sandwich Place,Bus Line,Convenience Store


In [299]:
# NOTE(review): clustering with k=5 yields labels 0-4 only (see "Generated labels" above),
# so no row has Cluster_Labels == 5 and this selection is always empty.
YORK_NEIGH_MERGED.loc[YORK_NEIGH_MERGED['Cluster_Labels'] == 5, YORK_NEIGH_MERGED.columns[[2] + list(range(6, YORK_NEIGH_MERGED.shape[1]))]]

Unnamed: 0,Neighbourhood_Name,1th Most Common Venue,2th Most Common Venue,3th Most Common Venue,4th Most Common Venue,5th Most Common Venue,6th Most Common Venue,7th Most Common Venue,8th Most Common Venue,9th Most Common Venue,10th Most Common Venue
