# Eat Safe, Love

## Notebook Set Up

In [2]:
# Import dependencies
from pymongo import MongoClient
import pandas as pd
from pprint import pprint

In [3]:
# Create an instance of MongoClient
mongo = MongoClient(port=27017)

In [4]:
# assign the uk_food database to a variable name
db = mongo['uk_food']

In [5]:
# review the collections in our database
print(db.list_collection_names())

['establishments']


In [6]:
# assign the collection to a variable
establishments = db['establishments']

## Part 3: Exploratory Analysis
Unless otherwise stated, for each question: 
* Use `count_documents` to display the number of documents contained in the result.
* Display the first document in the results using `pprint`.
* Convert the result to a Pandas DataFrame, print the number of rows in the DataFrame, and display the first 10 rows.

### 1. Which establishments have a hygiene score equal to 20?

In [7]:
# Find the establishments with a hygiene score of 20
query = {
    'scores.Hygiene':20
}
results = establishments.find(query)
# Use count_documents to display the number of documents in the result
count = establishments.count_documents(query)
print(f'There are {count} establishments with a hygiene score of 20.')
# Display the first document in the results using pprint
pprint(results[0])

There are 41 establishments with a hygiene score of 20.
{'AddressLine1': '5-6 Southfields Road',
 'AddressLine2': 'Eastbourne',
 'AddressLine3': 'East Sussex',
 'AddressLine4': '',
 'BusinessName': 'The Chase Rest Home',
 'BusinessType': 'Caring Premises',
 'BusinessTypeID': 5,
 'ChangesByServerID': 0,
 'Distance': 4613.888288172291,
 'FHRSID': 110681,
 'LocalAuthorityBusinessID': '4029',
 'LocalAuthorityCode': '102',
 'LocalAuthorityEmailAddress': 'Customerfirst@eastbourne.gov.uk',
 'LocalAuthorityName': 'Eastbourne',
 'LocalAuthorityWebSite': 'http://www.eastbourne.gov.uk/foodratings',
 'NewRatingPending': False,
 'Phone': '',
 'PostCode': 'BN21 1BU',
 'RatingDate': '2021-09-23T00:00:00',
 'RatingKey': 'fhrs_0_en-gb',
 'RatingValue': 0,
 'RightToReply': '',
 'SchemeType': 'FHRS',
 '_id': ObjectId('65f2d1bbc93348ed384bd1ce'),
 'geocode': {'latitude': 50.769705, 'longitude': 0.27694},
 'links': [{'href': 'https://api.ratings.food.gov.uk/establishments/110681',
            'rel': 'self'

In [8]:
# Convert the result to a Pandas DataFrame
hygiene_df = pd.json_normalize(results)
# Display the number of rows in the DataFrame
print(f'Added {len(hygiene_df)} fields to hygiene_df')
# Display the first 10 rows of the DataFrame
hygiene_df.head(10)

Added 41 fields to hygiene_df


Unnamed: 0,_id,FHRSID,ChangesByServerID,LocalAuthorityBusinessID,BusinessName,BusinessType,BusinessTypeID,AddressLine1,AddressLine2,AddressLine3,...,geocode.longitude,geocode.latitude,meta.dataSource,meta.extractDate,meta.itemCount,meta.returncode,meta.totalCount,meta.totalPages,meta.pageSize,meta.pageNumber
0,65f2d1bbc93348ed384bd1ce,110681,0,4029,The Chase Rest Home,Caring Premises,5,5-6 Southfields Road,Eastbourne,East Sussex,...,0.27694,50.769705,,0001-01-01T00:00:00,0,,0,0,0,0
1,65f2d1bbc93348ed384bd54f,612039,0,1970/FOOD,Brenalwood,Caring Premises,5,Hall Lane,Walton-on-the-Naze,Essex,...,1.278721,51.857536,,0001-01-01T00:00:00,0,,0,0,0,0
2,65f2d1bbc93348ed384bd857,730933,0,1698/FOOD,Melrose Hotel,Hotel/bed & breakfast/guest house,7842,53 Marine Parade East,Clacton On Sea,Essex,...,1.15927,51.789429,,0001-01-01T00:00:00,0,,0,0,0,0
3,65f2d1bbc93348ed384bda43,172735,0,PI/000023858,Seaford Pizza,Takeaway/sandwich shop,7844,4 High Street,Seaford,East Sussex,...,0.10202,50.770885,,0001-01-01T00:00:00,0,,0,0,0,0
4,65f2d1bbc93348ed384bda56,172953,0,PI/000024532,Golden Palace,Restaurant/Cafe/Canteen,1,5 South Street,Seaford,East Sussex,...,0.101446,50.770724,,0001-01-01T00:00:00,0,,0,0,0,0
5,65f2d1bbc93348ed384be3f5,512854,0,12/00816/BUTH,Ashby's Butchers,Retailers - other,4613,777 Southchurch Road,Southend-On-Sea,Essex,...,0.736349,51.541448,,0001-01-01T00:00:00,0,,0,0,0,0
6,65f2d1bbc93348ed384be624,1537089,0,22/00224/RESTUN,South Sea Express Cuisine,Restaurant/Cafe/Canteen,1,33 Alexandra Street,Southend-on-sea,Essex,...,0.712167,51.535007,,0001-01-01T00:00:00,0,,0,0,0,0
7,65f2d1bbc93348ed384bfb4b,155648,0,EH/00006058,Golden Palace,Takeaway/sandwich shop,7844,7 London Road,Rayleigh,Essex,...,0.602364,51.591515,,0001-01-01T00:00:00,0,,0,0,0,0
8,65f2d1bbc93348ed384bff82,1012883,0,17/00110/MIXED/S,The Tulip Tree,Restaurant/Cafe/Canteen,1,3 The Village,Chiddingstone,KENT,...,0.14645,51.185947,,0001-01-01T00:00:00,0,,0,0,0,0
9,65f2d1bbc93348ed384c0795,644109,0,41811,F & S,Retailers - other,4613,,81 Southernhay,Basildon,...,0.462307,51.57005,,0001-01-01T00:00:00,0,,0,0,0,0


### 2. Which establishments in London have a `RatingValue` greater than or equal to 4?

In [21]:
# Find the establishments with London as the Local Authority and has a RatingValue greater than or equal to 4.
query = {
    'RatingValue':{'$gte':4}
}
results = establishments.find(query)
# Use count_documents to display the number of documents in the result
count = establishments.count_documents(query)
print(f'There are {count} establishments with a rating value greater than or equal to 4.')
# Display the first document in the results using pprint
pprint(results[0])

There are 31257 establishments with a rating value greater than or equal to 4.
{'AddressLine1': 'East Cliff Pavilion',
 'AddressLine2': 'Wear Bay Road',
 'AddressLine3': 'Folkestone',
 'AddressLine4': 'Kent',
 'BusinessName': 'The Pavilion',
 'BusinessType': 'Restaurant/Cafe/Canteen',
 'BusinessTypeID': 1,
 'ChangesByServerID': 0,
 'Distance': 4591.765489457773,
 'FHRSID': 1043695,
 'LocalAuthorityBusinessID': 'PI/000073616',
 'LocalAuthorityCode': '188',
 'LocalAuthorityEmailAddress': 'foodteam@folkestone-hythe.gov.uk',
 'LocalAuthorityName': 'Folkestone and Hythe',
 'LocalAuthorityWebSite': 'http://www.folkestone-hythe.gov.uk',
 'NewRatingPending': False,
 'Phone': '',
 'PostCode': 'CT19 6BL',
 'RatingDate': '2018-04-04T00:00:00',
 'RatingKey': 'fhrs_5_en-gb',
 'RatingValue': 5,
 'RightToReply': '',
 'SchemeType': 'FHRS',
 '_id': ObjectId('65f2d1bac93348ed384bb69a'),
 'geocode': {'latitude': 51.083812, 'longitude': 1.195625},
 'links': [{'href': 'https://api.ratings.food.gov.uk/estab

In [22]:
# Convert the result to a Pandas DataFrame
rating_df = pd.json_normalize(results)
# Display the number of rows in the DataFrame
print(f'{len(rating_df)} items have been added to rating_df')
# Display the first 10 rows of the DataFrame
rating_df.head(10)

31257 items have been added to rating_df


Unnamed: 0,_id,FHRSID,ChangesByServerID,LocalAuthorityBusinessID,BusinessName,BusinessType,BusinessTypeID,AddressLine1,AddressLine2,AddressLine3,...,geocode.longitude,geocode.latitude,meta.dataSource,meta.extractDate,meta.itemCount,meta.returncode,meta.totalCount,meta.totalPages,meta.pageSize,meta.pageNumber
0,65f2d1bac93348ed384bb69a,1043695,0,PI/000073616,The Pavilion,Restaurant/Cafe/Canteen,1,East Cliff Pavilion,Wear Bay Road,Folkestone,...,1.195625,51.083812,,0001-01-01T00:00:00,0,,0,0,0,0
1,65f2d1bac93348ed384bb69b,289560,0,PI/000039927,Mariner,Pub/bar/nightclub,7843,16 The Stade,Folkestone,Kent,...,1.188537,51.08084,,0001-01-01T00:00:00,0,,0,0,0,0
2,65f2d1bac93348ed384bb69c,289352,0,PI/000002460,The Ship,Pub/bar/nightclub,7843,23 The Stade,Folkestone,Kent,...,1.188537,51.08084,,0001-01-01T00:00:00,0,,0,0,0,0
3,65f2d1bac93348ed384bb69d,344689,0,PI/000002095,Folkestone Trawlers Shop,Retailers - other,4613,1 The Stade,Folkestone,Kent,...,1.188537,51.08084,,0001-01-01T00:00:00,0,,0,0,0,0
4,65f2d1bac93348ed384bb69e,987206,0,PI/000075655,The Ships Galley,Pub/bar/nightclub,7843,The Ship,23 The Stade,Folkestone,...,1.188537,51.08084,,0001-01-01T00:00:00,0,,0,0,0,0
5,65f2d1bac93348ed384bb6a0,647177,0,PI/000041489,Wear Bay Bowls Club,Pub/bar/nightclub,7843,Wear Bay Road,Folkestone,Kent,...,1.196408,51.086058,,0001-01-01T00:00:00,0,,0,0,0,0
6,65f2d1bac93348ed384bb6a2,289353,0,PI/000002468,St Marys COE (aided) Primary School,School/college/university,7845,St Marys Church Of England Primary School,Warren Road,Folkestone,...,1.194762,51.085797,,0001-01-01T00:00:00,0,,0,0,0,0
7,65f2d1bac93348ed384bb6a5,1043701,0,PI/000076360,Pick Up Pintxos,Takeaway/sandwich shop,7844,Folkestone Harbour,Harbour Approach Road,Folkestone,...,1.185903,51.078352,,0001-01-01T00:00:00,0,,0,0,0,0
8,65f2d1bac93348ed384bb6a6,894592,0,PI/000074396,Docker,Retailers - other,4613,Folkestone Harbour,Harbour Approach Road,Folkestone,...,1.185903,51.078352,,0001-01-01T00:00:00,0,,0,0,0,0
9,65f2d1bac93348ed384bb6a7,805702,0,PI/000073219,Dr Legumes - Harbour Arm,Restaurant/Cafe/Canteen,1,Folkestone Harbour,Harbour Approach Road,Folkestone,...,1.185903,51.078352,,0001-01-01T00:00:00,0,,0,0,0,0


### 3. What are the top 5 establishments with a `RatingValue` rating value of 5, sorted by lowest hygiene score, nearest to the new restaurant added, "Penang Flavours"?

In [68]:
# Search within 0.01 degree on either side of the latitude and longitude.
# Rating value must equal 5
# Sort by hygiene score

degree_search = 0.01
latitude_result = establishments.find_one({'BusinessName':'Penang Flavours'},{'geocode.latitude':1})
longitude_result = establishments.find_one({'BusinessName':'Penang Flavours'},{'geocode.longitude':1})
latitude = latitude_result['geocode']['latitude']
longitude = longitude_result['geocode']['longitude']

query = {
    'RatingValue':5,
    'geocode.latitude':{'$gt':(latitude-degree_search), '$lt':(latitude+degree_search)},
    'geocode.longitude':{'$gt':(longitude-degree_search), '$lt':(longitude+degree_search)}
}

sort = {
    'hygiene':-1
}
limit = 5

results = list(establishments.find(query).sort(sort).limit(limit))

# Print the results
pprint(results)


[{'AddressLine1': '130 - 132 Plumstead High Street',
  'AddressLine2': '',
  'AddressLine3': 'Plumstead',
  'AddressLine4': 'Greenwich',
  'BusinessName': 'Volunteer',
  'BusinessType': 'Pub/bar/nightclub',
  'BusinessTypeID': 7843,
  'ChangesByServerID': 0,
  'Distance': 4646.965634598608,
  'FHRSID': 694609,
  'LocalAuthorityBusinessID': 'PI/000116619',
  'LocalAuthorityCode': '511',
  'LocalAuthorityEmailAddress': 'health@royalgreenwich.gov.uk',
  'LocalAuthorityName': 'Greenwich',
  'LocalAuthorityWebSite': 'http://www.royalgreenwich.gov.uk',
  'NewRatingPending': False,
  'Phone': '',
  'PostCode': 'SE18 1JQ',
  'RatingDate': '2019-08-05T00:00:00',
  'RatingKey': 'fhrs_5_en-gb',
  'RatingValue': 5,
  'RightToReply': '',
  'SchemeType': 'FHRS',
  '_id': ObjectId('65f2d1bcc93348ed384c2a2b'),
  'geocode': {'latitude': 51.4873437, 'longitude': 0.09208},
  'links': [{'href': 'http://api.ratings.food.gov.uk/establishments/694609',
             'rel': 'self'}],
  'meta': {'dataSource': N

In [69]:
# Convert result to Pandas DataFrame
query_df = pd.json_normalize(results)
print(f'{len(query_df)} items have been added to query_df')
query_df.head()


5 items have been added to query_df


Unnamed: 0,_id,FHRSID,ChangesByServerID,LocalAuthorityBusinessID,BusinessName,BusinessType,BusinessTypeID,AddressLine1,AddressLine2,AddressLine3,...,geocode.longitude,geocode.latitude,meta.dataSource,meta.extractDate,meta.itemCount,meta.returncode,meta.totalCount,meta.totalPages,meta.pageSize,meta.pageNumber
0,65f2d1bcc93348ed384c2a2b,694609,0,PI/000116619,Volunteer,Pub/bar/nightclub,7843,130 - 132 Plumstead High Street,,Plumstead,...,0.09208,51.487344,,0001-01-01T00:00:00,0,,0,0,0,0
1,65f2d1bcc93348ed384c2a42,695241,0,PI/000179088,Plumstead Manor Nursery,Caring Premises,5,Plumstead Manor School Old Mill Road,,Plumstead,...,0.085994,51.481518,,0001-01-01T00:00:00,0,,0,0,0,0
2,65f2d1bcc93348ed384c29ff,695223,0,PI/000178842,Iceland,Retailers - supermarkets/hypermarkets,7840,144 - 146 Plumstead High Street,,Plumstead,...,0.09242,51.487148,,0001-01-01T00:00:00,0,,0,0,0,0
3,65f2d1bcc93348ed384c29d8,1069652,0,PI/000206841,TIWA N TIWA African Restaurant Ltd,Restaurant/Cafe/Canteen,1,152 Plumstead High Street,,Plumstead,...,0.092743,51.487035,,0001-01-01T00:00:00,0,,0,0,0,0
4,65f2d1bcc93348ed384c2a15,1380578,0,14425,Howe and Co Fish and Chips - Van 17,Mobile caterer,7846,Restaurant And Premises 107A Plumstead High St...,,Plumstead,...,0.092537,51.487534,,0001-01-01T00:00:00,0,,0,0,0,0


### 4. How many establishments in each Local Authority area have a hygiene score of 0?

In [83]:
# Create a pipeline that:
# 1. Matches establishments with a hygiene score of 0
match_query = {
    '$match':{'scores.Hygiene':0}
}
# 2. Groups the matches by Local Authority
group_query = {
    '$group':{'_id':{'Local Authority':'$LocalAuthorityName'},
              'count':{'$sum':1}}
}
# 3. Sorts the matches from highest to lowest
sort_query = {
    '$sort':{'count':-1}
}

# Print the number of documents in the result
pipeline = [match_query, group_query, sort_query]
results = list(establishments.aggregate(pipeline))

# Print the first 10 results
for i in range(10):
    pprint(results[i])


{'_id': {'Local Authority': 'Thanet'}, 'count': 1130}
{'_id': {'Local Authority': 'Greenwich'}, 'count': 882}
{'_id': {'Local Authority': 'Maidstone'}, 'count': 713}
{'_id': {'Local Authority': 'Newham'}, 'count': 711}
{'_id': {'Local Authority': 'Swale'}, 'count': 686}
{'_id': {'Local Authority': 'Chelmsford'}, 'count': 680}
{'_id': {'Local Authority': 'Medway'}, 'count': 672}
{'_id': {'Local Authority': 'Bexley'}, 'count': 607}
{'_id': {'Local Authority': 'Southend-On-Sea'}, 'count': 586}
{'_id': {'Local Authority': 'Tendring'}, 'count': 542}


In [84]:
# Convert the result to a Pandas DataFrame
lowest_hygiene_df = pd.json_normalize(results)
# Display the number of rows in the DataFrame
print(f'{len(lowest_hygiene_df)} items have been added to lowest_hygiene_df')
# Display the first 10 rows of the DataFrame
lowest_hygiene_df.head(10)

55 items have been added to lowest_hygiene_df


Unnamed: 0,count,_id.Local Authority
0,1130,Thanet
1,882,Greenwich
2,713,Maidstone
3,711,Newham
4,686,Swale
5,680,Chelmsford
6,672,Medway
7,607,Bexley
8,586,Southend-On-Sea
9,542,Tendring
