# Eat Safe, Love

## Notebook Set Up

In [271]:
# Import dependencies
from pymongo import MongoClient
from pprint import pprint
import pandas as pd

In [272]:
# Create an instance of MongoClient
mongo = MongoClient(port=27017)

In [273]:
# assign the uk_food database to a variable name
db = mongo['uk_food']

In [274]:
# review the collections in our database
print(db.list_collection_names())

['establishments']


In [275]:
# assign the collection to a variable
establishments = db['establishments']

## Part 3: Exploratory Analysis
Unless otherwise stated, for each question: 
* Use `count_documents` to display the number of documents contained in the result.
* Display the first document in the results using `pprint`.
* Convert the result to a Pandas DataFrame, print the number of rows in the DataFrame, and display the first 10 rows.

### 1. Which establishments have a hygiene score equal to 20?

In [276]:
# Find the establishments with a hygiene score of 20
query = {'scores.Hygiene' : {'$eq' : 20},  }

# Use count_documents to display the number of documents in the result
print("Number of records in result:", establishments.count_documents(query))


Number of records in result: 41


In [277]:
# Display the first document using pprint

pprint(establishments.find_one(query))

{'AddressLine1': '5-6 Southfields Road',
 'AddressLine2': 'Eastbourne',
 'AddressLine3': 'East Sussex',
 'AddressLine4': '',
 'BusinessName': 'The Chase Rest Home',
 'BusinessType': 'Caring Premises',
 'BusinessTypeID': 5,
 'ChangesByServerID': 0,
 'Distance': 4613.888288172291,
 'FHRSID': 110681,
 'LocalAuthorityBusinessID': '4029',
 'LocalAuthorityCode': '102',
 'LocalAuthorityEmailAddress': 'Customerfirst@eastbourne.gov.uk',
 'LocalAuthorityName': 'Eastbourne',
 'LocalAuthorityWebSite': 'http://www.eastbourne.gov.uk/foodratings',
 'NewRatingPending': False,
 'Phone': '',
 'PostCode': 'BN21 1BU',
 'RatingDate': '2021-09-23T00:00:00',
 'RatingKey': 'fhrs_0_en-gb',
 'RatingValue': '0',
 'RightToReply': '',
 'SchemeType': 'FHRS',
 '_id': ObjectId('646ff9e34922150fc439dc07'),
 'geocode': {'latitude': 50.769705, 'longitude': 0.27694},
 'links': [{'href': 'https://api.ratings.food.gov.uk/establishments/110681',
            'rel': 'self'}],
 'meta': {'dataSource': None,
          'extractDa

In [278]:
# Convert the result to a Pandas DataFrame
results = establishments.find(query)
hygiene_equal_20_df = pd.DataFrame(results)

# Display the number of rows in the DataFrame
print("Rows in DataFrame: ", len(hygiene_equal_20_df))


Rows in DataFrame:  41


In [279]:
# Display the first 10 rows of the DataFrame
hygiene_equal_20_df.head(10)

Unnamed: 0,_id,FHRSID,ChangesByServerID,LocalAuthorityBusinessID,BusinessName,BusinessType,BusinessTypeID,AddressLine1,AddressLine2,AddressLine3,...,LocalAuthorityWebSite,LocalAuthorityEmailAddress,scores,SchemeType,geocode,RightToReply,Distance,NewRatingPending,meta,links
0,646ff9e34922150fc439dc07,110681,0,4029,The Chase Rest Home,Caring Premises,5,5-6 Southfields Road,Eastbourne,East Sussex,...,http://www.eastbourne.gov.uk/foodratings,Customerfirst@eastbourne.gov.uk,"{'Hygiene': 20, 'Structural': 20, 'ConfidenceI...",FHRS,"{'longitude': 0.27694, 'latitude': 50.769705}",,4613.888288,False,"{'dataSource': None, 'extractDate': '0001-01-0...","[{'rel': 'self', 'href': 'https://api.ratings...."
1,646ff9e34922150fc439df88,612039,0,1970/FOOD,Brenalwood,Caring Premises,5,Hall Lane,Walton-on-the-Naze,Essex,...,http://www.tendringdc.gov.uk/,fhsadmin@tendringdc.gov.uk,"{'Hygiene': 20, 'Structural': 15, 'ConfidenceI...",FHRS,"{'longitude': 1.278721, 'latitude': 51.857536}",,4617.965824,False,"{'dataSource': None, 'extractDate': '0001-01-0...","[{'rel': 'self', 'href': 'https://api.ratings...."
2,646ff9e34922150fc439e297,730933,0,1698/FOOD,Melrose Hotel,Hotel/bed & breakfast/guest house,7842,53 Marine Parade East,Clacton On Sea,Essex,...,http://www.tendringdc.gov.uk/,fhsadmin@tendringdc.gov.uk,"{'Hygiene': 20, 'Structural': 20, 'ConfidenceI...",FHRS,"{'longitude': 1.15927, 'latitude': 51.789429}",,4619.656144,False,"{'dataSource': None, 'extractDate': '0001-01-0...","[{'rel': 'self', 'href': 'https://api.ratings...."
3,646ff9e34922150fc439e477,172735,0,PI/000023858,Seaford Pizza,Takeaway/sandwich shop,7844,4 High Street,Seaford,East Sussex,...,http://www.lewes-eastbourne.gov.uk/,ehealth.ldc@lewes-eastbourne.gov.uk,"{'Hygiene': 20, 'Structural': 10, 'ConfidenceI...",FHRS,"{'longitude': 0.10202, 'latitude': 50.770885}",,4620.421725,False,"{'dataSource': None, 'extractDate': '0001-01-0...","[{'rel': 'self', 'href': 'https://api.ratings...."
4,646ff9e34922150fc439e491,172953,0,PI/000024532,Golden Palace,Restaurant/Cafe/Canteen,1,5 South Street,Seaford,East Sussex,...,http://www.lewes-eastbourne.gov.uk/,ehealth.ldc@lewes-eastbourne.gov.uk,"{'Hygiene': 20, 'Structural': 10, 'ConfidenceI...",FHRS,"{'longitude': 0.101446, 'latitude': 50.770724}",,4620.437179,False,"{'dataSource': None, 'extractDate': '0001-01-0...","[{'rel': 'self', 'href': 'https://api.ratings...."
5,646ff9e34922150fc439ee2b,512854,0,12/00816/BUTH,Ashby's Butchers,Retailers - other,4613,777 Southchurch Road,Southend-On-Sea,Essex,...,http://www.southend.gov.uk,EnvironmentalHealth@southend.gov.uk,"{'Hygiene': 20, 'Structural': 20, 'ConfidenceI...",FHRS,"{'longitude': 0.736349, 'latitude': 51.541448}",,4625.565258,False,"{'dataSource': None, 'extractDate': '0001-01-0...","[{'rel': 'self', 'href': 'https://api.ratings...."
6,646ff9e34922150fc439f056,1537089,0,22/00224/RESTUN,South Sea Express Cuisine,Restaurant/Cafe/Canteen,1,33 Alexandra Street,Southend-on-sea,Essex,...,http://www.southend.gov.uk,EnvironmentalHealth@southend.gov.uk,"{'Hygiene': 20, 'Structural': 20, 'ConfidenceI...",FHRS,"{'longitude': 0.7121671, 'latitude': 51.5350065}",,4626.200132,False,"{'dataSource': None, 'extractDate': '0001-01-0...","[{'rel': 'self', 'href': 'https://api.ratings...."
7,646ff9e34922150fc43a057a,155648,0,EH/00006058,Golden Palace,Takeaway/sandwich shop,7844,7 London Road,Rayleigh,Essex,...,http://www.rochford.gov.uk,customerservices@rochford.gov.uk,"{'Hygiene': 20, 'Structural': 15, 'ConfidenceI...",FHRS,"{'longitude': 0.602364, 'latitude': 51.591515}",,4632.27689,False,"{'dataSource': None, 'extractDate': '0001-01-0...","[{'rel': 'self', 'href': 'http://api.ratings.f..."
8,646ff9e34922150fc43a09bf,1012883,0,17/00110/MIXED/S,The Tulip Tree,Restaurant/Cafe/Canteen,1,3 The Village,Chiddingstone,KENT,...,http://www.sevenoaks.gov.uk/,environmental.health@sevenoaks.gov.uk,"{'Hygiene': 20, 'Structural': 5, 'ConfidenceIn...",FHRS,"{'longitude': 0.146449998021126, 'latitude': 5...",,4633.934041,False,"{'dataSource': None, 'extractDate': '0001-01-0...","[{'rel': 'self', 'href': 'http://api.ratings.f..."
9,646ff9e34922150fc43a11cc,644109,0,41811,F & S,Retailers - other,4613,,81 Southernhay,Basildon,...,http://www.basildon.gov.uk,ehs@basildon.gov.uk,"{'Hygiene': 20, 'Structural': 20, 'ConfidenceI...",FHRS,"{'longitude': 0.462307, 'latitude': 51.57005}",,4636.552523,False,"{'dataSource': None, 'extractDate': '0001-01-0...","[{'rel': 'self', 'href': 'http://api.ratings.f..."


### 2. Which establishments in London have a `RatingValue` greater than or equal to 4?

In [285]:
# Find the establishments with London as the Local Authority and has a RatingValue greater than or equal to 4.

query = {'LocalAuthorityName' : {'$regex' : 'London'}, 'RatingValue' : {'$gte' : '4'}}

projection = {'BusinessName': 1, '_id' : 0}

results = establishments.find(query, projection)
# Use count_documents to display the number of documents in the result

# print("Number of records in result:", establishments.count_documents(query))
for row in results:
    pprint(row)


{'BusinessName': "Charlie's"}
{'BusinessName': 'Mv City Cruises Erasmus'}
{'BusinessName': 'Benfleet Motor Yacht Club'}
{'BusinessName': 'Tilbury Seafarers Centre'}
{'BusinessName': 'Coombs Catering t/a The Lock and Key'}
{'BusinessName': 'Mv Valulla'}
{'BusinessName': 'Tereza Joanne'}
{'BusinessName': 'Froottree'}
{'BusinessName': 'Brick Lane Brews'}
{'BusinessName': 'The Nuance Group (UK) Limited'}
{'BusinessName': 'WH Smith'}
{'BusinessName': 'City Bar & Grill'}
{'BusinessName': 'Caffè Nero'}
{'BusinessName': 'Jet Centre'}
{'BusinessName': 'Mv Sunborn Yacht Hotel'}
{'BusinessName': 'Good Hotel London'}
{'BusinessName': 'La Nonna lina'}
{'BusinessName': 'Wake Up Docklands Limited'}
{'BusinessName': 'MV Venus Clipper'}
{'BusinessName': 'MV Typhoon clipper'}
{'BusinessName': 'MV Moon clipper'}
{'BusinessName': 'MV Jupiter clipper'}
{'BusinessName': 'MV Monsoon clipper'}
{'BusinessName': 'MV Meteor clipper'}
{'BusinessName': 'MV Tornado clipper'}
{'BusinessName': 'MV Cyclone clipper'}
{

In [281]:
# Display the first document in the results using pprint

pprint(establishments.find_one(query))

{'AddressLine1': 'Oak Apple Farm Building 103 Sheernes Docks',
 'AddressLine2': 'Sheppy Kent',
 'AddressLine3': '',
 'AddressLine4': '',
 'BusinessName': "Charlie's",
 'BusinessType': 'Other catering premises',
 'BusinessTypeID': 7841,
 'ChangesByServerID': 0,
 'Distance': 4627.439467780196,
 'FHRSID': 621707,
 'LocalAuthorityBusinessID': 'PI/000025307',
 'LocalAuthorityCode': '508',
 'LocalAuthorityEmailAddress': 'publicprotection@cityoflondon.gov.uk',
 'LocalAuthorityName': 'City of London Corporation',
 'LocalAuthorityWebSite': 'http://www.cityoflondon.gov.uk/Corporation/homepage.htm',
 'NewRatingPending': False,
 'Phone': '',
 'PostCode': 'ME12',
 'RatingDate': '2021-10-18T00:00:00',
 'RatingKey': 'fhrs_4_en-gb',
 'RatingValue': '4',
 'RightToReply': '',
 'SchemeType': 'FHRS',
 '_id': ObjectId('646ff9e34922150fc439f624'),
 'geocode': {'latitude': 51.369321, 'longitude': 0.508551},
 'links': [{'href': 'https://api.ratings.food.gov.uk/establishments/621707',
            'rel': 'self'

In [286]:
# Check that the new restaurant was inserted
query = establishments.count_documents({'BusinessName' : 'Coombs Catering t/a The Lock and Keys'})

query

0

In [287]:
# Convert the result to a Pandas DataFrame

London = establishments.find(query)
London_rating_4plus_df = pd.DataFrame(London)


# Display the number of rows in the DataFrame

print("Rows in DataFrame: ", len(London_rating_4plus_df))


TypeError: filter must be an instance of dict, bson.son.SON, or any other type that inherits from collections.Mapping

In [None]:
# Display the first 10 rows of the DataFrame

London_rating_4plus_df.head(10)


### 3. What are the top 5 establishments with a `RatingValue` rating value of '5', sorted by lowest hygiene score, nearest to the new restaurant added, "Penang Flavours"?

In [None]:
# Search within 0.01 degree on either side of the latitude and longitude.
# Rating value must equal 5
# Sort by hygiene score
# distance for search range defined


degree_search = 0.01
latitude = 51.369321
longitude = 0.08384


query = { 
    'geocode.latitude' : {'$gte' : latitude - degree_search, '$lte' : latitude + degree_search}, 
    'geocode.longitude' : {'$gte' : longitude - degree_search, '$lte' : longitude + degree_search}, 
    'RatingValue' : '5'
    }
sort = [('scores.Hygiene', 1)] 
limit = 5


nearby_restuarants = list(establishments.find(query).sort(sort).limit(limit))

# Pretty print the results
pprint(nearby_restuarants)

[{'AddressLine1': '2 - 3 Crescent Way',
  'AddressLine2': 'Orpington',
  'AddressLine3': '',
  'AddressLine4': '',
  'BusinessName': 'Co-op',
  'BusinessType': 'Retailers - supermarkets/hypermarkets',
  'BusinessTypeID': 7840,
  'ChangesByServerID': 0,
  'Distance': 4642.473269874587,
  'FHRSID': 357720,
  'LocalAuthorityBusinessID': '00000/0001/0/630',
  'LocalAuthorityCode': '505',
  'LocalAuthorityEmailAddress': 'food@bromley.gov.uk',
  'LocalAuthorityName': 'Bromley',
  'LocalAuthorityWebSite': 'http://www.bromley.gov.uk',
  'NewRatingPending': False,
  'Phone': '',
  'PostCode': 'BR6 9LP',
  'RatingDate': '2018-12-05T00:00:00',
  'RatingKey': 'fhrs_5_en-gb',
  'RatingValue': '5',
  'RightToReply': '',
  'SchemeType': 'FHRS',
  '_id': ObjectId('646ff9e44922150fc43a1fcc'),
  'geocode': {'latitude': 51.360803, 'longitude': 0.088136},
  'links': [{'href': 'http://api.ratings.food.gov.uk/establishments/357720',
             'rel': 'self'}],
  'meta': {'dataSource': None,
           'ex

In [None]:
# Convert result to Pandas DataFrame

nearby_restuarants_df = pd.DataFrame(nearby_restuarants)

print("Rows in DataFrame: ", len(nearby_restuarants_df))


# Display the number of rows in the DataFrame?

nearby_restuarants_df.head()


Rows in DataFrame:  5


Unnamed: 0,_id,FHRSID,ChangesByServerID,LocalAuthorityBusinessID,BusinessName,BusinessType,BusinessTypeID,AddressLine1,AddressLine2,AddressLine3,...,LocalAuthorityWebSite,LocalAuthorityEmailAddress,scores,SchemeType,geocode,RightToReply,Distance,NewRatingPending,meta,links
0,646ff9e44922150fc43a1fcc,357720,0,00000/0001/0/630,Co-op,Retailers - supermarkets/hypermarkets,7840,2 - 3 Crescent Way,Orpington,,...,http://www.bromley.gov.uk,food@bromley.gov.uk,"{'Hygiene': 0, 'Structural': 5, 'ConfidenceInM...",FHRS,"{'longitude': 0.088136, 'latitude': 51.360803}",,4642.47327,False,"{'dataSource': None, 'extractDate': '0001-01-0...","[{'rel': 'self', 'href': 'http://api.ratings.f..."
1,646ff9e44922150fc43a1fd1,357724,0,00000/0001/0/638,Porters Produce,Retailers - other,4613,9 Crescent Way,Orpington,,...,http://www.bromley.gov.uk,food@bromley.gov.uk,"{'Hygiene': 0, 'Structural': 5, 'ConfidenceInM...",FHRS,"{'longitude': 0.088136, 'latitude': 51.360803}",,4642.47327,False,"{'dataSource': None, 'extractDate': '0001-01-0...","[{'rel': 'self', 'href': 'http://api.ratings.f..."
2,646ff9e44922150fc43a1fdd,554943,0,04/00122/MIXED,Holy Innocents Catholic Church,Other catering premises,7841,Holy Innocents Presbytery,Strickland Way,Orpington,...,http://www.bromley.gov.uk,food@bromley.gov.uk,"{'Hygiene': 0, 'Structural': 0, 'ConfidenceInM...",FHRS,"{'longitude': 0.091066, 'latitude': 51.364249}",,4642.492258,False,"{'dataSource': None, 'extractDate': '0001-01-0...","[{'rel': 'self', 'href': 'http://api.ratings.f..."
3,646ff9e44922150fc43a1f9d,358298,0,04/00154/MIXED,St Christopher's Bromley,Caring Premises,5,Caritas House,Tregony Road,Orpington,...,http://www.bromley.gov.uk,food@bromley.gov.uk,"{'Hygiene': 0, 'Structural': 5, 'ConfidenceInM...",FHRS,"{'longitude': 0.093466, 'latitude': 51.364269}",,4642.405194,False,"{'dataSource': None, 'extractDate': '0001-01-0...","[{'rel': 'self', 'href': 'http://api.ratings.f..."
4,646ff9e44922150fc43a1fce,357723,0,00000/0001/0/635,"Tams Pizza, Food & Wine",Retailers - other,4613,7 Crescent Way,Orpington,,...,http://www.bromley.gov.uk,food@bromley.gov.uk,"{'Hygiene': 0, 'Structural': 5, 'ConfidenceInM...",FHRS,"{'longitude': 0.088136, 'latitude': 51.360803}",,4642.47327,False,"{'dataSource': None, 'extractDate': '0001-01-0...","[{'rel': 'self', 'href': 'http://api.ratings.f..."


### 4. How many establishments in each Local Authority area have a hygiene score of 0?

In [None]:
# Create a pipeline that: 
# 1. Matches establishments with a hygiene score of 0
match_query = {'$match': {'scores.Hygiene': 0}}

# 2. Groups the matches by Local Authority
group_query = {'$group': {'_id' : '$LocalAuthorityName', 
                          'count': { '$sum': 1 }}}

# 3. Sorts the matches from highest to lowest
sort_values = {'$sort': { 'count': -1, '_id': 1 }}

# Print the number of documents in the result
pipeline = [match_query, group_query, sort_values]

hygenic_establishments = list(establishments.aggregate(pipeline))

# Print the first 10 results
print("Number of establishments in results: ", len(hygenic_establishments))

pprint(hygenic_establishments[0:10])

Number of establishments in results:  55
[{'_id': 'Thanet', 'count': 1130},
 {'_id': 'Greenwich', 'count': 882},
 {'_id': 'Maidstone', 'count': 713},
 {'_id': 'Newham', 'count': 711},
 {'_id': 'Swale', 'count': 686},
 {'_id': 'Chelmsford', 'count': 680},
 {'_id': 'Medway', 'count': 672},
 {'_id': 'Bexley', 'count': 607},
 {'_id': 'Southend-On-Sea', 'count': 586},
 {'_id': 'Tendring', 'count': 542}]


In [None]:
# Convert the result to a Pandas DataFrame
hygenic_establishments_df = pd.DataFrame(hygenic_establishments)


# Display the number of rows in the DataFrame
print("Rows in DataFrame: ", len(hygenic_establishments_df))




Rows in DataFrame:  55


In [None]:
# Display the first 10 rows of the DataFrame
hygenic_establishments_df.head(10)

Unnamed: 0,_id,count
0,Thanet,1130
1,Greenwich,882
2,Maidstone,713
3,Newham,711
4,Swale,686
5,Chelmsford,680
6,Medway,672
7,Bexley,607
8,Southend-On-Sea,586
9,Tendring,542
