# Eat Safe, Love

## Notebook Set Up

### MW - Dataset imported with `mongoimport --type json -d uk_food -c est --drop --jsonArray establishments.json'

In [1]:
## MW
# Dataset imported with `mongoimport --type json -d uk_food -c est --drop --jsonArray establishments.json'

In [2]:
# Import dependencies
from pymongo import MongoClient
from pprint import pprint

## MW - import pandas for dataframe & matplotlib for charting
import pandas as pd
import matplotlib as plt

In [3]:
# Create an instance of MongoClient
mongo = MongoClient(port=27017)


In [4]:
# assign the uk_food database to a variable name
ukfd_db = mongo['uk_food']


In [5]:
# review the collections in our database
print(ukfd_db.list_collection_names())


['est', 'establishments']


In [6]:
# assign the collection to a variable
est_p2 = ukfd_db['est']

In [7]:
## MW print one document for reference
est_p2.find_one()

{'_id': ObjectId('64e09b3b656c004597010051'),
 'FHRSID': 254250,
 'ChangesByServerID': 0,
 'LocalAuthorityBusinessID': 'PI/000066174',
 'BusinessName': 'The Pines Calyx',
 'BusinessType': 'Other catering premises',
 'BusinessTypeID': 7841,
 'AddressLine1': 'The Pines Garden',
 'AddressLine2': 'Beach Road',
 'AddressLine3': 'St Margarets Bay',
 'AddressLine4': 'Kent',
 'PostCode': 'CT15 6DZ',
 'Phone': '',
 'RatingValue': '5',
 'RatingKey': 'fhrs_5_en-gb',
 'RatingDate': '2021-08-17T00:00:00',
 'LocalAuthorityCode': '182',
 'LocalAuthorityName': 'Dover',
 'LocalAuthorityWebSite': 'http://www.dover.gov.uk/',
 'LocalAuthorityEmailAddress': 'publicprotection@dover.gov.uk',
 'scores': {'Hygiene': 0, 'Structural': 0, 'ConfidenceInManagement': 0},
 'SchemeType': 'FHRS',
 'geocode': {'longitude': Decimal128('1.383298'),
  'latitude': Decimal128('51.148133')},
 'RightToReply': '',
 'Distance': 4587.362402580997,
 'NewRatingPending': False,
 'meta': {'dataSource': None,
  'extractDate': '0001-01

## Part 3: Exploratory Analysis
Unless otherwise stated, for each question: 
* Use `count_documents` to display the number of documents contained in the result.
* Display the first document in the results using `pprint`.
* Convert the result to a Pandas DataFrame, print the number of rows in the DataFrame, and display the first 10 rows.

### 1. Which establishments have a hygiene score equal to 20?

In [8]:
# Find the establishments with a hygiene score of 20
hyg_query = {'scores.Hygiene': {'$eq':20}}
hyg_qry1 = list(est_p2.find(hyg_query))

# Use count_documents to display the number of documents in the result
hyg_qry1_count = est_p2.count_documents(hyg_query)
hyg_qry1_count

41

In [9]:
# Display the first document in the results using pprint
pprint(hyg_qry1[0:1])

[{'AddressLine1': '5-6 Southfields Road',
  'AddressLine2': 'Eastbourne',
  'AddressLine3': 'East Sussex',
  'AddressLine4': '',
  'BusinessName': 'The Chase Rest Home',
  'BusinessType': 'Caring Premises',
  'BusinessTypeID': 5,
  'ChangesByServerID': 0,
  'Distance': 4613.888288172291,
  'FHRSID': 110681,
  'LocalAuthorityBusinessID': '4029',
  'LocalAuthorityCode': '102',
  'LocalAuthorityEmailAddress': 'Customerfirst@eastbourne.gov.uk',
  'LocalAuthorityName': 'Eastbourne',
  'LocalAuthorityWebSite': 'http://www.eastbourne.gov.uk/foodratings',
  'NewRatingPending': False,
  'Phone': '',
  'PostCode': 'BN21 1BU',
  'RatingDate': '2021-09-23T00:00:00',
  'RatingKey': 'fhrs_0_en-gb',
  'RatingValue': '0',
  'RightToReply': '',
  'SchemeType': 'FHRS',
  '_id': ObjectId('64e09b3e656c004597011e69'),
  'geocode': {'latitude': Decimal128('50.769705'),
              'longitude': Decimal128('0.27694')},
  'links': [{'href': 'https://api.ratings.food.gov.uk/establishments/110681',
           

In [10]:
# Convert the result to a Pandas DataFrame
hyg_df = pd.DataFrame(hyg_qry1)

# Display the number of rows in the DataFrame
print("No. of rows in dataframe ('hyg_df'):", len(hyg_df))

# Display the first 10 rows of the DataFrame
hyg_df.head(10)

No. of rows in dataframe ('hyg_df'): 41


Unnamed: 0,_id,FHRSID,ChangesByServerID,LocalAuthorityBusinessID,BusinessName,BusinessType,BusinessTypeID,AddressLine1,AddressLine2,AddressLine3,...,LocalAuthorityWebSite,LocalAuthorityEmailAddress,scores,SchemeType,geocode,RightToReply,Distance,NewRatingPending,meta,links
0,64e09b3e656c004597011e69,110681,0,4029,The Chase Rest Home,Caring Premises,5,5-6 Southfields Road,Eastbourne,East Sussex,...,http://www.eastbourne.gov.uk/foodratings,Customerfirst@eastbourne.gov.uk,"{'Hygiene': 20, 'Structural': 20, 'ConfidenceI...",FHRS,"{'longitude': 0.27694, 'latitude': 50.769705}",,4613.888288,False,"{'dataSource': None, 'extractDate': '0001-01-0...","[{'rel': 'self', 'href': 'https://api.ratings...."
1,64e09b3e656c0045970121ea,612039,0,1970/FOOD,Brenalwood,Caring Premises,5,Hall Lane,Walton-on-the-Naze,Essex,...,http://www.tendringdc.gov.uk/,fhsadmin@tendringdc.gov.uk,"{'Hygiene': 20, 'Structural': 15, 'ConfidenceI...",FHRS,"{'longitude': 1.278721, 'latitude': 51.857536}",,4617.965824,False,"{'dataSource': None, 'extractDate': '0001-01-0...","[{'rel': 'self', 'href': 'https://api.ratings...."
2,64e09b3e656c0045970124fe,730933,0,1698/FOOD,Melrose Hotel,Hotel/bed & breakfast/guest house,7842,53 Marine Parade East,Clacton On Sea,Essex,...,http://www.tendringdc.gov.uk/,fhsadmin@tendringdc.gov.uk,"{'Hygiene': 20, 'Structural': 20, 'ConfidenceI...",FHRS,"{'longitude': 1.15927, 'latitude': 51.789429}",,4619.656144,False,"{'dataSource': None, 'extractDate': '0001-01-0...","[{'rel': 'self', 'href': 'https://api.ratings...."
3,64e09b3e656c0045970126e2,172735,0,PI/000023858,Seaford Pizza,Takeaway/sandwich shop,7844,4 High Street,Seaford,East Sussex,...,http://www.lewes-eastbourne.gov.uk/,ehealth.ldc@lewes-eastbourne.gov.uk,"{'Hygiene': 20, 'Structural': 10, 'ConfidenceI...",FHRS,"{'longitude': 0.10202, 'latitude': 50.770885}",,4620.421725,False,"{'dataSource': None, 'extractDate': '0001-01-0...","[{'rel': 'self', 'href': 'https://api.ratings...."
4,64e09b3e656c0045970126f2,172953,0,PI/000024532,Golden Palace,Restaurant/Cafe/Canteen,1,5 South Street,Seaford,East Sussex,...,http://www.lewes-eastbourne.gov.uk/,ehealth.ldc@lewes-eastbourne.gov.uk,"{'Hygiene': 20, 'Structural': 10, 'ConfidenceI...",FHRS,"{'longitude': 0.101446, 'latitude': 50.770724}",,4620.437179,False,"{'dataSource': None, 'extractDate': '0001-01-0...","[{'rel': 'self', 'href': 'https://api.ratings...."
5,64e09b40656c004597013090,512854,0,12/00816/BUTH,Ashby's Butchers,Retailers - other,4613,777 Southchurch Road,Southend-On-Sea,Essex,...,http://www.southend.gov.uk,EnvironmentalHealth@southend.gov.uk,"{'Hygiene': 20, 'Structural': 20, 'ConfidenceI...",FHRS,"{'longitude': 0.736349, 'latitude': 51.541448}",,4625.565258,False,"{'dataSource': None, 'extractDate': '0001-01-0...","[{'rel': 'self', 'href': 'https://api.ratings...."
6,64e09b40656c0045970132af,1537089,0,22/00224/RESTUN,South Sea Express Cuisine,Restaurant/Cafe/Canteen,1,33 Alexandra Street,Southend-on-sea,Essex,...,http://www.southend.gov.uk,EnvironmentalHealth@southend.gov.uk,"{'Hygiene': 20, 'Structural': 20, 'ConfidenceI...",FHRS,"{'longitude': 0.7121671, 'latitude': 51.5350065}",,4626.200132,False,"{'dataSource': None, 'extractDate': '0001-01-0...","[{'rel': 'self', 'href': 'https://api.ratings...."
7,64e09b42656c0045970147dc,155648,0,EH/00006058,Golden Palace,Takeaway/sandwich shop,7844,7 London Road,Rayleigh,Essex,...,http://www.rochford.gov.uk,customerservices@rochford.gov.uk,"{'Hygiene': 20, 'Structural': 15, 'ConfidenceI...",FHRS,"{'longitude': 0.602364, 'latitude': 51.591515}",,4632.27689,False,"{'dataSource': None, 'extractDate': '0001-01-0...","[{'rel': 'self', 'href': 'http://api.ratings.f..."
8,64e09b43656c004597014c20,1012883,0,17/00110/MIXED/S,The Tulip Tree,Restaurant/Cafe/Canteen,1,3 The Village,Chiddingstone,KENT,...,http://www.sevenoaks.gov.uk/,environmental.health@sevenoaks.gov.uk,"{'Hygiene': 20, 'Structural': 5, 'ConfidenceIn...",FHRS,"{'longitude': 0.146449998021126, 'latitude': 5...",,4633.934041,False,"{'dataSource': None, 'extractDate': '0001-01-0...","[{'rel': 'self', 'href': 'http://api.ratings.f..."
9,64e09b43656c004597015433,644109,0,41811,F & S,Retailers - other,4613,,81 Southernhay,Basildon,...,http://www.basildon.gov.uk,ehs@basildon.gov.uk,"{'Hygiene': 20, 'Structural': 20, 'ConfidenceI...",FHRS,"{'longitude': 0.462307, 'latitude': 51.57005}",,4636.552523,False,"{'dataSource': None, 'extractDate': '0001-01-0...","[{'rel': 'self', 'href': 'http://api.ratings.f..."


### 2. Which establishments in London have a `RatingValue` greater than or equal to 4

### MW - Wow what a brain teaser this one was!  I had to perform lots of checks before being able to answer the question.  I have left these in my project for later reference.  

In [11]:
## MW - Checking for establishments with Local Authority = London.  Results!
la_query = {'LocalAuthorityName':{'$regex':'London'}}
la_query_count =est_p2.count_documents(la_query)
print(la_query_count)

37


In [12]:
## MW - Checking for establishments with RatingValue => 4.  Oh what a horror.  
## MW - Down the rabbit hole I went.  But not alone!!!  Oh no, I took AskBCS with me.   
## MW - Step 1 - check values of RatingValue field. 
check = est_p2.find({},{'RatingValue':1})

for i in check:
    pprint(i)

{'RatingValue': '5', '_id': ObjectId('64e09b3b656c004597010051')}
{'RatingValue': '5', '_id': ObjectId('64e09b3b656c004597010052')}
{'RatingValue': '5', '_id': ObjectId('64e09b3b656c004597010053')}
{'RatingValue': '5', '_id': ObjectId('64e09b3b656c004597010054')}
{'RatingValue': '5', '_id': ObjectId('64e09b3b656c004597010055')}
{'RatingValue': '5', '_id': ObjectId('64e09b3b656c004597010056')}
{'RatingValue': '5', '_id': ObjectId('64e09b3b656c004597010057')}
{'RatingValue': '5', '_id': ObjectId('64e09b3b656c004597010058')}
{'RatingValue': '5', '_id': ObjectId('64e09b3b656c004597010059')}
{'RatingValue': '5', '_id': ObjectId('64e09b3b656c00459701005a')}
{'RatingValue': '5', '_id': ObjectId('64e09b3b656c00459701005b')}
{'RatingValue': '5', '_id': ObjectId('64e09b3b656c00459701005c')}
{'RatingValue': '5', '_id': ObjectId('64e09b3b656c00459701005d')}
{'RatingValue': '5', '_id': ObjectId('64e09b3b656c00459701005e')}
{'RatingValue': '4', '_id': ObjectId('64e09b3b656c00459701005f')}
{'RatingVa

{'RatingValue': '5', '_id': ObjectId('64e09b3e656c004597011ec6')}
{'RatingValue': '5', '_id': ObjectId('64e09b3e656c004597011ec7')}
{'RatingValue': '5', '_id': ObjectId('64e09b3e656c004597011ec8')}
{'RatingValue': '5', '_id': ObjectId('64e09b3e656c004597011ec9')}
{'RatingValue': '5', '_id': ObjectId('64e09b3e656c004597011eca')}
{'RatingValue': '5', '_id': ObjectId('64e09b3e656c004597011ecb')}
{'RatingValue': '5', '_id': ObjectId('64e09b3e656c004597011ecc')}
{'RatingValue': '4', '_id': ObjectId('64e09b3e656c004597011ecd')}
{'RatingValue': '5', '_id': ObjectId('64e09b3e656c004597011ece')}
{'RatingValue': '5', '_id': ObjectId('64e09b3e656c004597011ecf')}
{'RatingValue': '5', '_id': ObjectId('64e09b3e656c004597011ed0')}
{'RatingValue': '5', '_id': ObjectId('64e09b3e656c004597011ed1')}
{'RatingValue': '5', '_id': ObjectId('64e09b3e656c004597011ed2')}
{'RatingValue': '5', '_id': ObjectId('64e09b3e656c004597011ed3')}
{'RatingValue': '5', '_id': ObjectId('64e09b3e656c004597011ed4')}
{'RatingVa

{'RatingValue': '5', '_id': ObjectId('64e09b41656c00459701390d')}
{'RatingValue': '5', '_id': ObjectId('64e09b41656c00459701390e')}
{'RatingValue': 'Exempt', '_id': ObjectId('64e09b41656c00459701390f')}
{'RatingValue': '5', '_id': ObjectId('64e09b41656c004597013910')}
{'RatingValue': 'Exempt', '_id': ObjectId('64e09b41656c004597013911')}
{'RatingValue': '5', '_id': ObjectId('64e09b41656c004597013912')}
{'RatingValue': '5', '_id': ObjectId('64e09b41656c004597013913')}
{'RatingValue': '5', '_id': ObjectId('64e09b41656c004597013914')}
{'RatingValue': 'Exempt', '_id': ObjectId('64e09b41656c004597013915')}
{'RatingValue': '5', '_id': ObjectId('64e09b41656c004597013916')}
{'RatingValue': '5', '_id': ObjectId('64e09b41656c004597013917')}
{'RatingValue': '5', '_id': ObjectId('64e09b41656c004597013918')}
{'RatingValue': '5', '_id': ObjectId('64e09b41656c004597013919')}
{'RatingValue': '5', '_id': ObjectId('64e09b41656c00459701391a')}
{'RatingValue': 'AwaitingInspection',
 '_id': ObjectId('64e09

{'RatingValue': 'Exempt', '_id': ObjectId('64e09b43656c004597014c77')}
{'RatingValue': '5', '_id': ObjectId('64e09b43656c004597014c78')}
{'RatingValue': '5', '_id': ObjectId('64e09b43656c004597014c79')}
{'RatingValue': '5', '_id': ObjectId('64e09b43656c004597014c7a')}
{'RatingValue': '5', '_id': ObjectId('64e09b43656c004597014c7b')}
{'RatingValue': '5', '_id': ObjectId('64e09b43656c004597014c7c')}
{'RatingValue': '5', '_id': ObjectId('64e09b43656c004597014c7d')}
{'RatingValue': '5', '_id': ObjectId('64e09b43656c004597014c7e')}
{'RatingValue': '5', '_id': ObjectId('64e09b43656c004597014c7f')}
{'RatingValue': '5', '_id': ObjectId('64e09b43656c004597014c80')}
{'RatingValue': '5', '_id': ObjectId('64e09b43656c004597014c81')}
{'RatingValue': '5', '_id': ObjectId('64e09b43656c004597014c82')}
{'RatingValue': '5', '_id': ObjectId('64e09b43656c004597014c83')}
{'RatingValue': '5', '_id': ObjectId('64e09b43656c004597014c84')}
{'RatingValue': '4', '_id': ObjectId('64e09b43656c004597014c85')}
{'Rat

{'RatingValue': 'Exempt', '_id': ObjectId('64e09b45656c004597016c95')}
{'RatingValue': 'Exempt', '_id': ObjectId('64e09b45656c004597016c96')}
{'RatingValue': '5', '_id': ObjectId('64e09b45656c004597016c97')}
{'RatingValue': '5', '_id': ObjectId('64e09b45656c004597016c98')}
{'RatingValue': '5', '_id': ObjectId('64e09b45656c004597016c99')}
{'RatingValue': '3', '_id': ObjectId('64e09b45656c004597016c9a')}
{'RatingValue': '5', '_id': ObjectId('64e09b45656c004597016c9b')}
{'RatingValue': '5', '_id': ObjectId('64e09b45656c004597016c9c')}
{'RatingValue': '4', '_id': ObjectId('64e09b45656c004597016c9d')}
{'RatingValue': '5', '_id': ObjectId('64e09b45656c004597016c9e')}
{'RatingValue': '5', '_id': ObjectId('64e09b45656c004597016c9f')}
{'RatingValue': '5', '_id': ObjectId('64e09b45656c004597016ca0')}
{'RatingValue': '5', '_id': ObjectId('64e09b45656c004597016ca1')}
{'RatingValue': '4', '_id': ObjectId('64e09b45656c004597016ca2')}
{'RatingValue': '5', '_id': ObjectId('64e09b45656c004597016ca3')}


{'RatingValue': '3', '_id': ObjectId('64e09b49656c004597018a6c')}
{'RatingValue': '5', '_id': ObjectId('64e09b49656c004597018a6d')}
{'RatingValue': '3', '_id': ObjectId('64e09b49656c004597018a6e')}
{'RatingValue': '4', '_id': ObjectId('64e09b49656c004597018a6f')}
{'RatingValue': '5', '_id': ObjectId('64e09b49656c004597018a70')}
{'RatingValue': '5', '_id': ObjectId('64e09b49656c004597018a71')}
{'RatingValue': '3', '_id': ObjectId('64e09b49656c004597018a72')}
{'RatingValue': '5', '_id': ObjectId('64e09b49656c004597018a73')}
{'RatingValue': 'AwaitingInspection',
 '_id': ObjectId('64e09b49656c004597018a74')}
{'RatingValue': '5', '_id': ObjectId('64e09b49656c004597018a75')}
{'RatingValue': '3', '_id': ObjectId('64e09b49656c004597018a76')}
{'RatingValue': 'AwaitingInspection',
 '_id': ObjectId('64e09b49656c004597018a77')}
{'RatingValue': '2', '_id': ObjectId('64e09b49656c004597018a78')}
{'RatingValue': '5', '_id': ObjectId('64e09b49656c004597018a79')}
{'RatingValue': '1', '_id': ObjectId('64

In [13]:
## MW - Step 2 - Results, after hours of trying to filter out 'AwaitingInspection... 
## MW - and trying to convert string to integer and then filter again on values greater than 4... 
## MW - What did I learn? I learned that That mongoDB's documentation is very confusing...
## MW - And that YES! mongoDB can perform filters on numbers stored as strings...
## MW - That's not best practice though.  Better to clean and transform, but you know - half a day wasted already on attempting to do just that.
rt_query = {'RatingValue': {'$gte':'4'}}
rt_query_count =est_p2.count_documents(rt_query)
print(rt_query_count)

36292


In [14]:
# Find the establishments with London as the Local Authority and has a RatingValue greater than or equal to 4.
## MW - So here I am, finally returned to the project questions.  
la_rt_query1 = {
    'LocalAuthorityName': {'$regex': 'London'},
    'RatingValue': {'$not' : {'$regex':'AwaitingInspection'}},
    'RatingValue':{'$gte':'4'}
    }
la_rt_query1_res = est_p2.find(la_rt_query1)  


In [15]:
# Use count_documents to display the number of documents in the result
la_rt_query1_count =est_p2.count_documents(la_rt_query1)
print(la_rt_query1_count)

34


In [16]:
# Convert the result to a Pandas DataFrame
la_rt_df = pd.DataFrame(la_rt_query1_res)

# Display the number of rows in the DataFrame
print("Rows in datafram ('la_rt_df'):", len(la_rt_df))

# Display the first 10 rows of the DataFrame
la_rt_df.head(10)

Rows in datafram ('la_rt_df'): 34


Unnamed: 0,_id,FHRSID,ChangesByServerID,LocalAuthorityBusinessID,BusinessName,BusinessType,BusinessTypeID,AddressLine1,AddressLine2,AddressLine3,...,LocalAuthorityWebSite,LocalAuthorityEmailAddress,scores,SchemeType,geocode,RightToReply,Distance,NewRatingPending,meta,links
0,64e09b41656c004597013882,621707,0,PI/000025307,Charlie's,Other catering premises,7841,Oak Apple Farm Building 103 Sheernes Docks,Sheppy Kent,,...,http://www.cityoflondon.gov.uk/Corporation/hom...,publicprotection@cityoflondon.gov.uk,"{'Hygiene': 5, 'Structural': 10, 'ConfidenceIn...",FHRS,"{'longitude': 0.508551, 'latitude': 51.369321}",,4627.439468,False,"{'dataSource': None, 'extractDate': '0001-01-0...","[{'rel': 'self', 'href': 'https://api.ratings...."
1,64e09b42656c004597013ba8,1130836,0,PI/000034075,Mv City Cruises Erasmus,Other catering premises,7841,Cherry Garden Pier,Cherry Garden Street Rotherhithe,Charlton,...,http://www.cityoflondon.gov.uk/Corporation/hom...,publicprotection@cityoflondon.gov.uk,"{'Hygiene': 0, 'Structural': 5, 'ConfidenceInM...",FHRS,"{'longitude': 0.249255999922752, 'latitude': 5...",,4627.873179,False,"{'dataSource': None, 'extractDate': '0001-01-0...","[{'rel': 'self', 'href': 'http://api.ratings.f..."
2,64e09b42656c0045970146f7,293783,0,PI/000002614,Benfleet Motor Yacht Club,Other catering premises,7841,Ferry Road,South Benfleet Essex,,...,http://www.cityoflondon.gov.uk/Corporation/hom...,publicprotection@cityoflondon.gov.uk,"{'Hygiene': 0, 'Structural': 0, 'ConfidenceInM...",FHRS,"{'longitude': 0.561954, 'latitude': 51.543831}",,4631.968418,False,"{'dataSource': None, 'extractDate': '0001-01-0...","[{'rel': 'self', 'href': 'http://api.ratings.f..."
3,64e09b43656c0045970154f6,1315095,0,PI/000036464,Coombs Catering t/a The Lock and Key,Restaurant/Cafe/Canteen,1,Leslie Ford House,Tilbury,Charlton,...,http://www.cityoflondon.gov.uk/Corporation/hom...,publicprotection@cityoflondon.gov.uk,"{'Hygiene': 0, 'Structural': 5, 'ConfidenceInM...",FHRS,"{'longitude': 0.346336990594864, 'latitude': 5...",,4636.846754,False,"{'dataSource': None, 'extractDate': '0001-01-0...","[{'rel': 'self', 'href': 'http://api.ratings.f..."
4,64e09b43656c0045970154f7,294474,0,PI/000014647,Tilbury Seafarers Centre,Restaurant/Cafe/Canteen,1,Tenants Row Tilbury Docks,Tilbury Essex,,...,http://www.cityoflondon.gov.uk/Corporation/hom...,publicprotection@cityoflondon.gov.uk,"{'Hygiene': 0, 'Structural': 0, 'ConfidenceInM...",FHRS,"{'longitude': 0.346325, 'latitude': 51.464078}",,4636.84765,False,"{'dataSource': None, 'extractDate': '0001-01-0...","[{'rel': 'self', 'href': 'http://api.ratings.f..."
5,64e09b44656c004597015c01,294900,0,PI/000019066,Mv Valulla,Other catering premises,7841,Reeds River Cruises LtdKings ReachRiver Thames...,London,,...,http://www.cityoflondon.gov.uk/Corporation/hom...,publicprotection@cityoflondon.gov.uk,"{'Hygiene': 0, 'Structural': 0, 'ConfidenceInM...",FHRS,"{'longitude': 0.287555, 'latitude': 51.504071}",,4640.460834,False,"{'dataSource': None, 'extractDate': '0001-01-0...","[{'rel': 'self', 'href': 'http://api.ratings.f..."
6,64e09b48656c004597017d09,1252616,0,PI/000035653,Froottree,Other catering premises,7841,Tereza Joanne King George V Lock,Woolwich Manor Way London,Charlton,...,http://www.cityoflondon.gov.uk/Corporation/hom...,publicprotection@cityoflondon.gov.uk,"{'Hygiene': None, 'Structural': None, 'Confide...",FHRS,"{'longitude': 0.0693250000476837, 'latitude': ...",,4648.3,False,"{'dataSource': None, 'extractDate': '0001-01-0...","[{'rel': 'self', 'href': 'http://api.ratings.f..."
7,64e09b48656c004597017d0f,293756,0,PI/000002538,Tereza Joanne,Other catering premises,7841,Funcraft UK Ltd King George V Dock Woolwich Ma...,London,,...,http://www.cityoflondon.gov.uk/Corporation/hom...,publicprotection@cityoflondon.gov.uk,"{'Hygiene': 0, 'Structural': 5, 'ConfidenceInM...",FHRS,"{'longitude': 0.069286, 'latitude': 51.501121}",,4648.301822,False,"{'dataSource': None, 'extractDate': '0001-01-0...","[{'rel': 'self', 'href': 'http://api.ratings.f..."
8,64e09b48656c0045970180d5,878523,0,PI/000029844,Brick Lane Brews,Restaurant/Cafe/Canteen,1,Air side London City Airport,London,,...,http://www.cityoflondon.gov.uk/Corporation/hom...,publicprotection@cityoflondon.gov.uk,"{'Hygiene': 10, 'Structural': 5, 'ConfidenceIn...",FHRS,"{'longitude': 0.048006, 'latitude': 51.503733}",,4649.173485,False,"{'dataSource': None, 'extractDate': '0001-01-0...","[{'rel': 'self', 'href': 'http://api.ratings.f..."
9,64e09b48656c0045970180ed,293772,0,PI/000002585,The Nuance Group (UK) Limited,Retailers - other,4613,Duty Free Shop Passenger Terminal,London City AirportRoyal DocksLondon,,...,http://www.cityoflondon.gov.uk/Corporation/hom...,publicprotection@cityoflondon.gov.uk,"{'Hygiene': 0, 'Structural': 0, 'ConfidenceInM...",FHRS,"{'longitude': 0.047966, 'latitude': 51.504112}",,4649.188826,False,"{'dataSource': None, 'extractDate': '0001-01-0...","[{'rel': 'self', 'href': 'http://api.ratings.f..."


### 3. What are the top 5 establishments with a `RatingValue` rating value of '5', sorted by lowest hygiene score, nearest to the new restaurant added, "Penang Flavours"?

In [17]:
## MW - Find establishment in 'Greenwich' to determine its latitude and longitude
WheresGreenwich = est_p2.find_one({'AddressLine3' : 'Greenwich'})
pprint(WheresGreenwich)


{'AddressLine1': '827 Woolwich Road',
 'AddressLine2': '',
 'AddressLine3': 'Greenwich',
 'AddressLine4': '',
 'BusinessName': 'Millennium Cafe',
 'BusinessType': 'Restaurant/Cafe/Canteen',
 'BusinessTypeID': 1,
 'ChangesByServerID': 0,
 'Distance': 4648.880834143303,
 'FHRSID': 694956,
 'LocalAuthorityBusinessID': 'PI/000167440',
 'LocalAuthorityCode': '511',
 'LocalAuthorityEmailAddress': 'health@royalgreenwich.gov.uk',
 'LocalAuthorityName': 'Greenwich',
 'LocalAuthorityWebSite': 'http://www.royalgreenwich.gov.uk',
 'NewRatingPending': False,
 'Phone': '',
 'PostCode': 'SE7 8LJ',
 'RatingDate': '2020-07-29T00:00:00',
 'RatingKey': 'fhrs_4_en-gb',
 'RatingValue': '4',
 'RightToReply': '',
 'SchemeType': 'FHRS',
 '_id': ObjectId('64e09b48656c004597017f9c'),
 'geocode': {'latitude': Decimal128('51.4925572'),
             'longitude': Decimal128('0.0448072')},
 'links': [{'href': 'http://api.ratings.food.gov.uk/establishments/694956',
            'rel': 'self'}],
 'meta': {'dataSource':

In [18]:
# Search within 0.01 degree on either side of the latitude and longitude.
# Rating value must equal 5
# Sort by hygiene score

degree_search = 0.01
latitude = 51.4925572
longitude = 0.0448072

query = {'geocode.latitude': {'$gte': latitude-degree_search,'$lte': latitude+degree_search},
        'geocode.longitude': {'$gte': longitude-degree_search,'$lte': longitude+degree_search},
        'RatingValue':{'$eq':'5'}}

sort = [('scores.Hygiene',-1)]

fields = {'BusinessName':1, 'RatingValue':1,'scores.Hygiene':1,'geocode.latitude':1,'geocode.longitude':1}

limit = 5

# Print the results
pprint(list(est_p2.find(query, fields).sort(sort).limit(limit)))


[{'BusinessName': "CJ's Snackbar",
  'RatingValue': '5',
  '_id': ObjectId('64e09b48656c004597017dbd'),
  'geocode': {'latitude': Decimal128('51.486335182214'),
              'longitude': Decimal128('0.0490357238143205')},
  'scores': {'Hygiene': 5}},
 {'BusinessName': 'Neelas Home Ltd',
  'RatingValue': '5',
  '_id': ObjectId('64e09b48656c004597017efd'),
  'geocode': {'latitude': Decimal128('51.4933031'),
              'longitude': Decimal128('0.0505023')},
  'scores': {'Hygiene': 5}},
 {'BusinessName': 'Choice Support',
  'RatingValue': '5',
  '_id': ObjectId('64e09b48656c004597017e73'),
  'geocode': {'latitude': Decimal128('51.4906817'),
              'longitude': Decimal128('0.0502405')},
  'scores': {'Hygiene': 5}},
 {'BusinessName': 'Cardwell Primary School',
  'RatingValue': '5',
  '_id': ObjectId('64e09b48656c004597017db8'),
  'geocode': {'latitude': Decimal128('51.4907377'),
              'longitude': Decimal128('0.0535172')},
  'scores': {'Hygiene': 5}},
 {'BusinessName': '3D

In [19]:
# Convert result to Pandas DataFrame
t5est_hyg = list(est_p2.find(query, fields).sort(sort).limit(limit))
t5est_hyg_df = pd.DataFrame(t5est_hyg)
t5est_hyg_df.head()

Unnamed: 0,_id,BusinessName,RatingValue,scores,geocode
0,64e09b48656c004597017dbd,CJ's Snackbar,5,{'Hygiene': 5},"{'longitude': 0.0490357238143205, 'latitude': ..."
1,64e09b48656c004597017efd,Neelas Home Ltd,5,{'Hygiene': 5},"{'longitude': 0.0505023, 'latitude': 51.4933031}"
2,64e09b48656c004597017e73,Choice Support,5,{'Hygiene': 5},"{'longitude': 0.0502405, 'latitude': 51.4906817}"
3,64e09b48656c004597017db8,Cardwell Primary School,5,{'Hygiene': 5},"{'longitude': 0.0535172, 'latitude': 51.4907377}"
4,64e09b48656c004597017d70,3DM Wine,5,{'Hygiene': 5},"{'longitude': 0.0525002, 'latitude': 51.4880703}"


### 4. How many establishments in each Local Authority area have a hygiene score of 0?

In [20]:
## MW - check value type of scores.Hygiene field.
check = est_p2.find({},{'scores.Hygiene':1})

for i in check:
    pprint(i)

{'_id': ObjectId('64e09b3b656c004597010051'), 'scores': {'Hygiene': 0}}
{'_id': ObjectId('64e09b3b656c004597010052'), 'scores': {'Hygiene': 0}}
{'_id': ObjectId('64e09b3b656c004597010053'), 'scores': {'Hygiene': 0}}
{'_id': ObjectId('64e09b3b656c004597010054'), 'scores': {'Hygiene': 0}}
{'_id': ObjectId('64e09b3b656c004597010055'), 'scores': {'Hygiene': 0}}
{'_id': ObjectId('64e09b3b656c004597010056'), 'scores': {'Hygiene': 5}}
{'_id': ObjectId('64e09b3b656c004597010057'), 'scores': {'Hygiene': 5}}
{'_id': ObjectId('64e09b3b656c004597010058'), 'scores': {'Hygiene': 0}}
{'_id': ObjectId('64e09b3b656c004597010059'), 'scores': {'Hygiene': 0}}
{'_id': ObjectId('64e09b3b656c00459701005a'), 'scores': {'Hygiene': 0}}
{'_id': ObjectId('64e09b3b656c00459701005b'), 'scores': {'Hygiene': 5}}
{'_id': ObjectId('64e09b3b656c00459701005c'), 'scores': {'Hygiene': None}}
{'_id': ObjectId('64e09b3b656c00459701005d'), 'scores': {'Hygiene': 0}}
{'_id': ObjectId('64e09b3b656c00459701005e'), 'scores': {'Hyg

{'_id': ObjectId('64e09b3d656c0045970118b3'), 'scores': {'Hygiene': 5}}
{'_id': ObjectId('64e09b3d656c0045970118b4'), 'scores': {'Hygiene': 5}}
{'_id': ObjectId('64e09b3d656c0045970118b5'), 'scores': {'Hygiene': 5}}
{'_id': ObjectId('64e09b3d656c0045970118b6'), 'scores': {'Hygiene': 5}}
{'_id': ObjectId('64e09b3d656c0045970118b7'), 'scores': {'Hygiene': 5}}
{'_id': ObjectId('64e09b3d656c0045970118b8'), 'scores': {'Hygiene': 5}}
{'_id': ObjectId('64e09b3d656c0045970118b9'), 'scores': {'Hygiene': None}}
{'_id': ObjectId('64e09b3d656c0045970118ba'), 'scores': {'Hygiene': 5}}
{'_id': ObjectId('64e09b3d656c0045970118bb'), 'scores': {'Hygiene': 5}}
{'_id': ObjectId('64e09b3d656c0045970118bc'), 'scores': {'Hygiene': 5}}
{'_id': ObjectId('64e09b3d656c0045970118bd'), 'scores': {'Hygiene': 5}}
{'_id': ObjectId('64e09b3d656c0045970118be'), 'scores': {'Hygiene': 5}}
{'_id': ObjectId('64e09b3d656c0045970118bf'), 'scores': {'Hygiene': 5}}
{'_id': ObjectId('64e09b3d656c0045970118c0'), 'scores': {'Hyg

{'_id': ObjectId('64e09b40656c004597012be5'), 'scores': {'Hygiene': 10}}
{'_id': ObjectId('64e09b40656c004597012be6'), 'scores': {'Hygiene': 0}}
{'_id': ObjectId('64e09b40656c004597012be7'), 'scores': {'Hygiene': 10}}
{'_id': ObjectId('64e09b40656c004597012be8'), 'scores': {'Hygiene': 0}}
{'_id': ObjectId('64e09b40656c004597012be9'), 'scores': {'Hygiene': 0}}
{'_id': ObjectId('64e09b40656c004597012bea'), 'scores': {'Hygiene': 0}}
{'_id': ObjectId('64e09b40656c004597012beb'), 'scores': {'Hygiene': 5}}
{'_id': ObjectId('64e09b40656c004597012bec'), 'scores': {'Hygiene': 5}}
{'_id': ObjectId('64e09b40656c004597012bed'), 'scores': {'Hygiene': 0}}
{'_id': ObjectId('64e09b40656c004597012bee'), 'scores': {'Hygiene': None}}
{'_id': ObjectId('64e09b40656c004597012bef'), 'scores': {'Hygiene': 0}}
{'_id': ObjectId('64e09b40656c004597012bf0'), 'scores': {'Hygiene': 15}}
{'_id': ObjectId('64e09b40656c004597012bf1'), 'scores': {'Hygiene': 0}}
{'_id': ObjectId('64e09b40656c004597012bf2'), 'scores': {'

{'_id': ObjectId('64e09b42656c0045970140b3'), 'scores': {'Hygiene': 10}}
{'_id': ObjectId('64e09b42656c0045970140b4'), 'scores': {'Hygiene': 0}}
{'_id': ObjectId('64e09b42656c0045970140b5'), 'scores': {'Hygiene': 5}}
{'_id': ObjectId('64e09b42656c0045970140b6'), 'scores': {'Hygiene': 0}}
{'_id': ObjectId('64e09b42656c0045970140b7'), 'scores': {'Hygiene': 0}}
{'_id': ObjectId('64e09b42656c0045970140b8'), 'scores': {'Hygiene': 5}}
{'_id': ObjectId('64e09b42656c0045970140b9'), 'scores': {'Hygiene': None}}
{'_id': ObjectId('64e09b42656c0045970140ba'), 'scores': {'Hygiene': 5}}
{'_id': ObjectId('64e09b42656c0045970140bb'), 'scores': {'Hygiene': 5}}
{'_id': ObjectId('64e09b42656c0045970140bc'), 'scores': {'Hygiene': 0}}
{'_id': ObjectId('64e09b42656c0045970140bd'), 'scores': {'Hygiene': 5}}
{'_id': ObjectId('64e09b42656c0045970140be'), 'scores': {'Hygiene': 0}}
{'_id': ObjectId('64e09b42656c0045970140bf'), 'scores': {'Hygiene': 5}}
{'_id': ObjectId('64e09b42656c0045970140c0'), 'scores': {'Hy

{'_id': ObjectId('64e09b43656c00459701547b'), 'scores': {'Hygiene': 5}}
{'_id': ObjectId('64e09b43656c00459701547c'), 'scores': {'Hygiene': 0}}
{'_id': ObjectId('64e09b43656c00459701547d'), 'scores': {'Hygiene': 0}}
{'_id': ObjectId('64e09b43656c00459701547e'), 'scores': {'Hygiene': 0}}
{'_id': ObjectId('64e09b43656c00459701547f'), 'scores': {'Hygiene': 5}}
{'_id': ObjectId('64e09b43656c004597015480'), 'scores': {'Hygiene': 0}}
{'_id': ObjectId('64e09b43656c004597015481'), 'scores': {'Hygiene': None}}
{'_id': ObjectId('64e09b43656c004597015482'), 'scores': {'Hygiene': 5}}
{'_id': ObjectId('64e09b43656c004597015483'), 'scores': {'Hygiene': 0}}
{'_id': ObjectId('64e09b43656c004597015484'), 'scores': {'Hygiene': 0}}
{'_id': ObjectId('64e09b43656c004597015485'), 'scores': {'Hygiene': 0}}
{'_id': ObjectId('64e09b43656c004597015486'), 'scores': {'Hygiene': 0}}
{'_id': ObjectId('64e09b43656c004597015487'), 'scores': {'Hygiene': 0}}
{'_id': ObjectId('64e09b43656c004597015488'), 'scores': {'Hyg

{'_id': ObjectId('64e09b45656c0045970169cf'), 'scores': {'Hygiene': 5}}
{'_id': ObjectId('64e09b45656c0045970169d0'), 'scores': {'Hygiene': 0}}
{'_id': ObjectId('64e09b45656c0045970169d1'), 'scores': {'Hygiene': 5}}
{'_id': ObjectId('64e09b45656c0045970169d2'), 'scores': {'Hygiene': 15}}
{'_id': ObjectId('64e09b45656c0045970169d3'), 'scores': {'Hygiene': 0}}
{'_id': ObjectId('64e09b45656c0045970169d4'), 'scores': {'Hygiene': 5}}
{'_id': ObjectId('64e09b45656c0045970169d5'), 'scores': {'Hygiene': 10}}
{'_id': ObjectId('64e09b45656c0045970169d6'), 'scores': {'Hygiene': None}}
{'_id': ObjectId('64e09b45656c0045970169d7'), 'scores': {'Hygiene': 5}}
{'_id': ObjectId('64e09b45656c0045970169d8'), 'scores': {'Hygiene': 0}}
{'_id': ObjectId('64e09b45656c0045970169d9'), 'scores': {'Hygiene': 10}}
{'_id': ObjectId('64e09b45656c0045970169da'), 'scores': {'Hygiene': 10}}
{'_id': ObjectId('64e09b45656c0045970169db'), 'scores': {'Hygiene': 5}}
{'_id': ObjectId('64e09b45656c0045970169dc'), 'scores': {

{'_id': ObjectId('64e09b48656c0045970182b7'), 'scores': {'Hygiene': 0}}
{'_id': ObjectId('64e09b48656c0045970182b8'), 'scores': {'Hygiene': 5}}
{'_id': ObjectId('64e09b48656c0045970182b9'), 'scores': {'Hygiene': 0}}
{'_id': ObjectId('64e09b48656c0045970182ba'), 'scores': {'Hygiene': 5}}
{'_id': ObjectId('64e09b48656c0045970182bb'), 'scores': {'Hygiene': 10}}
{'_id': ObjectId('64e09b48656c0045970182bc'), 'scores': {'Hygiene': 0}}
{'_id': ObjectId('64e09b48656c0045970182bd'), 'scores': {'Hygiene': 5}}
{'_id': ObjectId('64e09b48656c0045970182be'), 'scores': {'Hygiene': 5}}
{'_id': ObjectId('64e09b48656c0045970182bf'), 'scores': {'Hygiene': None}}
{'_id': ObjectId('64e09b48656c0045970182c0'), 'scores': {'Hygiene': 10}}
{'_id': ObjectId('64e09b48656c0045970182c1'), 'scores': {'Hygiene': None}}
{'_id': ObjectId('64e09b48656c0045970182c2'), 'scores': {'Hygiene': 0}}
{'_id': ObjectId('64e09b48656c0045970182c3'), 'scores': {'Hygiene': 5}}
{'_id': ObjectId('64e09b48656c0045970182c4'), 'scores': 

In [21]:
# Create a pipeline that: 
# 1. Matches establishments with a hygiene score of 0
# 2. Groups the matches by Local Authority
# 3. Sorts the matches from highest to lowest

match = {'$match': {'scores.Hygiene': 0}}
group = {'$group': {'_id': '$LocalAuthorityName', 'count': { '$sum': 1 }}}
sort = {'$sort': { 'count': -1 }}

pipeline = [match, group, sort]
la_hyg0 = list(est_p2.aggregate(pipeline))

# Print the number of documents in the result
print("No. of documents in result: ", len(la_hyg0))

# Print the first 10 results
pprint(la_hyg0[0:10])

No. of documents in result:  56
[{'_id': 'Thanet', 'count': 1130},
 {'_id': 'Greenwich', 'count': 882},
 {'_id': 'Maidstone', 'count': 713},
 {'_id': 'Newham', 'count': 711},
 {'_id': 'Swale', 'count': 686},
 {'_id': 'Chelmsford', 'count': 680},
 {'_id': 'Medway', 'count': 672},
 {'_id': 'Bexley', 'count': 607},
 {'_id': 'Southend-On-Sea', 'count': 586},
 {'_id': 'Tendring', 'count': 542}]


In [22]:
# Convert the result to a Pandas DataFrame
la_hyg0_df = pd.DataFrame(la_hyg0)

# Display the number of rows in the DataFrame
print("No. of rows in dataframe ('la_hyg0_df'):", len(la_hyg0_df))

# Display the first 10 rows of the DataFrame
la_hyg0_df.head(10)

No. of rows in dataframe ('la_hyg0_df'): 56


Unnamed: 0,_id,count
0,Thanet,1130
1,Greenwich,882
2,Maidstone,713
3,Newham,711
4,Swale,686
5,Chelmsford,680
6,Medway,672
7,Bexley,607
8,Southend-On-Sea,586
9,Tendring,542
