# Eat Safe, Love

## Notebook Set Up

In [2]:
# Import dependencies
from pymongo import MongoClient
from pprint import pprint
import pandas as pd
import json

In [3]:
# Create an instance of MongoClient
mongo = MongoClient(port=27017)

In [4]:
print(mongo.list_database_names())

['admin', 'config', 'local', 'met', 'uk_food']


In [5]:
# assign the uk_food database to a variable name
db = mongo['uk_food']

In [6]:
# review the collections in our database
db.list_collection_names()

['establishments']

In [7]:
# assign the collection to a variable
establishments = db['establishments']

## Part 3: Exploratory Analysis
Unless otherwise stated, for each question: 
* Use `count_documents` to display the number of documents contained in the result.
* Display the first document in the results using `pprint`.
* Convert the result to a Pandas DataFrame, print the number of rows in the DataFrame, and display the first 10 rows.

### 1. Which establishments have a hygiene score equal to 20?

In [8]:
establishments.find_one()

{'_id': ObjectId('65c941a5c7bd9d7ecc36ecb0'),
 'FHRSID': 647177,
 'ChangesByServerID': 0,
 'LocalAuthorityBusinessID': 'PI/000041489',
 'BusinessName': 'Wear Bay Bowls Club',
 'BusinessType': 'Pub/bar/nightclub',
 'BusinessTypeID': 7843,
 'AddressLine1': 'Wear Bay Road',
 'AddressLine2': 'Folkestone',
 'AddressLine3': 'Kent',
 'AddressLine4': '',
 'PostCode': 'CT19 6PY',
 'Phone': '',
 'RatingValue': 4,
 'RatingKey': 'fhrs_4_en-gb',
 'RatingDate': '2014-03-31T00:00:00',
 'LocalAuthorityCode': '188',
 'LocalAuthorityName': 'Folkestone and Hythe',
 'LocalAuthorityWebSite': 'http://www.folkestone-hythe.gov.uk',
 'LocalAuthorityEmailAddress': 'foodteam@folkestone-hythe.gov.uk',
 'scores': {'Hygiene': 5, 'Structural': 5, 'ConfidenceInManagement': 10},
 'SchemeType': 'FHRS',
 'geocode': {'longitude': 1.196408, 'latitude': 51.086058},
 'RightToReply': '',
 'Distance': 4591.821311183521,
 'NewRatingPending': False,
 'meta': {'dataSource': None,
  'extractDate': '0001-01-01T00:00:00',
  'itemCo

In [9]:
# Find the establishments with a hygiene score of 20
query = {"scores.Hygiene" : {'$gt' : 20}}
col_hy_gt_20 = [x for x in establishments.find(query)]
# Use count_documents to display the number of documents in the result
count = establishments.count_documents(query)
print(count)
# Display the first document in the results using pprint
pprint(col_hy_gt_20)

7
[{'AddressLine1': 'Skyline Hotel',
  'AddressLine2': 'Chelmsford Road',
  'AddressLine3': 'Barnston',
  'AddressLine4': 'Dunmow',
  'BusinessName': 'Inferno',
  'BusinessType': 'Takeaway/sandwich shop',
  'BusinessTypeID': 7844,
  'ChangesByServerID': 0,
  'Distance': 4650.02974294374,
  'FHRSID': 1349147,
  'LocalAuthorityBusinessID': '21/00036/COM',
  'LocalAuthorityCode': '122',
  'LocalAuthorityEmailAddress': 'environmentalhealth@uttlesford.gov.uk',
  'LocalAuthorityName': 'Uttlesford',
  'LocalAuthorityWebSite': 'http://www.uttlesford.gov.uk',
  'NewRatingPending': False,
  'Phone': '',
  'PostCode': 'CM6 1LP',
  'RatingDate': '2022-01-27T00:00:00',
  'RatingKey': 'fhrs_0_en-gb',
  'RatingValue': 0,
  'RightToReply': '',
  'SchemeType': 'FHRS',
  '_id': ObjectId('65c941a7c7bd9d7ecc376e62'),
  'geocode': {'latitude': 51.85643, 'longitude': 0.383023},
  'links': [{'href': 'http://api.ratings.food.gov.uk/establishments/1349147',
             'rel': 'self'}],
  'meta': {'dataSource'

In [10]:
# Convert the result to a Pandas DataFrame
df = pd.DataFrame(col_hy_gt_20)
# Display the number of rows in the DataFrame
row_count = df.shape[0]
row_count
# Display the first 10 rows of the DataFrame
df.head()

Unnamed: 0,_id,FHRSID,ChangesByServerID,LocalAuthorityBusinessID,BusinessName,BusinessType,BusinessTypeID,AddressLine1,AddressLine2,AddressLine3,...,LocalAuthorityWebSite,LocalAuthorityEmailAddress,scores,SchemeType,geocode,RightToReply,Distance,NewRatingPending,meta,links
0,65c941a7c7bd9d7ecc376e62,1349147,0,21/00036/COM,Inferno,Takeaway/sandwich shop,7844,Skyline Hotel,Chelmsford Road,Barnston,...,http://www.uttlesford.gov.uk,environmentalhealth@uttlesford.gov.uk,"{'Hygiene': 25, 'Structural': 20, 'ConfidenceI...",FHRS,"{'longitude': 0.383023, 'latitude': 51.85643}",,4650.029743,False,"{'dataSource': None, 'extractDate': '0001-01-0...","[{'rel': 'self', 'href': 'http://api.ratings.f..."
1,65c941a7c7bd9d7ecc377899,785554,0,08/00054/FOOD,Stratford News And Wines,Retailers - other,4613,107 Romford Road,Stratford,London,...,https://www.newham.gov.uk,food@newham.gov.uk,"{'Hygiene': 25, 'Structural': 15, 'ConfidenceI...",FHRS,"{'longitude': 0.008382, 'latitude': 51.542772}",,4652.047527,False,"{'dataSource': None, 'extractDate': '0001-01-0...","[{'rel': 'self', 'href': 'http://api.ratings.f..."
2,65c941a7c7bd9d7ecc377a51,514156,0,147,The Plough & Harrow,Pub/bar/nightclub,7843,,419 High Road Leytonstone,,...,http://www.walthamforest.gov.uk,environmentalhealth@walthamforest.gov.uk,"{'Hygiene': 25, 'Structural': 25, 'ConfidenceI...",FHRS,"{'longitude': 0.006434, 'latitude': 51.558138}",,4652.681025,False,"{'dataSource': None, 'extractDate': '0001-01-0...","[{'rel': 'self', 'href': 'http://api.ratings.f..."
3,65c941a7c7bd9d7ecc377a5e,514651,0,47178,Chicks,Takeaway/sandwich shop,7844,,497 High Road,,...,http://www.walthamforest.gov.uk,environmentalhealth@walthamforest.gov.uk,"{'Hygiene': 25, 'Structural': 25, 'ConfidenceI...",FHRS,"{'longitude': 0.0071334, 'latitude': 51.5593505}",,4652.699935,False,"{'dataSource': None, 'extractDate': '0001-01-0...","[{'rel': 'self', 'href': 'http://api.ratings.f..."
4,65c941a7c7bd9d7ecc377a95,514221,0,17220,The Continental Food Exchange/TFC Leytonstone,Retailers - other,4613,,647-661 High Road Leytonstone,,...,http://www.walthamforest.gov.uk,environmentalhealth@walthamforest.gov.uk,"{'Hygiene': 25, 'Structural': 25, 'ConfidenceI...",FHRS,"{'longitude': 0.009602, 'latitude': 51.563902}",,4652.776654,False,"{'dataSource': None, 'extractDate': '0001-01-0...","[{'rel': 'self', 'href': 'http://api.ratings.f..."


### 2. Which establishments in London have a `RatingValue` greater than or equal to 4?

In [11]:
establishments.find_one()

{'_id': ObjectId('65c941a5c7bd9d7ecc36ecb0'),
 'FHRSID': 647177,
 'ChangesByServerID': 0,
 'LocalAuthorityBusinessID': 'PI/000041489',
 'BusinessName': 'Wear Bay Bowls Club',
 'BusinessType': 'Pub/bar/nightclub',
 'BusinessTypeID': 7843,
 'AddressLine1': 'Wear Bay Road',
 'AddressLine2': 'Folkestone',
 'AddressLine3': 'Kent',
 'AddressLine4': '',
 'PostCode': 'CT19 6PY',
 'Phone': '',
 'RatingValue': 4,
 'RatingKey': 'fhrs_4_en-gb',
 'RatingDate': '2014-03-31T00:00:00',
 'LocalAuthorityCode': '188',
 'LocalAuthorityName': 'Folkestone and Hythe',
 'LocalAuthorityWebSite': 'http://www.folkestone-hythe.gov.uk',
 'LocalAuthorityEmailAddress': 'foodteam@folkestone-hythe.gov.uk',
 'scores': {'Hygiene': 5, 'Structural': 5, 'ConfidenceInManagement': 10},
 'SchemeType': 'FHRS',
 'geocode': {'longitude': 1.196408, 'latitude': 51.086058},
 'RightToReply': '',
 'Distance': 4591.821311183521,
 'NewRatingPending': False,
 'meta': {'dataSource': None,
  'extractDate': '0001-01-01T00:00:00',
  'itemCo

In [28]:
# Find the establishments 
query_rate = {'RatingValue' : {'$gte': 4}, 'AddressLine4' : {'$regex':'London'}}
# col_rate_gte4 = [x for x in establishments.find(query_rate)]
col_rate_gte4 = establishments.find(query_rate)
# Use count_documents to display the number of documents in the result
count_rate = establishments.count_documents(query_rate)
print("Number of documents with rating >= 4:", count_rate)
# Display the first document in the results using pprint
pprint([x for x in establishments.find(query_rate)])

Number of documents with rating >= 4: 390
[{'AddressLine1': 'Arch D',
  'AddressLine2': 'The Link Thamesmead',
  'AddressLine3': 'Bazalgette Way',
  'AddressLine4': 'London',
  'BusinessName': 'The Mezzanine Cafe',
  'BusinessType': 'Restaurant/Cafe/Canteen',
  'BusinessTypeID': 1,
  'ChangesByServerID': 0,
  'Distance': 4646.357884390823,
  'FHRSID': 1049722,
  'LocalAuthorityBusinessID': '18/00096/CP',
  'LocalAuthorityCode': '503',
  'LocalAuthorityEmailAddress': 'food.safety@bexley.gov.uk',
  'LocalAuthorityName': 'Bexley',
  'LocalAuthorityWebSite': 'http://www.bexley.gov.uk',
  'NewRatingPending': False,
  'Phone': '',
  'PostCode': 'SE2 9BS',
  'RatingDate': '2022-05-24T00:00:00',
  'RatingKey': 'fhrs_4_en-gb',
  'RatingValue': 4,
  'RightToReply': '',
  'SchemeType': 'FHRS',
  '_id': ObjectId('65c941a7c7bd9d7ecc375c95'),
  'geocode': {'latitude': 51.5002632141113, 'longitude': 0.121751002967358},
  'links': [{'href': 'http://api.ratings.food.gov.uk/establishments/1049722',
    

In [23]:
# Convert the result to a Pandas DataFrame
df_rate_value = pd.DataFrame(col_rate_gte4)
# Display the number of rows in the DataFrame
row_count = df_rate_value.shape[0]
row_count
# Display the first 10 rows of the DataFrame
df_rate_value.head(10)

Unnamed: 0,_id,FHRSID,ChangesByServerID,LocalAuthorityBusinessID,BusinessName,BusinessType,BusinessTypeID,AddressLine1,AddressLine2,AddressLine3,...,LocalAuthorityWebSite,LocalAuthorityEmailAddress,scores,SchemeType,geocode,RightToReply,Distance,NewRatingPending,meta,links
0,65c941a7c7bd9d7ecc375c95,1049722,0,18/00096/CP,The Mezzanine Cafe,Restaurant/Cafe/Canteen,1,Arch D,The Link Thamesmead,Bazalgette Way,...,http://www.bexley.gov.uk,food.safety@bexley.gov.uk,"{'Hygiene': 10, 'Structural': 0, 'ConfidenceIn...",FHRS,"{'longitude': 0.121751002967358, 'latitude': 5...",,4646.357884,False,"{'dataSource': None, 'extractDate': '0001-01-0...","[{'rel': 'self', 'href': 'http://api.ratings.f..."
1,65c941a7c7bd9d7ecc375cb3,1261451,0,20/00255/MIXED,"St Edward's Church, Mottingham - StEP Lunch Cl...",Other catering premises,7841,St Edwards Church Hall,St Keverne Road,Mottingham,...,http://www.bromley.gov.uk,food@bromley.gov.uk,"{'Hygiene': 0, 'Structural': 5, 'ConfidenceInM...",FHRS,"{'longitude': 0.04774, 'latitude': 51.428019}",,4646.410908,False,"{'dataSource': None, 'extractDate': '0001-01-0...","[{'rel': 'self', 'href': 'http://api.ratings.f..."
2,65c941a7c7bd9d7ecc375cba,987733,0,16/00340/MIXED,Maryfield Pre-School 2,Caring Premises,5,Mottingham Community Centre,Kimmeridge Road,Mottingham,...,http://www.bromley.gov.uk,food@bromley.gov.uk,"{'Hygiene': 5, 'Structural': 5, 'ConfidenceInM...",FHRS,"{'longitude': 0.0465259999036789, 'latitude': ...",,4646.414831,False,"{'dataSource': None, 'extractDate': '0001-01-0...","[{'rel': 'self', 'href': 'http://api.ratings.f..."
3,65c941a7c7bd9d7ecc375cbc,357627,0,00000/0000/8/951,Co-op,Retailers - supermarkets/hypermarkets,7840,The Co-operative Food,Kimmeridge Road,Mottingham,...,http://www.bromley.gov.uk,food@bromley.gov.uk,"{'Hygiene': 0, 'Structural': 0, 'ConfidenceInM...",FHRS,"{'longitude': 0.0465259999036789, 'latitude': ...",,4646.414831,False,"{'dataSource': None, 'extractDate': '0001-01-0...","[{'rel': 'self', 'href': 'http://api.ratings.f..."
4,65c941a7c7bd9d7ecc375cda,1151706,0,00000/0000/8/204,North Hub @ Castlecombe Youth Centre,Caring Premises,5,Castlecombe Youth Centre,Castlecombe Road,Mottingham,...,http://www.bromley.gov.uk,food@bromley.gov.uk,"{'Hygiene': 5, 'Structural': 10, 'ConfidenceIn...",FHRS,"{'longitude': 0.0433179996907711, 'latitude': ...",,4646.439635,False,"{'dataSource': None, 'extractDate': '0001-01-0...","[{'rel': 'self', 'href': 'http://api.ratings.f..."
5,65c941a7c7bd9d7ecc375cdd,1468037,0,22/00180/MIXED,Spencers,Retailers - other,4613,11 Cranley Parade,Kimmeridge Road,Mottingham,...,http://www.bromley.gov.uk,food@bromley.gov.uk,"{'Hygiene': 0, 'Structural': 10, 'ConfidenceIn...",FHRS,"{'longitude': 0.046141, 'latitude': 51.427318}",,4646.443677,False,"{'dataSource': None, 'extractDate': '0001-01-0...","[{'rel': 'self', 'href': 'http://api.ratings.f..."
6,65c941a7c7bd9d7ecc375ce0,358232,0,02/00010/MIXED,Domino's Pizza,Takeaway/sandwich shop,7844,3 Cranley Parade,Beaconsfield Road,Mottingham,...,http://www.bromley.gov.uk,food@bromley.gov.uk,"{'Hygiene': 5, 'Structural': 5, 'ConfidenceInM...",FHRS,"{'longitude': 0.046141, 'latitude': 51.427318}",,4646.443677,False,"{'dataSource': None, 'extractDate': '0001-01-0...","[{'rel': 'self', 'href': 'http://api.ratings.f..."
7,65c941a7c7bd9d7ecc375ce8,1415217,0,21/00630/MIXED,Papa John's Pizza,Takeaway/sandwich shop,7844,4 Cranley Parade,Beaconsfield Road,Mottingham,...,http://www.bromley.gov.uk,food@bromley.gov.uk,"{'Hygiene': 0, 'Structural': 5, 'ConfidenceInM...",FHRS,"{'longitude': 0.0460971, 'latitude': 51.4273993}",,4646.448256,False,"{'dataSource': None, 'extractDate': '0001-01-0...","[{'rel': 'self', 'href': 'http://api.ratings.f..."
8,65c941a7c7bd9d7ecc375cfb,635108,0,14/00056/MIXED,Perfect Cafe,Restaurant/Cafe/Canteen,1,11 Beaconsfield Parade,Beaconsfield Road,Mottingham,...,http://www.bromley.gov.uk,food@bromley.gov.uk,"{'Hygiene': 0, 'Structural': 0, 'ConfidenceInM...",FHRS,"{'longitude': 0.045445, 'latitude': 51.427186}",,4646.464277,False,"{'dataSource': None, 'extractDate': '0001-01-0...","[{'rel': 'self', 'href': 'http://api.ratings.f..."
9,65c941a7c7bd9d7ecc375cfd,357579,0,00000/0000/8/062,Superfry Fish Bar,Takeaway/sandwich shop,7844,12 Beaconsfield Parade,Beaconsfield Road,Mottingham,...,http://www.bromley.gov.uk,food@bromley.gov.uk,"{'Hygiene': 10, 'Structural': 5, 'ConfidenceIn...",FHRS,"{'longitude': 0.045445, 'latitude': 51.427186}",,4646.464277,False,"{'dataSource': None, 'extractDate': '0001-01-0...","[{'rel': 'self', 'href': 'http://api.ratings.f..."


### 3. What are the top 5 establishments with a `RatingValue` rating value of 5, sorted by lowest hygiene score, nearest to the new restaurant added, "Penang Flavours"?

In [14]:
query = {'BusinessName' : 'Penang Flavours'}
establishments.find_one(query)

{'_id': ObjectId('65c941a86cb35683baa36ffc'),
 'BusinessName': 'Penang Flavours',
 'BusinessType': 'Restaurant/Cafe/Canteen',
 'BusinessTypeID': 1,
 'AddressLine1': 'Penang Flavours',
 'AddressLine2': '146A Plumstead Rd',
 'AddressLine3': 'London',
 'AddressLine4': '',
 'PostCode': 'SE18 7DY',
 'Phone': '',
 'LocalAuthorityCode': '511',
 'LocalAuthorityName': 'Greenwich',
 'LocalAuthorityWebSite': 'http://www.royalgreenwich.gov.uk',
 'LocalAuthorityEmailAddress': 'health@royalgreenwich.gov.uk',
 'scores': {'Hygiene': '', 'Structural': '', 'ConfidenceInManagement': ''},
 'SchemeType': 'FHRS',
 'geocode': {'longitude': 0.08384, 'latitude': 51.490142},
 'RightToReply': '',
 'Distance': 4623.972328074718,
 'NewRatingPending': True,
 'RatingValue': None}

In [29]:
# Search within 0.01 degree on either side of the latitude and longitude.
degree_search = 0.01
#Find long and lat 
latitude = float(establishments.find_one({'BusinessName': 'Penang Flavours'}, {'geocode.latitude'})['geocode']['latitude'])
longitude = float(establishments.find_one({'BusinessName': 'Penang Flavours'}, {'geocode.longitude'})['geocode']['longitude'])
#Define the latitude and longitude ranges for the search
latitude_range = [latitude - degree_search, latitude + degree_search]
longitude_range = [longitude - degree_search, longitude + degree_search]

top_5_establishments =  [x for x in establishments.find(
    {
        "geocode.latitude": {"$gte": latitude_range[0], "$lte": latitude_range[1]},
        "geocode.longitude": {"$gte": longitude_range[0], "$lte": longitude_range[1]},
        "RatingValue": 5  
    },
    sort =  [('scores.Hygiene', 1)] 
).limit(5)]
# Print the results
pprint(top_5_establishments)

[{'AddressLine1': '130 - 132 Plumstead High Street',
  'AddressLine2': '',
  'AddressLine3': 'Plumstead',
  'AddressLine4': 'Greenwich',
  'BusinessName': 'Volunteer',
  'BusinessType': 'Pub/bar/nightclub',
  'BusinessTypeID': 7843,
  'ChangesByServerID': 0,
  'Distance': 4646.965634598608,
  'FHRSID': 694609,
  'LocalAuthorityBusinessID': 'PI/000116619',
  'LocalAuthorityCode': '511',
  'LocalAuthorityEmailAddress': 'health@royalgreenwich.gov.uk',
  'LocalAuthorityName': 'Greenwich',
  'LocalAuthorityWebSite': 'http://www.royalgreenwich.gov.uk',
  'NewRatingPending': False,
  'Phone': '',
  'PostCode': 'SE18 1JQ',
  'RatingDate': '2019-08-05T00:00:00',
  'RatingKey': 'fhrs_5_en-gb',
  'RatingValue': 5,
  'RightToReply': '',
  'SchemeType': 'FHRS',
  '_id': ObjectId('65c941a7c7bd9d7ecc376042'),
  'geocode': {'latitude': 51.4873437, 'longitude': 0.09208},
  'links': [{'href': 'http://api.ratings.food.gov.uk/establishments/694609',
             'rel': 'self'}],
  'meta': {'dataSource': N

In [30]:
# Convert result to Pandas DataFrame
df_top5 = pd.DataFrame([x for x in top_5_establishments])
df_top5.head()

Unnamed: 0,_id,FHRSID,ChangesByServerID,LocalAuthorityBusinessID,BusinessName,BusinessType,BusinessTypeID,AddressLine1,AddressLine2,AddressLine3,...,LocalAuthorityWebSite,LocalAuthorityEmailAddress,scores,SchemeType,geocode,RightToReply,Distance,NewRatingPending,meta,links
0,65c941a7c7bd9d7ecc376042,694609,0,PI/000116619,Volunteer,Pub/bar/nightclub,7843,130 - 132 Plumstead High Street,,Plumstead,...,http://www.royalgreenwich.gov.uk,health@royalgreenwich.gov.uk,"{'Hygiene': 0, 'Structural': 0, 'ConfidenceInM...",FHRS,"{'longitude': 0.09208, 'latitude': 51.4873437}",,4646.965635,False,"{'dataSource': None, 'extractDate': '0001-01-0...","[{'rel': 'self', 'href': 'http://api.ratings.f..."
1,65c941a7c7bd9d7ecc376060,694478,0,PI/000086506,Atlantic Fish Bar,Takeaway/sandwich shop,7844,35 Lakedale Road,,Plumstead,...,http://www.royalgreenwich.gov.uk,health@royalgreenwich.gov.uk,"{'Hygiene': 0, 'Structural': 0, 'ConfidenceInM...",FHRS,"{'longitude': 0.0912164, 'latitude': 51.4867296}",,4646.974612,False,"{'dataSource': None, 'extractDate': '0001-01-0...","[{'rel': 'self', 'href': 'http://api.ratings.f..."
2,65c941a7c7bd9d7ecc376064,909912,0,PI/000201100,Lumbini Grocery Ltd T/A Al-Iman,Retailers - other,4613,17 Lakedale Road,,Plumstead,...,http://www.royalgreenwich.gov.uk,health@royalgreenwich.gov.uk,"{'Hygiene': 0, 'Structural': 5, 'ConfidenceInM...",FHRS,"{'longitude': 0.0916256, 'latitude': 51.4871632}",,4646.975587,False,"{'dataSource': None, 'extractDate': '0001-01-0...","[{'rel': 'self', 'href': 'http://api.ratings.f..."
3,65c941a7c7bd9d7ecc376016,695223,0,PI/000178842,Iceland,Retailers - supermarkets/hypermarkets,7840,144 - 146 Plumstead High Street,,Plumstead,...,http://www.royalgreenwich.gov.uk,health@royalgreenwich.gov.uk,"{'Hygiene': 0, 'Structural': 5, 'ConfidenceInM...",FHRS,"{'longitude': 0.0924199968576431, 'latitude': ...",,4646.946071,False,"{'dataSource': None, 'extractDate': '0001-01-0...","[{'rel': 'self', 'href': 'http://api.ratings.f..."
4,65c941a7c7bd9d7ecc376024,1380578,0,14425,Howe and Co Fish and Chips - Van 17,Mobile caterer,7846,Restaurant And Premises 107A Plumstead High St...,,Plumstead,...,http://www.royalgreenwich.gov.uk,health@royalgreenwich.gov.uk,"{'Hygiene': 0, 'Structural': 0, 'ConfidenceInM...",FHRS,"{'longitude': 0.0925370007753372, 'latitude': ...",,4646.955931,False,"{'dataSource': None, 'extractDate': '0001-01-0...","[{'rel': 'self', 'href': 'http://api.ratings.f..."


### 4. How many establishments in each Local Authority area have a hygiene score of 0?

In [17]:
# Create a pipeline that: 
# 1. Matches establishments with a hygiene score of 0
# 2. Groups the matches by Local Authority
# 3. Sorts the matches from highest to lowest
macth_query = {'$match':{'scores.Hygiene': 0}}
group_query = {'$group' : {'_id' : "$LocalAuthorityName","count" : {"$sum" : 1}}}
sort_value = {'$sort' : {"count" : -1}}
#put the pipeline together
pipeline = [macth_query,group_query,sort_value]
results = [x for x in list(establishments.aggregate(pipeline))]
# Print the number of documents in the result
result_list = list(results)
print("Number of documents in the result:", len(result_list))
# Print the first 10 results
pprint(results)

Number of documents in the result: 55
[{'_id': 'Thanet', 'count': 1130},
 {'_id': 'Greenwich', 'count': 882},
 {'_id': 'Maidstone', 'count': 713},
 {'_id': 'Newham', 'count': 711},
 {'_id': 'Swale', 'count': 686},
 {'_id': 'Chelmsford', 'count': 680},
 {'_id': 'Medway', 'count': 672},
 {'_id': 'Bexley', 'count': 607},
 {'_id': 'Southend-On-Sea', 'count': 586},
 {'_id': 'Tendring', 'count': 542},
 {'_id': 'Colchester', 'count': 498},
 {'_id': 'Tunbridge Wells', 'count': 491},
 {'_id': 'Folkestone and Hythe', 'count': 480},
 {'_id': 'Eastbourne', 'count': 478},
 {'_id': 'Hastings', 'count': 464},
 {'_id': 'Bromley', 'count': 460},
 {'_id': 'Ashford', 'count': 427},
 {'_id': 'Havering', 'count': 397},
 {'_id': 'Dartford', 'count': 383},
 {'_id': 'Braintree', 'count': 382},
 {'_id': 'Basildon', 'count': 362},
 {'_id': 'Gravesham', 'count': 339},
 {'_id': 'Tonbridge and Malling', 'count': 325},
 {'_id': 'Thurrock', 'count': 313},
 {'_id': 'Barking and Dagenham', 'count': 301},
 {'_id': 'Can

In [18]:
# Convert the result to a Pandas DataFrame
local_auth_hyg_db = pd.DataFrame(results)
# Display the number of rows in the DataFrame
local_auth_hyg_db.shape[0]
# Display the first 10 rows of the DataFrame
local_auth_hyg_db.head()

Unnamed: 0,_id,count
0,Thanet,1130
1,Greenwich,882
2,Maidstone,713
3,Newham,711
4,Swale,686
