In [1]:
# Dependencies
import numpy as np
import pandas as pd

In [2]:
# Relative locations of the raw menu files used by this notebook
mcdonalds_csv, subway_csv = 'Resources/mcdonalds.csv', 'Resources/subway.csv'
starbucks_drinks_csv = 'Resources/starbucks_menu_drink.csv'
# Note the .tsv extension on the food file; no cell visible in this notebook reads it yet
starbucks_food_csv = 'Resources/starbucks-menu-nutrition-food-test.tsv'

In [3]:
# Lookup table pairing each restaurant name with its numeric ID.
# The same IDs (1000/2000/3000) are written into the per-restaurant frames further down.
data = [
    [1000, 'subway'],
    [2000, 'mcdonalds'],
    [3000, 'starbucks'],
]
restaurant_id = pd.DataFrame(data=data, columns=['id', 'name'])

# Show the lookup table
restaurant_id

Unnamed: 0,id,name
0,1000,subway
1,2000,mcdonalds
2,3000,starbucks


In [4]:
# Write the restaurant lookup table to disk (header row kept, row index omitted)
restaurant_id.to_csv(
    r'New Tables/restaurant_id_df.csv',
    header=True,
    index=False,
)


### Cleaning Process

In [5]:
# Load the Subway menu and preview its first five rows
# NOTE(review): the preview stored below this cell lists McDonald's items
# (e.g. 'Egg McMuffin') -- confirm that Resources/subway.csv really holds Subway data.
subway_df = pd.read_csv(filepath_or_buffer=subway_csv)
subway_df.head(n=5)

Unnamed: 0,Category,Item,Serving Size,Calories,Calories from Fat,Total Fat,Total Fat (% Daily Value),Saturated Fat,Saturated Fat (% Daily Value),Trans Fat,...,Carbohydrates,Carbohydrates (% Daily Value),Dietary Fiber,Dietary Fiber (% Daily Value),Sugars,Protein,Vitamin A (% Daily Value),Vitamin C (% Daily Value),Calcium (% Daily Value),Iron (% Daily Value)
0,Breakfast,Egg McMuffin,4.8 oz (136 g),300,120,13.0,20,5.0,25,0.0,...,31,10,4,17,3,17,10,0,25,15
1,Breakfast,Egg White Delight,4.8 oz (135 g),250,70,8.0,12,3.0,15,0.0,...,30,10,4,17,3,18,6,0,25,8
2,Breakfast,Sausage McMuffin,3.9 oz (111 g),370,200,23.0,35,8.0,42,0.0,...,29,10,4,17,2,14,8,0,25,10
3,Breakfast,Sausage McMuffin with Egg,5.7 oz (161 g),450,250,28.0,43,10.0,52,0.0,...,30,10,4,17,2,21,15,0,30,15
4,Breakfast,Sausage McMuffin with Egg Whites,5.7 oz (161 g),400,210,23.0,35,8.0,42,0.0,...,30,10,4,17,2,21,6,0,25,10


In [6]:
# Tag every Subway row with the restaurant ID (1000) and add placeholder
# category/item IDs (1); real values are mapped onto the combined frame later on.
subway_df = subway_df.assign(**{
    'Restaurant ID': 1000,
    'Category ID': 1,
    'Item ID': 1,
})

In [7]:
# Reorder the columns: the three ID columns first, then the descriptive and nutrition columns
subway_id_columns = ['Restaurant ID', 'Category ID', 'Item ID']
subway_menu_columns = [
    'Category', 'Item', 'Serving Size', 'Calories', 'Calories from Fat',
    'Total Fat', 'Total Fat (% Daily Value)',
    'Saturated Fat', 'Saturated Fat (% Daily Value)',
    'Trans Fat',
    'Cholesterol', 'Cholesterol (% Daily Value)',
    'Sodium', 'Sodium (% Daily Value)',
    'Carbohydrates', 'Carbohydrates (% Daily Value)',
    'Dietary Fiber', 'Dietary Fiber (% Daily Value)',
    'Sugars', 'Protein',
    'Vitamin A (% Daily Value)', 'Vitamin C (% Daily Value)',
    'Calcium (% Daily Value)', 'Iron (% Daily Value)',
]
subway_df = subway_df[subway_id_columns + subway_menu_columns]

In [8]:
# Append the measurement unit to each absolute-quantity column name
subway_unit_names = {
    'Total Fat': 'Total Fat (g)',
    'Saturated Fat': 'Saturated Fat (g)',
    'Trans Fat': 'Trans Fat (g)',
    'Cholesterol': 'Cholesterol (mg)',
    'Sodium': 'Sodium (mg)',
    'Carbohydrates': 'Carbohydrates (g)',
    'Dietary Fiber': 'Dietary Fiber (g)',
    'Sugars': 'Sugars (g)',
    'Protein': 'Protein (g)',
}
subway_df = subway_df.rename(columns=subway_unit_names)

# Preview the frame to check the new column names
subway_df.head()

Unnamed: 0,Restaurant ID,Category ID,Item ID,Category,Item,Serving Size,Calories,Calories from Fat,Total Fat (g),Total Fat (% Daily Value),...,Carbohydrates (g),Carbohydrates (% Daily Value),Dietary Fiber (g),Dietary Fiber (% Daily Value),Sugars (g),Protein (g),Vitamin A (% Daily Value),Vitamin C (% Daily Value),Calcium (% Daily Value),Iron (% Daily Value)
0,1000,1,1,Breakfast,Egg McMuffin,4.8 oz (136 g),300,120,13.0,20,...,31,10,4,17,3,17,10,0,25,15
1,1000,1,1,Breakfast,Egg White Delight,4.8 oz (135 g),250,70,8.0,12,...,30,10,4,17,3,18,6,0,25,8
2,1000,1,1,Breakfast,Sausage McMuffin,3.9 oz (111 g),370,200,23.0,35,...,29,10,4,17,2,14,8,0,25,10
3,1000,1,1,Breakfast,Sausage McMuffin with Egg,5.7 oz (161 g),450,250,28.0,43,...,30,10,4,17,2,21,15,0,30,15
4,1000,1,1,Breakfast,Sausage McMuffin with Egg Whites,5.7 oz (161 g),400,210,23.0,35,...,30,10,4,17,2,21,6,0,25,10


In [10]:
# Load the McDonald's menu and preview its first five rows
mcdonalds_df = pd.read_csv(filepath_or_buffer=mcdonalds_csv)
mcdonalds_df.head(n=5)

Unnamed: 0,Category,Item,Serving Size,Calories,Calories from Fat,Total Fat,Total Fat (% Daily Value),Saturated Fat,Saturated Fat (% Daily Value),Trans Fat,...,Carbohydrates,Carbohydrates (% Daily Value),Dietary Fiber,Dietary Fiber (% Daily Value),Sugars,Protein,Vitamin A (% Daily Value),Vitamin C (% Daily Value),Calcium (% Daily Value),Iron (% Daily Value)
0,Breakfast,Egg McMuffin,4.8 oz (136 g),300,120,13.0,20,5.0,25,0.0,...,31,10,4,17,3,17,10,0,25,15
1,Breakfast,Egg White Delight,4.8 oz (135 g),250,70,8.0,12,3.0,15,0.0,...,30,10,4,17,3,18,6,0,25,8
2,Breakfast,Sausage McMuffin,3.9 oz (111 g),370,200,23.0,35,8.0,42,0.0,...,29,10,4,17,2,14,8,0,25,10
3,Breakfast,Sausage McMuffin with Egg,5.7 oz (161 g),450,250,28.0,43,10.0,52,0.0,...,30,10,4,17,2,21,15,0,30,15
4,Breakfast,Sausage McMuffin with Egg Whites,5.7 oz (161 g),400,210,23.0,35,8.0,42,0.0,...,30,10,4,17,2,21,6,0,25,10


In [11]:
# Tag every McDonald's row with its restaurant ID (2000)
mcdonalds_df = mcdonalds_df.assign(**{'Restaurant ID': 2000})

In [12]:
# Reorder the columns so the restaurant ID leads, followed by the descriptive and nutrition columns
mcdonalds_column_order = ['Restaurant ID'] + [
    'Category', 'Item', 'Serving Size', 'Calories', 'Calories from Fat',
    'Total Fat', 'Total Fat (% Daily Value)',
    'Saturated Fat', 'Saturated Fat (% Daily Value)',
    'Trans Fat',
    'Cholesterol', 'Cholesterol (% Daily Value)',
    'Sodium', 'Sodium (% Daily Value)',
    'Carbohydrates', 'Carbohydrates (% Daily Value)',
    'Dietary Fiber', 'Dietary Fiber (% Daily Value)',
    'Sugars', 'Protein',
    'Vitamin A (% Daily Value)', 'Vitamin C (% Daily Value)',
    'Calcium (% Daily Value)', 'Iron (% Daily Value)',
]
mcdonalds_df = mcdonalds_df[mcdonalds_column_order]

In [13]:
# Append the measurement unit to each absolute-quantity column name:
# grams for the macronutrients, milligrams for cholesterol and sodium
mcdonalds_gram_columns = ['Total Fat', 'Saturated Fat', 'Trans Fat', 'Carbohydrates',
                          'Dietary Fiber', 'Sugars', 'Protein']
mcdonalds_milligram_columns = ['Cholesterol', 'Sodium']
mcdonalds_unit_names = {
    **{column: column + ' (g)' for column in mcdonalds_gram_columns},
    **{column: column + ' (mg)' for column in mcdonalds_milligram_columns},
}
mcdonalds_df = mcdonalds_df.rename(columns=mcdonalds_unit_names)

# Preview the frame to check the new column names
mcdonalds_df.head()

Unnamed: 0,Restaurant ID,Category,Item,Serving Size,Calories,Calories from Fat,Total Fat (g),Total Fat (% Daily Value),Saturated Fat (g),Saturated Fat (% Daily Value),...,Carbohydrates (g),Carbohydrates (% Daily Value),Dietary Fiber (g),Dietary Fiber (% Daily Value),Sugars (g),Protein (g),Vitamin A (% Daily Value),Vitamin C (% Daily Value),Calcium (% Daily Value),Iron (% Daily Value)
0,2000,Breakfast,Egg McMuffin,4.8 oz (136 g),300,120,13.0,20,5.0,25,...,31,10,4,17,3,17,10,0,25,15
1,2000,Breakfast,Egg White Delight,4.8 oz (135 g),250,70,8.0,12,3.0,15,...,30,10,4,17,3,18,6,0,25,8
2,2000,Breakfast,Sausage McMuffin,3.9 oz (111 g),370,200,23.0,35,8.0,42,...,29,10,4,17,2,14,8,0,25,10
3,2000,Breakfast,Sausage McMuffin with Egg,5.7 oz (161 g),450,250,28.0,43,10.0,52,...,30,10,4,17,2,21,15,0,30,15
4,2000,Breakfast,Sausage McMuffin with Egg Whites,5.7 oz (161 g),400,210,23.0,35,8.0,42,...,30,10,4,17,2,21,6,0,25,10


In [14]:
# Load the Starbucks drinks menu and display the frame
# NOTE(review): the stored output shows a malformed 'Total Fat (g)' value ('3 2') on
# row 237; that column probably needs cleaning before it can be treated as numeric.
starbucks_drinks_df = pd.read_csv(filepath_or_buffer=starbucks_drinks_csv)
starbucks_drinks_df

Unnamed: 0,Beverage_category,Beverage,Beverage_prep,Calories,Total Fat (g),Trans Fat (g),Saturated Fat (g),Sodium (mg),Total Carbohydrates (g),Cholesterol (mg),Dietary Fibre (g),Sugars (g),Protein (g),Vitamin A (% DV),Vitamin C (% DV),Calcium (% DV),Iron (% DV),Caffeine (mg)
0,Coffee,Brewed Coffee,Short,3,0.1,0.0,0.0,0,5,0,0,0,0.3,0%,0%,0%,0%,175
1,Coffee,Brewed Coffee,Tall,4,0.1,0.0,0.0,0,10,0,0,0,0.5,0%,0%,0%,0%,260
2,Coffee,Brewed Coffee,Grande,5,0.1,0.0,0.0,0,10,0,0,0,1.0,0%,0%,0%,0%,330
3,Coffee,Brewed Coffee,Venti,5,0.1,0.0,0.0,0,10,0,0,0,1.0,0%,0%,2%,0%,410
4,Classic Espresso Drinks,Caffè Latte,Short Nonfat Milk,70,0.1,0.1,0.0,5,75,10,0,9,6.0,10%,0%,20%,0%,75
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
237,Frappuccino® Blended Crème,Strawberries & Crème (Without Whipped Cream),Soymilk,320,3 2,0.4,0.0,0,250,67,1,64,5.0,6%,8%,20%,10%,0
238,Frappuccino® Blended Crème,Vanilla Bean (Without Whipped Cream),Tall Nonfat Milk,170,0.1,0.1,0.0,0,160,39,0,38,4.0,6%,0%,10%,0%,0
239,Frappuccino® Blended Crème,Vanilla Bean (Without Whipped Cream),Whole Milk,200,3.5,2.0,0.1,10,160,39,0,38,3.0,6%,0%,10%,0%,0
240,Frappuccino® Blended Crème,Vanilla Bean (Without Whipped Cream),Soymilk,180,1.5,0.2,0.0,0,160,37,1,35,3.0,4%,0%,10%,6%,0


In [15]:
# Tag every Starbucks drink row with its restaurant ID (3000)
starbucks_drinks_df = starbucks_drinks_df.assign(**{'Restaurant ID': 3000})

In [16]:
# Fold the preparation (size / milk) into the beverage name, separated by one space,
# so each row carries a single descriptive label in 'Beverage'
starbucks_drinks_df = starbucks_drinks_df.assign(
    Beverage=lambda drinks: drinks['Beverage'] + ' ' + drinks['Beverage_prep']
)

In [17]:
# Standardise the Starbucks column names so they line up with the other menus.
# Some raw headers carry stray leading/trailing spaces (e.g. ' Calcium (% DV) '),
# and DataFrame.rename silently skips any key that does not match exactly.
# Trimming every header first lets the mapping use clean names and no longer
# depend on the exact padding in the file.
starbucks_drinks_df = (
    starbucks_drinks_df
    .rename(columns=str.strip)
    .rename(columns={
        'Beverage_category': 'Category',
        'Beverage': 'Item',
        'Total Carbohydrates (g)': 'Carbohydrates (g)',
        'Dietary Fibre (g)': 'Dietary Fiber (g)',
        'Vitamin A (% DV)': 'Vitamin A (% Daily Value)',
        'Vitamin C (% DV)': 'Vitamin C (% Daily Value)',
        'Calcium (% DV)': 'Calcium (% Daily Value)',
        'Iron (% DV)': 'Iron (% Daily Value)',
    })
)

In [18]:
# Remove stray whitespace from every column name.
# Stripping all headers generically replaces the hand-written list of padded names,
# which only worked while the padding in the file matched each key exactly
# (DataFrame.rename ignores keys it cannot find). The two headers that also need a
# wording change are renamed once they are trimmed.
starbucks_drinks_df = (
    starbucks_drinks_df
    .rename(columns=str.strip)
    .rename(columns={
        'Dietary Fibre (g)': 'Dietary Fiber (g)',
        'Vitamin A (% DV)': 'Vitamin A (% Daily Value)',
    })
)

In [None]:
# Keep only the standardised columns, restaurant ID first.
# 'Beverage_prep' and 'Caffeine (mg)' are not in the selection, so this cell removes them.
# NOTE(review): this cell has no execution count, and the stored outputs of later cells
# still show those two columns -- it appears not to have been run in the saved session.
starbucks_label_columns = ['Restaurant ID', 'Category', 'Item']
starbucks_nutrition_columns = [
    'Calories',
    'Total Fat (g)', 'Saturated Fat (g)', 'Trans Fat (g)',
    'Cholesterol (mg)', 'Sodium (mg)',
    'Carbohydrates (g)', 'Dietary Fiber (g)', 'Sugars (g)', 'Protein (g)',
    'Vitamin A (% Daily Value)', 'Vitamin C (% Daily Value)',
    'Calcium (% Daily Value)', 'Iron (% Daily Value)',
]
starbucks_drinks_df = starbucks_drinks_df[starbucks_label_columns + starbucks_nutrition_columns]

# Preview the frame to check the new layout
starbucks_drinks_df.head()

### Unification Process

In [19]:
# Stack the Subway and McDonald's menus into a single frame.
# Each source keeps its own row labels, so labels repeat across restaurants, and
# columns present in only one source ('Category ID', 'Item ID') are NaN for the other.
restaurant_frames = [subway_df, mcdonalds_df]
combined_df = pd.concat(restaurant_frames, axis=0)

# Show the stacked frame
combined_df

Unnamed: 0,Restaurant ID,Category ID,Item ID,Category,Item,Serving Size,Calories,Calories from Fat,Total Fat (g),Total Fat (% Daily Value),...,Carbohydrates (g),Carbohydrates (% Daily Value),Dietary Fiber (g),Dietary Fiber (% Daily Value),Sugars (g),Protein (g),Vitamin A (% Daily Value),Vitamin C (% Daily Value),Calcium (% Daily Value),Iron (% Daily Value)
0,1000,1.0,1.0,Breakfast,Egg McMuffin,4.8 oz (136 g),300,120,13.0,20,...,31,10,4,17,3,17,10,0,25,15
1,1000,1.0,1.0,Breakfast,Egg White Delight,4.8 oz (135 g),250,70,8.0,12,...,30,10,4,17,3,18,6,0,25,8
2,1000,1.0,1.0,Breakfast,Sausage McMuffin,3.9 oz (111 g),370,200,23.0,35,...,29,10,4,17,2,14,8,0,25,10
3,1000,1.0,1.0,Breakfast,Sausage McMuffin with Egg,5.7 oz (161 g),450,250,28.0,43,...,30,10,4,17,2,21,15,0,30,15
4,1000,1.0,1.0,Breakfast,Sausage McMuffin with Egg Whites,5.7 oz (161 g),400,210,23.0,35,...,30,10,4,17,2,21,6,0,25,10
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
255,2000,,,Smoothies & Shakes,McFlurry with Oreo Cookies (Small),10.1 oz (285 g),510,150,17.0,26,...,80,27,1,4,64,12,15,0,40,8
256,2000,,,Smoothies & Shakes,McFlurry with Oreo Cookies (Medium),13.4 oz (381 g),690,200,23.0,35,...,106,35,1,5,85,15,20,0,50,10
257,2000,,,Smoothies & Shakes,McFlurry with Oreo Cookies (Snack),6.7 oz (190 g),340,100,11.0,17,...,53,18,1,2,43,8,10,0,25,6
258,2000,,,Smoothies & Shakes,McFlurry with Reese's Peanut Butter Cups (Medium),14.2 oz (403 g),810,290,32.0,50,...,114,38,2,9,103,21,20,0,60,6


In [20]:
# Add the Starbucks drinks data frame to the combined data frame.
# The frame is rebuilt from the three source frames instead of appending onto the
# previous `combined_df`: the self-referential concat was not idempotent, so running
# this cell a second time appended the Starbucks rows again. The result of a single
# run is unchanged (same row order, same column union).
combined_df = pd.concat([subway_df, mcdonalds_df, starbucks_drinks_df])
combined_df

Unnamed: 0,Restaurant ID,Category ID,Item ID,Category,Item,Serving Size,Calories,Calories from Fat,Total Fat (g),Total Fat (% Daily Value),...,Dietary Fiber (g),Dietary Fiber (% Daily Value),Sugars (g),Protein (g),Vitamin A (% Daily Value),Vitamin C (% Daily Value),Calcium (% Daily Value),Iron (% Daily Value),Beverage_prep,Caffeine (mg)
0,1000,1.0,1.0,Breakfast,Egg McMuffin,4.8 oz (136 g),300,120.0,13,20.0,...,4,17.0,3,17.0,10,0,25,15,,
1,1000,1.0,1.0,Breakfast,Egg White Delight,4.8 oz (135 g),250,70.0,8,12.0,...,4,17.0,3,18.0,6,0,25,8,,
2,1000,1.0,1.0,Breakfast,Sausage McMuffin,3.9 oz (111 g),370,200.0,23,35.0,...,4,17.0,2,14.0,8,0,25,10,,
3,1000,1.0,1.0,Breakfast,Sausage McMuffin with Egg,5.7 oz (161 g),450,250.0,28,43.0,...,4,17.0,2,21.0,15,0,30,15,,
4,1000,1.0,1.0,Breakfast,Sausage McMuffin with Egg Whites,5.7 oz (161 g),400,210.0,23,35.0,...,4,17.0,2,21.0,6,0,25,10,,
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
237,3000,,,Frappuccino® Blended Crème,Strawberries & Crème (Without Whipped Cream) S...,,320,,3 2,,...,1,,64,5.0,6%,8%,20%,10%,Soymilk,0
238,3000,,,Frappuccino® Blended Crème,Vanilla Bean (Without Whipped Cream) Tall Nonf...,,170,,0.1,,...,0,,38,4.0,6%,0%,10%,0%,Tall Nonfat Milk,0
239,3000,,,Frappuccino® Blended Crème,Vanilla Bean (Without Whipped Cream) Whole Milk,,200,,3.5,,...,0,,38,3.0,6%,0%,10%,0%,Whole Milk,0
240,3000,,,Frappuccino® Blended Crème,Vanilla Bean (Without Whipped Cream) Soymilk,,180,,1.5,,...,1,,35,3.0,4%,0%,10%,6%,Soymilk,0


In [21]:
# Normalise every column name to lower case
combined_df.columns = combined_df.columns.map(str.lower)

In [23]:
# Create the ID numbers for the items: one sequential ID, starting at 1, per distinct name.
# enumerate() numbers every unique name. The earlier zip() against range(1, row_count)
# supplied only row_count - 1 IDs, so the last name was silently left without an ID
# whenever every row held a distinct item.
item_dict = {
    item_name: item_id
    for item_id, item_name in enumerate(combined_df['item'].unique(), start=1)
}

In [24]:
# Turn the item name -> ID lookup into a two-column table
item_id_df = pd.DataFrame({
    'item': list(item_dict.keys()),
    'id': list(item_dict.values()),
})

# Preview the lookup table
item_id_df.head()

Unnamed: 0,item,id
0,Egg McMuffin,1
1,Egg White Delight,2
2,Sausage McMuffin,3
3,Sausage McMuffin with Egg,4
4,Sausage McMuffin with Egg Whites,5


In [25]:
# Write the item lookup table to disk (header row kept, row index omitted)
item_id_df.to_csv(
    r'New Tables/item_id_df.csv',
    header=True,
    index=False,
)

In [26]:
# Replace the 'item id' column with the ID looked up from each row's item name
looked_up_item_ids = combined_df['item'].map(item_dict)
combined_df['item id'] = looked_up_item_ids
combined_df.head()

Unnamed: 0,restaurant id,category id,item id,category,item,serving size,calories,calories from fat,total fat (g),total fat (% daily value),...,dietary fiber (g),dietary fiber (% daily value),sugars (g),protein (g),vitamin a (% daily value),vitamin c (% daily value),calcium (% daily value),iron (% daily value),beverage_prep,caffeine (mg)
0,1000,1.0,1,Breakfast,Egg McMuffin,4.8 oz (136 g),300,120.0,13,20.0,...,4,17.0,3,17.0,10,0,25,15,,
1,1000,1.0,2,Breakfast,Egg White Delight,4.8 oz (135 g),250,70.0,8,12.0,...,4,17.0,3,18.0,6,0,25,8,,
2,1000,1.0,3,Breakfast,Sausage McMuffin,3.9 oz (111 g),370,200.0,23,35.0,...,4,17.0,2,14.0,8,0,25,10,,
3,1000,1.0,4,Breakfast,Sausage McMuffin with Egg,5.7 oz (161 g),450,250.0,28,43.0,...,4,17.0,2,21.0,15,0,30,15,,
4,1000,1.0,5,Breakfast,Sausage McMuffin with Egg Whites,5.7 oz (161 g),400,210.0,23,35.0,...,4,17.0,2,21.0,6,0,25,10,,


In [27]:
# Create the ID numbers for the categories: one sequential ID, starting at 100, per
# distinct category name.
# enumerate() numbers every unique name. The earlier zip() against
# range(100, row_count) stopped early (or produced nothing at all) whenever the frame
# had fewer than 100 + number_of_categories rows, leaving categories without an ID.
category_dict = {
    category_name: category_id
    for category_id, category_name in enumerate(combined_df['category'].unique(), start=100)
}

In [28]:
# Turn the category name -> ID lookup into a two-column table
category_rows = [(name, number) for name, number in category_dict.items()]
category_id_df = pd.DataFrame(category_rows, columns=['category', 'id'])

# Preview the lookup table
category_id_df.head()

Unnamed: 0,category,id
0,Breakfast,100
1,Beef & Pork,101
2,Chicken & Fish,102
3,Salads,103
4,Snacks & Sides,104


In [29]:
# Replace the 'category id' column with the ID looked up from each row's category name
looked_up_category_ids = combined_df['category'].map(category_dict)
combined_df['category id'] = looked_up_category_ids
combined_df.head()

Unnamed: 0,restaurant id,category id,item id,category,item,serving size,calories,calories from fat,total fat (g),total fat (% daily value),...,dietary fiber (g),dietary fiber (% daily value),sugars (g),protein (g),vitamin a (% daily value),vitamin c (% daily value),calcium (% daily value),iron (% daily value),beverage_prep,caffeine (mg)
0,1000,100,1,Breakfast,Egg McMuffin,4.8 oz (136 g),300,120.0,13,20.0,...,4,17.0,3,17.0,10,0,25,15,,
1,1000,100,2,Breakfast,Egg White Delight,4.8 oz (135 g),250,70.0,8,12.0,...,4,17.0,3,18.0,6,0,25,8,,
2,1000,100,3,Breakfast,Sausage McMuffin,3.9 oz (111 g),370,200.0,23,35.0,...,4,17.0,2,14.0,8,0,25,10,,
3,1000,100,4,Breakfast,Sausage McMuffin with Egg,5.7 oz (161 g),450,250.0,28,43.0,...,4,17.0,2,21.0,15,0,30,15,,
4,1000,100,5,Breakfast,Sausage McMuffin with Egg Whites,5.7 oz (161 g),400,210.0,23,35.0,...,4,17.0,2,21.0,6,0,25,10,,


In [30]:
# Write the category lookup table to disk (header row kept, row index omitted)
category_id_df.to_csv(
    r'New Tables/category_id_df.csv',
    header=True,
    index=False,
)

In [32]:
# Drop the text label columns (now represented by 'category id' / 'item id') and the
# Starbucks-only extras.
# 'beverage_prep' and 'caffeine (mg)' exist only if the Starbucks column-reorder cell
# was skipped; when that cell runs (e.g. Restart & Run All) they are already gone, and
# a strict drop would raise KeyError. They are therefore dropped with errors='ignore',
# while the label columns must be present and are still dropped strictly.
# Note: 'serving size' is still a text column after this step.
clean_combined_df = (
    combined_df
    .drop(columns=['category', 'item'])
    .drop(columns=['beverage_prep', 'caffeine (mg)'], errors='ignore')
)
clean_combined_df.head()

Unnamed: 0,restaurant id,category id,item id,serving size,calories,calories from fat,total fat (g),total fat (% daily value),saturated fat (g),saturated fat (% daily value),...,carbohydrates (g),carbohydrates (% daily value),dietary fiber (g),dietary fiber (% daily value),sugars (g),protein (g),vitamin a (% daily value),vitamin c (% daily value),calcium (% daily value),iron (% daily value)
0,1000,100,1,4.8 oz (136 g),300,120.0,13,20.0,5.0,25.0,...,31,10.0,4,17.0,3,17.0,10,0,25,15
1,1000,100,2,4.8 oz (135 g),250,70.0,8,12.0,3.0,15.0,...,30,10.0,4,17.0,3,18.0,6,0,25,8
2,1000,100,3,3.9 oz (111 g),370,200.0,23,35.0,8.0,42.0,...,29,10.0,4,17.0,2,14.0,8,0,25,10
3,1000,100,4,5.7 oz (161 g),450,250.0,28,43.0,10.0,52.0,...,30,10.0,4,17.0,2,21.0,15,0,30,15
4,1000,100,5,5.7 oz (161 g),400,210.0,23,35.0,8.0,42.0,...,30,10.0,4,17.0,2,21.0,6,0,25,10


Pending tasks:

- Decide how to proceed with Starbucks food menu
- Fix the serving size (Create two new columns with the two different sizes)
- Slice the clean_combined_df by restaurant
- Save as csv file the new data frames by restaurant
- Import the files to pgAdmin
- Create the report


In [None]:
#### This code is just a reference to understand how to add the IDs ### It will be removed later on

# Example of mapping a label column through a lookup dict; labels missing from the
# dict map to NaN. The result is not stored, and is not displayed either because it
# is not the last expression in the cell.
chains = {"Breakfast": 1}
subway_df["Category"].map(chains)

# Sequential IDs (starting at 1) for every distinct item name.
# enumerate() is used because zip() against range(1, row_count) supplies only
# row_count - 1 IDs and drops the last name when every row holds a distinct item.
item_dic_test = {
    item_name: item_id
    for item_id, item_name in enumerate(subway_df["Item"].unique(), start=1)
}