In [5]:
import pandas as pd

# Load the users.json file
users = pd.read_json("users.json")

# Load the orders.csv file
orders = pd.read_csv("orders.csv")

# Load the restaurants.csv file (assuming it exists and contains restaurant ratings)
# If restaurants.csv does not exist, please upload it or specify the correct file.
try:
    restaurants = pd.read_csv("restaurants.csv")
except FileNotFoundError:
    print("Error: 'restaurants.csv' not found. Please ensure the file is uploaded or specify the correct filename.")
    # If the file is named restaurants.sql and contains actual data, you might need a different loading mechanism.
    # For now, we'll assume a CSV. If it's SQL, further steps would be needed to load it into a DataFrame.
    restaurants = pd.DataFrame(columns=['restaurant_id', 'restaurant_rating']) # Create empty df to avoid further errors

# Merge orders with users on user_id
data = orders.merge(users, on="user_id", how="left")

# Merge restaurant data with the main data on restaurant_id
data = data.merge(restaurants, on="restaurant_id", how="left")

# 1. Total orders placed by Gold members
gold_orders = data[data["membership"] == "Gold"]
total_gold_orders = len(gold_orders)

# 2. Total revenue generated from orders placed in Hyderabad city
hyderabad_revenue = round(data[data["city"] == "Hyderabad"]["total_amount"].sum())

# 3. Distinct users who placed at least one order
distinct_users = data["user_id"].nunique()

# 4. Average order value for Gold members (rounded to 2 decimals)
avg_gold_order_value = round(gold_orders["total_amount"].mean(), 2)

# 5. Orders placed for restaurants with rating \u2265 4.5
high_rating_orders = len(data[data["restaurant_rating"] >= 4.5])

# 6. Orders placed in the top revenue city among Gold members only
gold_city_revenue = gold_orders.groupby("city")["total_amount"].sum()
top_gold_city = gold_city_revenue.idxmax()
orders_in_top_gold_city = len(gold_orders[gold_orders["city"] == top_gold_city])

# Print results
print("1. Total orders by Gold members:", total_gold_orders)
print("2. Total revenue from Hyderabad:", hyderabad_revenue)
print("3. Distinct users who placed orders:", distinct_users)
print("4. Average order value (Gold members):", avg_gold_order_value)
print("5. Orders with restaurant rating \u2265 4.5:", high_rating_orders)
print("6. Orders in top revenue city (Gold members):", orders_in_top_gold_city)


Error: 'restaurants.csv' not found. Please ensure the file is uploaded or specify the correct filename.
1. Total orders by Gold members: 4987
2. Total revenue from Hyderabad: 1889367
3. Distinct users who placed orders: 2883
4. Average order value (Gold members): 797.15
5. Orders with restaurant rating â‰¥ 4.5: 0
6. Orders in top revenue city (Gold members): 1337


In [2]:
from google.colab import files

# Upload files
uploaded = files.upload()

Saving food-delivery-hackathon.zip to food-delivery-hackathon.zip
Saving restaurants.sql to restaurants.sql
Saving users.json to users.json
Saving orders.csv to orders.csv
