## Advanced Consistency Check with Hierarchical Data

**Description**: You have two datasets, `orders.csv` and `order_items.csv`. Perform a consistency check to ensure that each order in `orders.csv` has corresponding items in `order_items.csv`.

In [None]:
# Write your code from here
import pandas as pd

def find_order_mismatches(orders, order_items, key='order_id'):
    """Compare the order identifiers of an orders table and an items table.

    Args:
        orders: DataFrame of orders; must contain the ``key`` column.
        order_items: DataFrame of order items; must contain the ``key`` column.
        key: Name of the column that links the two tables.

    Returns:
        A tuple ``(orders_without_items, orphan_item_order_ids)``:
        the set of identifiers present in ``orders`` but absent from
        ``order_items``, and the set present in ``order_items`` but absent
        from ``orders``.

    Raises:
        KeyError: If ``key`` is not a column of either DataFrame.
    """
    # Missing identifiers are dropped before building the sets: NaN never
    # compares equal to itself, so every blank cell would otherwise become its
    # own set member and be reported as a separate mismatch.
    order_ids = set(orders[key].dropna())
    item_order_ids = set(order_items[key].dropna())
    return order_ids - item_order_ids, item_order_ids - order_ids


# Load the datasets
orders = None
order_items = None
try:
    orders = pd.read_csv('orders.csv')
    order_items = pd.read_csv('order_items.csv')
except FileNotFoundError:
    # No exit() here: it is an interactive helper injected by `site`, and in a
    # notebook it shuts the kernel down. The None check below skips the
    # analysis instead.
    print("Error: One or both of the CSV files were not found. Please ensure 'orders.csv' and 'order_items.csv' are in the correct directory.")

if orders is None or order_items is None:
    print("Could not proceed with the consistency check due to missing datasets.")
elif 'order_id' not in orders.columns or 'order_id' not in order_items.columns:
    # 'order_id' is assumed to be the common identifier linking the datasets
    print("Error: 'order_id' column not found in one or both of the datasets. Ensure 'order_id' is the common identifier.")
else:
    orders_without_items, orphan_item_order_ids = find_order_mismatches(orders, order_items)

    if orders_without_items:
        print("Consistency Check Result: Found orders without corresponding items in 'order_items.csv':")
        print(f"Number of orders without items: {len(orders_without_items)}")
        # To list the offending orders, print sorted(orders_without_items).
    else:
        print("Consistency Check Result: All orders in 'orders.csv' have corresponding items in 'order_items.csv'.")

    # Reverse direction: item rows pointing at an order that does not exist
    # (might indicate data integrity issues).
    if orphan_item_order_ids:
        # Count item rows rather than distinct order IDs so the figure matches
        # the "Number of items" label. Rows with a blank order_id are excluded.
        orphan_item_rows = int(order_items['order_id'].isin(list(orphan_item_order_ids)).sum())
        print("\nPotential Data Integrity Issue: Found items in 'order_items.csv' without a corresponding order in 'orders.csv':")
        print(f"Number of items without a corresponding order: {orphan_item_rows}")
        # To list the unknown orders, print sorted(orphan_item_order_ids).
    

Error: One or both of the CSV files were not found. Please ensure 'orders.csv' and 'order_items.csv' are in the correct directory.
Could not proceed with the consistency check due to missing datasets.


: 