## Ensuring Consistency in Multi-source Data Integration

**Description**: Validate the integration of two datasets, `products_A.csv` and `products_B.csv`. Ensure that the product "category" information is consistent between the two sources for every shared `product_id`.

In [None]:
#
import pandas as pd
products_a = None
products_b = None


def find_inconsistent_categories(merged):
    """Return the rows of ``merged`` whose two category values disagree.

    The comparison is case-insensitive. A product whose category is missing
    in both datasets is treated as consistent; a category missing on only one
    side is reported as inconsistent.

    Args:
        merged: DataFrame containing 'category_A' and 'category_B' columns,
            as produced by merging the two product tables with the
            ('_A', '_B') suffixes.

    Returns:
        The subset of ``merged`` (all columns, original index) where the
        categories differ.

    Raises:
        KeyError: if 'category_A' or 'category_B' is not a column of ``merged``.
    """
    category_a = merged['category_A']
    category_b = merged['category_B']
    # Handle "missing on both sides" explicitly instead of relying on how
    # astype(str) happens to render missing values.
    both_missing = category_a.isna() & category_b.isna()
    differs = category_a.astype(str).str.lower() != category_b.astype(str).str.lower()
    return merged[differs & ~both_missing]


try:
    products_a = pd.read_csv('products_A.csv')
    products_b = pd.read_csv('products_B.csv')
except FileNotFoundError:
    # Deliberately no exit() here: in a Jupyter kernel it requests a kernel
    # shutdown rather than ending the cell, and the guard below already skips
    # the validation when a dataset is missing.
    print("Error: One or both of the CSV files were not found. Please ensure 'products_A.csv' and 'products_B.csv' are in the correct directory.")

if products_a is None or products_b is None:
    print("Could not proceed with validating product category consistency due to missing datasets.")
elif 'product_id' not in products_a.columns or 'product_id' not in products_b.columns:
    # Without the join key pd.merge would raise a bare KeyError; report it in
    # the same style as the other validation errors instead.
    print("Error: One or both datasets do not have a 'product_id' column. Please check the column names.")
else:
    # Inner join: only products present in both datasets can be compared.
    merged_products = pd.merge(products_a, products_b, on='product_id', how='inner', suffixes=('_A', '_B'))
    # The suffixes are only applied when BOTH inputs carry a 'category' column,
    # so the presence of both suffixed names confirms each dataset has one.
    if 'category_A' in merged_products.columns and 'category_B' in merged_products.columns:
        inconsistent_categories = find_inconsistent_categories(merged_products)
        if not inconsistent_categories.empty:
            print("Products with Inconsistent Category Information (Case-Insensitive) Across Datasets:")
            print(inconsistent_categories[['product_id', 'category_A', 'category_B']])
            print(f"\nNumber of products with inconsistent categories (case-insensitive): {len(inconsistent_categories)}")
        else:
            print("No products found with inconsistent category information (case-insensitive) across the datasets.")
    else:
        print("Error: One or both datasets do not have a 'category' column after merging (with suffixes '_A' and '_B'). Please check the column names.")

Error: One or both of the CSV files were not found. Please ensure 'products_A.csv' and 'products_B.csv' are in the correct directory.
Could not proceed with validating product category consistency due to missing datasets.


: 