In [None]:
# Prepare cleaned, aggregated data specifically for Power BI
import os

import pandas as pd

# 1. Load all necessary data
# Each CSV is read with pandas defaults, in the order listed, and bound to the
# name in the same position on the left-hand side.
(
    daily_sales,      # processed/daily_sales_agg.csv
    forecast_data,    # model_outputs/sales_forecast_90days.csv
    customers,        # model_outputs/customers_segmented.csv
    products,         # model_outputs/product_analysis.csv
    processed_data,   # processed/fully_processed.csv
) = (
    pd.read_csv(csv_path)
    for csv_path in (
        '/content/drive/MyDrive/GlobalSuperstore_Project/data/processed/daily_sales_agg.csv',
        '/content/drive/MyDrive/GlobalSuperstore_Project/data/model_outputs/sales_forecast_90days.csv',
        '/content/drive/MyDrive/GlobalSuperstore_Project/data/model_outputs/customers_segmented.csv',
        '/content/drive/MyDrive/GlobalSuperstore_Project/data/model_outputs/product_analysis.csv',
        '/content/drive/MyDrive/GlobalSuperstore_Project/data/processed/fully_processed.csv',
    )
)

In [None]:
# 2. Create aggregated datasets for Power BI

# Sales by Region-Month
# Bucket every row into its calendar month. The derived Series is used directly
# as a grouping key alongside the geographic columns.
order_month = pd.to_datetime(processed_data['Order Date']).dt.to_period('M')
region_month_keys = [order_month, 'Region_Encoded', 'Country', 'State', 'City']

# Totals per group; 'Order ID' is reduced to the number of distinct IDs.
region_month_metrics = {
    'Sales': 'sum',
    'Profit': 'sum',
    'Quantity': 'sum',
    'Order ID': 'nunique',
}

sales_by_region_month = (
    processed_data
    .groupby(region_month_keys)
    .agg(region_month_metrics)
    .reset_index()
)

In [None]:
# Customer Performance
# One row per customer: sales total / row count / average, profit total /
# average, and first / last order date.

# 'Order Date' is loaded without date parsing, so min/max on the raw column
# would compare text. Convert it first (the same pd.to_datetime call the
# region-month aggregation uses) so first/last order are chronological.
customer_orders = processed_data.assign(
    **{'Order Date': pd.to_datetime(processed_data['Order Date'])}
)

customer_performance = customer_orders.groupby('Customer ID').agg({
    'Sales': ['sum', 'count', 'mean'],
    'Profit': ['sum', 'mean'],
    'Order Date': ['min', 'max']
}).reset_index()

# List-valued aggregations yield two-level column labels, which to_csv writes
# as two header rows. Collapse them to single names such as 'Sales_sum' and
# 'Order Date_min' ('Customer ID' has an empty second level and stays as is)
# so the exported file has exactly one header row.
customer_performance.columns = [
    '_'.join(level for level in column if level)
    for column in customer_performance.columns
]

In [None]:
# Product Category Performance
# Sum sales, profit and quantity for every (Category, Sub-Category) pair.
category_keys = ['Category', 'Sub-Category']
category_totals = dict.fromkeys(('Sales', 'Profit', 'Quantity'), 'sum')

category_performance = (
    processed_data
    .groupby(category_keys)
    .agg(category_totals)
    .reset_index()
)

In [None]:
# 3. Save to Power BI folder
powerbi_path = '/content/drive/MyDrive/GlobalSuperstore_Project/powerbi'

# to_csv does not create missing directories, so make sure the target exists.
os.makedirs(powerbi_path, exist_ok=True)

# Output file name -> frame to export. The names match the original exports.
powerbi_exports = {
    'sales_region_month.csv': sales_by_region_month,
    'customer_performance.csv': customer_performance,
    'category_performance.csv': category_performance,
    'daily_sales.csv': daily_sales,
    'sales_forecast.csv': forecast_data,
    'customer_segments.csv': customers,
    'product_analysis.csv': products,
}

for filename, frame in powerbi_exports.items():
    # Join with a path separator: plain string concatenation would produce
    # '.../powerbisales_region_month.csv' in the parent folder instead of a
    # file inside the powerbi folder.
    frame.to_csv(os.path.join(powerbi_path, filename), index=False)

print(" Power BI data created")
print(f"Location: {powerbi_path}")

 Power BI data created
Location: /content/drive/MyDrive/GlobalSuperstore_Project/powerbi
