# Data Generation - Ethiopia Sales Data

This notebook generates synthetic sales data for Ethiopian business forecasting.

## Objectives
- Generate realistic sales transactions
- Include Ethiopian context (regions, products, holidays)
- Add seasonality and trends
- Create comprehensive dataset for analysis


In [None]:
# Import libraries
import sys
sys.path.append('..')

import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
import seaborn as sns
from datetime import datetime, timedelta
import os

from src.data_generator import EthiopiaSalesDataGenerator

# Set style: apply seaborn's 'whitegrid' theme and make (12, 6) the default
# matplotlib figure size (width, height) for plots created after this cell.
sns.set_style('whitegrid')
plt.rcParams['figure.figsize'] = (12, 6)

# Confirmation message; the leading character is a check mark (U+2713).
print("✓ Libraries imported successfully")


## 1. Initialize Data Generator


In [None]:
# Build the sales-data generator from an explicit settings mapping.
# NOTE(review): seed=42 is presumably there for reproducible output —
# confirm against EthiopiaSalesDataGenerator.
generator_settings = {
    'start_date': '2020-01-01',
    'end_date': '2024-10-31',
    'seed': 42,
}
generator = EthiopiaSalesDataGenerator(**generator_settings)

# Echo the configuration attributes exposed by the generator, one per line.
print(
    "Data Generator Configuration:",
    f"Start Date: {generator.start_date}",
    f"End Date: {generator.end_date}",
    f"Regions: {generator.regions}",
    f"Product Categories: {generator.product_categories}",
    sep="\n",
)


## 2. Generate Sales Data


In [None]:
# Run the generator and keep its result in `df`.
df = generator.generate_sales_data()

# Report the row count and shape, then a header for the preview below.
n_transactions = len(df)
print(
    f"Generated {n_transactions} transactions",
    f"\nDataset Shape: {df.shape}",
    "\nFirst few rows:",
    sep="\n",
)

# Kept as the cell's final expression so the notebook displays the result
# of head(10) (the first 10 rows, assuming `df` is a pandas DataFrame).
df.head(10)
