In [None]:
# generate_and_test.ipynb

# This notebook demonstrates how to use the Dataset Generator to create and inspect data.

# Import required libraries
import pandas as pd
import os
from scripts.generate_users import generate_user_data
from scripts.generate_time_series import generate_time_series
from scripts.generate_images import generate_images
from IPython.display import Image, display

# Step 1: Build the synthetic user dataset (100 records requested)
print("Generating synthetic user data...")
generate_user_data(num_records=100)

# Preview the CSV expected under data/ after generation.
# The missing-file case is handled first so the happy path reads straight through.
user_file_path = os.path.join("data", "synthetic_user_data.csv")
if not os.path.exists(user_file_path):
    print("User dataset file not found.")
else:
    user_df = pd.read_csv(user_file_path)
    # Single print call: heading, newline separator, then the head() preview.
    print("\nSample of the generated user data:", user_df.head(), sep="\n")

# Step 2: Build the synthetic time-series dataset (50 records requested)
print("\nGenerating synthetic time-series data...")
generate_time_series(num_records=50)

# Preview the CSV expected under data/ after generation.
# The missing-file case is handled first so the happy path reads straight through.
time_series_file_path = os.path.join("data", "synthetic_time_series.csv")
if not os.path.exists(time_series_file_path):
    print("Time-series dataset file not found.")
else:
    time_series_df = pd.read_csv(time_series_file_path)
    # Single print call: heading, newline separator, then the head() preview.
    print(
        "\nSample of the generated time-series data:",
        time_series_df.head(),
        sep="\n",
    )

# Step 3: Generate synthetic images
# The requested count lives in one variable so the preview limit below always
# matches the number of images asked for.
image_count = 5
print("\nGenerating synthetic images...")
generate_images(num_images=image_count)

# Display synthetic images
image_dir = os.path.join("data", "synthetic_images")
# isdir (rather than exists) so a stray regular file with this name is reported
# as "not found" instead of making os.listdir() raise NotADirectoryError.
if os.path.isdir(image_dir):
    # os.listdir() returns entries in arbitrary order; sorting the names makes
    # the selection of previewed images deterministic from run to run.
    image_files = sorted(f for f in os.listdir(image_dir) if f.endswith(".png"))
    print("\nDisplaying generated images:")
    for image_file in image_files[:image_count]:  # Display up to image_count images
        display(Image(filename=os.path.join(image_dir, image_file)))
else:
    print("Image directory not found.")
