In [None]:
import os
from pathlib import Path
import pandas as pd

# Root directory under which all category and dataset folders are created
base_folder = "XAI_Models"

# Maps each problem category to the names of the dataset folders it contains
data_categories = {
    "binary": [
        "adult_income",
        "bank_customer_churn",
    ],
    "time_series": [
        "dataset3",
        "dataset4",
    ],
    "multiclass": [
        "dataset5",
        "dataset6",
    ],
}

# Create the folder structure
def create_folder_structure(base=None, categories=None):
    """Create one directory per category and one sub-directory per dataset.

    Directories that already exist are left untouched, so the function can
    be called repeatedly.

    Args:
        base: Root directory (string or path-like) to create the tree under.
            Defaults to the module-level ``base_folder``.
        categories: Mapping of category name to an iterable of dataset
            names. Defaults to the module-level ``data_categories``.
    """
    # Resolve the defaults at call time so later changes to the module-level
    # settings are picked up by argument-less calls.
    root = Path(base_folder if base is None else base)
    layout = data_categories if categories is None else categories

    for category, datasets in layout.items():
        category_path = root / category
        # Created explicitly so a category with no datasets still gets a folder.
        category_path.mkdir(parents=True, exist_ok=True)
        for dataset in datasets:
            (category_path / dataset).mkdir(exist_ok=True)

# Download the Adult Income dataset and save it under binary/adult_income
def download_and_save_dataset(
    url="https://archive.ics.uci.edu/ml/machine-learning-databases/adult/adult.data",
    base=None,
):
    """Load the Adult Income data and write it as a CSV with a header row.

    The source is read as a header-less, comma-separated file; the fifteen
    column names below are assigned to it, and the result is written to
    ``<base>/binary/adult_income/adult_income.csv``. The destination
    directory is created if it does not exist.

    Args:
        url: Location of the raw data; anything ``pandas.read_csv`` accepts
            (URL or local path). Defaults to the UCI repository URL.
        base: Root directory (string or path-like) of the folder tree.
            Defaults to the module-level ``base_folder``.

    Raises:
        Whatever ``pandas.read_csv`` or the filesystem calls raise, e.g.
        when the source cannot be fetched or the destination is not writable.
    """
    dataset_name = "adult_income"
    root = Path(base_folder if base is None else base)
    # Build the path from dataset_name so folder and file names cannot drift.
    dataset_path = root / "binary" / dataset_name
    dataset_path.mkdir(parents=True, exist_ok=True)

    # Load dataset; the raw file carries no header row, so names are supplied.
    columns = [
        "age", "workclass", "fnlwgt", "education", "education-num", "marital-status",
        "occupation", "relationship", "race", "sex", "capital-gain", "capital-loss",
        "hours-per-week", "native-country", "income"
    ]
    # skipinitialspace drops the blank that follows each comma in the raw file.
    df = pd.read_csv(url, header=None, names=columns, skipinitialspace=True)

    # Save as CSV
    csv_file = dataset_path / f"{dataset_name}.csv"
    df.to_csv(csv_file, index=False)
    print(f"Dataset downloaded and saved as '{csv_file}'")

def main():
    """Build the folder tree, fetch the dataset, then report completion."""
    create_folder_structure()
    download_and_save_dataset()
    print(f"Folder structure created successfully under '{base_folder}'!")


# Run the setup only when executed as a script (or notebook cell)
if __name__ == "__main__":
    main()


Dataset downloaded and saved as 'XAI_Models\binary\adult_income\adult_income.csv'
Folder structure created successfully under 'XAI_Models'!
