In [1]:
import random
from pathlib import Path

import numpy as np
import pandas as pd

# Seed both random number generators so each run yields the same dataset
random.seed(42)
np.random.seed(42)

# Entities covered by the simulation
hospitals = ['Hosp_A', 'Hosp_B', 'Hosp_C']
drugs = ['Paracetamol', 'Ibuprofen', 'Amoxicillin', 'Metformin', 'Atorvastatin']

# 60 consecutive daily timestamps beginning 2024-01-01
dates = pd.date_range(start='2024-01-01', periods=60)

# One record per (date, hospital, drug) combination, with drug varying fastest.
# List elements are evaluated left to right, so for every record the inventory
# value is drawn from the RNG before the demand value.
data = [
    [
        day,
        site,
        medication,
        np.random.randint(50, 200),  # current stock level, upper bound exclusive
        np.random.randint(10, 100),  # expected usage, upper bound exclusive
    ]
    for day in dates
    for site in hospitals
    for medication in drugs
]

# Assemble the records into a labelled table
df = pd.DataFrame(
    data,
    columns=['date', 'hospital_id', 'drug_name', 'inventory', 'demand'],
)

# Show the first few rows
df.head()


Unnamed: 0,date,hospital_id,drug_name,inventory,demand
0,2024-01-01,Hosp_A,Paracetamol,152,61
1,2024-01-01,Hosp_A,Ibuprofen,142,24
2,2024-01-01,Hosp_A,Amoxicillin,156,81
3,2024-01-01,Hosp_A,Metformin,70,92
4,2024-01-01,Hosp_A,Atorvastatin,124,84


In [2]:
# Save the full dataset.
# DataFrame.to_csv does not create missing parent directories, so make sure
# the target folder exists first; without this the cell raises OSError on a
# fresh checkout where ../data has not been created yet.
output_path = Path('../data/inventory.csv')
output_path.parent.mkdir(parents=True, exist_ok=True)  # no-op when the folder already exists
df.to_csv(output_path, index=False)  # index=False keeps the row index out of the file
print("Dataset saved to data/inventory.csv")


Dataset saved to data/inventory.csv


In [3]:
# Write one CSV per hospital, each containing only that hospital's rows
for hospital in hospitals:
    belongs_to_hospital = df['hospital_id'].eq(hospital)  # boolean row mask
    df_hosp = df.loc[belongs_to_hospital]
    df_hosp.to_csv(f'../data/inventory_{hospital}.csv', index=False)
    print(f"Saved: inventory_{hospital}.csv")


Saved: inventory_Hosp_A.csv
Saved: inventory_Hosp_B.csv
Saved: inventory_Hosp_C.csv
