In [1]:
import pandas as pd
import numpy as np

# --- Configuration -----------------------------------------------------------
# Fixed seed + dedicated Generator so that "Restart Kernel -> Run All" always
# regenerates exactly the same dataset (the global np.random state is unseeded).
SEED = 42
rng = np.random.default_rng(SEED)

# NOTE: 25 * 365 ignores the 7 leap days in 2000-2024, so the daily range
# below ends on 2024-12-24 rather than 2024-12-31. Kept as-is so the row
# count (9125) stays stable for downstream consumers.
num_days = 25 * 365
dates = pd.date_range(start="2000-01-01", periods=num_days, freq='D')
t = np.arange(num_days)  # integer day index: 0 .. num_days - 1

# --- Simulated daily activity ------------------------------------------------
# Each series is: baseline + sinusoidal cycle + Gaussian noise.
#   fuel: 365-day cycle around 20,000 with amplitude 10,000, noise sd 2,000
#   coal: 180-day cycle around 50,000 with amplitude 20,000, noise sd 5,000
# Draw order (fuel first, then coal) matters for reproducibility with `rng`.
fuel_used = 20000 + 10000 * np.sin(2 * np.pi * t / 365) + rng.normal(0, 2000, num_days)
coal_mined = 50000 + 20000 * np.sin(2 * np.pi * t / 180) + rng.normal(0, 5000, num_days)

# Clamp both series to fixed [lower, upper] bounds. This guards against
# negative/near-zero values AND caps extreme noise spikes at the top end.
fuel_used = np.clip(fuel_used, 500, 50000)
coal_mined = np.clip(coal_mined, 1000, 100000)

# --- Emission factors --------------------------------------------------------
CO2_PER_LITER = 2.68   # kg CO2 emitted per liter of fuel burned
CARBON_PERCENT = 0.35  # fraction of mined coal mass counted as carbon
CO2_PER_KG_C = 3.67    # kg CO2 per kg of carbon (approx. 44/12 molar-mass ratio)

# --- Derived quantities ------------------------------------------------------
co2_emitted = fuel_used * CO2_PER_LITER
# coal_mined is in tonnes; * 1000 converts to kg before applying the carbon share.
trapped_carbon = coal_mined * 1000 * CARBON_PERCENT
potential_co2 = trapped_carbon * CO2_PER_KG_C

# --- Assemble and persist ----------------------------------------------------
df = pd.DataFrame({
    "Date": dates,
    "Fuel_Used_Liters": fuel_used,
    "Coal_Mined_Tonnes": coal_mined,
    "CO2_Emitted_kg": co2_emitted,
    "Trapped_Carbon_kg": trapped_carbon,
    "Potential_CO2_from_Coal_kg": potential_co2
})

# Written relative to the current working directory; index is omitted because
# "Date" is already a regular column.
df.to_csv("highrange_25yrs_indian_coalmine_data.csv", index=False)
print("High-range dataset saved.")


High-range dataset saved.
