In [None]:
import pandas as pd
import os

# Define the directory containing the files
directory = 'forecast_files'


def aggregate_pnl(directory, forecast_col=0, real_col=3):
    """Sum ``real - forecast`` per row label across the CSV files in a directory.

    Every entry of *directory* whose name ends in ``.csv`` is loaded with
    ``pandas.read_csv``.  For each file the column at position
    *forecast_col* is subtracted from the column at position *real_col*,
    and each row's difference is added to a running total keyed by that
    row's index label.

    NOTE(review): ``read_csv`` is called without ``index_col``, so the row
    labels are normally the default 0, 1, 2, ... positions.  Totals are
    therefore matched across files by row position, not by an instrument
    name -- confirm that every file lists its instruments in the same
    row order.

    NOTE(review): a NaN difference turns that row's total into NaN for
    the rest of the run, because plain ``+`` is used for accumulation.

    Args:
        directory: Path of the directory to scan (not recursive).
        forecast_col: Positional index of the forecast column.
        real_col: Positional index of the real-data column.

    Returns:
        A dict mapping row label to the summed difference.  Empty when the
        directory contains no ``.csv`` files.

    Raises:
        FileNotFoundError: If *directory* does not exist.
        IndexError: If a file has no column at one of the requested
            positions; the message names the offending file.
    """
    totals = {}

    # os.listdir returns names in arbitrary order; sorting keeps the
    # accumulation order (and so the float rounding) reproducible.
    for filename in sorted(os.listdir(directory)):
        if not filename.endswith('.csv'):
            continue

        file_path = os.path.join(directory, filename)
        df = pd.read_csv(file_path)

        try:
            forecast = df.iloc[:, forecast_col]
            real_data = df.iloc[:, real_col]
        except IndexError as err:
            # Same exception type pandas raises, but say which file is short.
            raise IndexError(
                "{}: cannot read column positions {} and {} from a file "
                "with {} column(s)".format(
                    file_path, forecast_col, real_col, df.shape[1]
                )
            ) from err

        pnl = real_data - forecast

        for row_label, pnl_value in pnl.items():
            totals[row_label] = totals.get(row_label, 0) + pnl_value

    return totals


def save_pnl_summary(pnl_by_row, output_path='pnl_summary.csv'):
    """Write the aggregated PNL to *output_path* and return it as a DataFrame.

    Args:
        pnl_by_row: Mapping of row label to summed PNL, as returned by
            ``aggregate_pnl``.
        output_path: Destination CSV path.

    Returns:
        A DataFrame with the columns ``Instrument`` and ``PNL``, one row
        per key of *pnl_by_row* in the mapping's iteration order.
    """
    summary = pd.DataFrame(list(pnl_by_row.items()), columns=['Instrument', 'PNL'])
    summary.to_csv(output_path, index=False)
    return summary


# Run the pipeline only when executed as a script or notebook cell, so the
# helpers above can be imported without touching the filesystem.
if __name__ == "__main__":
    # Aggregate the PNL over every forecast file
    pnl_dict = aggregate_pnl(directory)

    # Convert the PNL dictionary to a DataFrame and save it to a CSV file
    pnl_df = save_pnl_summary(pnl_dict)

    print("PNL summary has been saved to 'pnl_summary.csv'")