In [2]:
import pandas as pd
import glob
import matplotlib.pyplot as plt
import seaborn as sns
import numpy as np

def load_and_analyze_files():
    # Get all CSV files for both tasks
    billsum_files = glob.glob('./Billsum*.csv')
    squad_files = glob.glob('./SQuAD*.csv')

    # Function to extract model info from filename
    def get_model_info(filename):
        parts = filename.split('-')
        task = 'Billsum' if 'Billsum' in filename else 'SQuAD'
        norm_type = 'LN' if 'LN' in filename else 'RMSN'
        variant = parts[-2].split('/')[-1]  # Extract variant name
        metric_type = 'grad_norm' if 'grad-norm' in filename else 'loss_train'
        return task, norm_type, variant, metric_type

    # Dictionary to store DataFrames
    all_data = {}

    # Load files and examine structure
    for file in billsum_files + squad_files:
        task, norm_type, variant, metric_type = get_model_info(file)
        key = f"{task}-{norm_type}-{variant}-{metric_type}"
        df = pd.read_csv(file)
        all_data[key] = df
        print(f"\nLoaded {key}")
        print(f"Shape: {df.shape}")
        print("Columns:", df.columns.tolist())
        print("First few rows:")
        print(df.head())
        print("-" * 50)

    return all_data

# Run the analysis
data_dict = load_and_analyze_files()


Loaded Billsum-RMSN- RMSN AttnOnly train-loss_train
Shape: (6666, 4)
Columns: ['Step', 'lemon-disco-5 - train/loss', 'lemon-disco-5 - train/loss__MIN', 'lemon-disco-5 - train/loss__MAX']
First few rows:
   Step  lemon-disco-5 - train/loss  lemon-disco-5 - train/loss__MIN  \
0     0                      5.6705                           5.6705   
1     1                      5.6705                           5.6705   
2     2                      5.8682                           5.8682   
3     3                      5.8682                           5.8682   
4     4                      5.6944                           5.6944   

   lemon-disco-5 - train/loss__MAX  
0                           5.6705  
1                           5.6705  
2                           5.8682  
3                           5.8682  
4                           5.6944  
--------------------------------------------------

Loaded Billsum-LN- LN noNorm grad-grad_norm
Shape: (6666, 4)
Columns: ['Step', 'gallant-t