In [5]:
import pandas as pd

# Workbook that holds the raw experimental tables
excel_file_path = '../data/rawdata.xlsx'

try:
    # --- Table S5: column names are read from the second spreadsheet row ---
    df5 = pd.read_excel(excel_file_path, sheet_name='Table S5', header=1)
    df5.columns = df5.columns.str.strip()
    # Keep only the five columns of interest and map them onto the shared
    # naming scheme; rename() returns a new frame, so df5 is left untouched.
    df5_clean = df5[['cation', 'anion', 'T_K_', 'P_kPa_', 'x_CO2']].rename(
        columns={
            'T_K_': 'Temperature_K',
            'P_kPa_': 'Pressure_kPa',
            'x_CO2': 'CO2_solubility',
        }
    )
    print("Successfully loaded and cleaned 'Table S5'.")

    # --- Table S6: column names are read from the first spreadsheet row ---
    df6 = pd.read_excel(excel_file_path, sheet_name='Table S6', header=0)
    df6.columns = df6.columns.str.strip()
    # This sheet reports pressure in bar; add a kPa column (1 bar = 100 kPa)
    df6['P [kPa]'] = df6['P [bar]'].mul(100)
    # Same five columns, mapped onto the same shared names as Table S5
    df6_clean = df6[['cation', 'anion', 'T [K]', 'P [kPa]', 'x_CO2']].rename(
        columns={
            'T [K]': 'Temperature_K',
            'P [kPa]': 'Pressure_kPa',
            'x_CO2': 'CO2_solubility',
        }
    )
    print("Successfully loaded and cleaned 'Table S6'.")

    # --- Stack both tables, then discard every row that has a missing value ---
    df_combined = pd.concat([df5_clean, df6_clean], ignore_index=True)
    df_combined = df_combined.dropna()

    print(f"\nCombined dataset has a total of {len(df_combined)} data points.")

    # --- Persist the merged table as CSV (row index is not written) ---
    output_filename = '../data/cleaned_experimental_data_combined.csv'
    df_combined.to_csv(output_filename, index=False)

    print(f"Final combined data saved to '{output_filename}'")
    # One call, two lines of output: the banner, then the first rows
    print("\n--- Preview of Final Combined Data ---", df_combined.head(), sep="\n")

except Exception as err:
    # Cell-level boundary: report the failure instead of raising
    print(f"An error occurred: {err}")

Successfully loaded and cleaned 'Table S5'.
Successfully loaded and cleaned 'Table S6'.

Combined dataset has a total of 12005 data points.
Final combined data saved to '../data/cleaned_experimental_data_combined.csv'

--- Preview of Final Combined Data ---
       cation   anion  Temperature_K  Pressure_kPa  CO2_solubility
0  [(ETO)2IM]  [Tf2N]         323.85       22330.0           0.778
1  [(ETO)2IM]  [Tf2N]         323.95       10340.0           0.712
2  [(ETO)2IM]  [Tf2N]         343.55        7510.0           0.554
3  [(ETO)2IM]  [Tf2N]         324.15        7110.0           0.626
4  [(ETO)2IM]  [Tf2N]         363.15        5250.0           0.396
