In [1]:
import pandas as pd
import os

# Folder containing the CSV files
folder_path = os.getcwd()

# Name of the merged output file. It is written into `folder_path`, so it must
# be excluded from the inputs in case the CSVs were already joined by an
# earlier run.
OUTPUT_FILE = 'full_all_predictions.csv'

# Column every input file is joined on.
DATE_COLUMN = 'DATE'


def prepare_frame(df):
    """Clean one loaded table so it can be joined on the DATE column.

    Parameters
    ----------
    df : pandas.DataFrame
        Table as returned by ``pd.read_csv``.

    Returns
    -------
    pandas.DataFrame or None
        A new frame with DATE parsed to datetime and every column whose name
        starts with ``Unnamed`` removed, or ``None`` when ``df`` has no DATE
        column (such a table cannot take part in the join).
    """
    if DATE_COLUMN not in df.columns:
        return None

    # Ensure the DATE column is in datetime format (assign() returns a new
    # frame, so the caller's table is left untouched).
    df = df.assign(**{DATE_COLUMN: pd.to_datetime(df[DATE_COLUMN])})

    # Drop unnecessary columns
    return df.loc[:, ~df.columns.str.contains('^Unnamed')]


def merge_on_date(frames):
    """Outer-join ``frames`` on the DATE column and sort the result by DATE.

    Parameters
    ----------
    frames : list of pandas.DataFrame
        Tables that each contain a DATE column.

    Returns
    -------
    pandas.DataFrame
        The merged table sorted by DATE. An empty list yields an empty frame
        that only has the DATE column, instead of raising ``IndexError``.
    """
    if not frames:
        return pd.DataFrame(columns=[DATE_COLUMN])

    # NOTE(review): non-DATE columns that share a name across files get
    # pandas' default '_x' / '_y' suffixes -- confirm the inputs use distinct
    # column names.
    merged = frames[0]
    for frame in frames[1:]:
        merged = pd.merge(merged, frame, on=DATE_COLUMN, how='outer')

    return merged.sort_values(by=DATE_COLUMN)


# Get a list of all CSV files in the folder, excluding the merged output.
# Sorted because os.listdir() returns names in arbitrary order, which would
# otherwise make the column order of the result vary between runs.
csv_files = sorted(
    f for f in os.listdir(folder_path)
    if f.endswith('.csv') and f != OUTPUT_FILE
)

# Read each CSV file into a DataFrame
dataframes = []
for file in csv_files:
    file_path = os.path.join(folder_path, file)
    df = prepare_frame(pd.read_csv(file_path))
    if df is None:
        # Without a DATE column the merge below would fail with a KeyError.
        print(f"Skipping {file}: no '{DATE_COLUMN}' column to join on")
        continue
    dataframes.append(df)

# Perform outer join on the DATE column, sorted by DATE
merged_df = merge_on_date(dataframes)

if dataframes:
    merged_df.to_csv(os.path.join(folder_path, OUTPUT_FILE), index=False)
else:
    print(f"No CSV files with a '{DATE_COLUMN}' column found in {folder_path}; "
          f"{OUTPUT_FILE} was not written")
