In [1]:
import pandas as pd 

# Merge the csv files in the data directory
def merge_csv_files(file_list, output_file):
    """
    Merge multiple CSV files into a single CSV file ordered by time.

    Every input is read as latin-1 and the rows are concatenated. The
    'datetime' column is then parsed with ``pd.to_datetime`` and the rows
    are sorted by it before being written out (latin-1, no index column).

    Parameters:
    file_list (list): Paths of the CSV files to merge, in priority order
        for rows that share the same timestamp. The merged data must
        contain a 'datetime' column.
    output_file (str): Path to the output CSV file.

    Raises:
    ValueError: If file_list is empty.
    KeyError: If the merged data has no 'datetime' column.
    """
    # Materialize first so the emptiness check also works for generators.
    paths = list(file_list)
    if not paths:
        raise ValueError("file_list must contain at least one CSV file path")

    # Read and concatenate all CSV files
    frames = [pd.read_csv(path, encoding='latin-1') for path in paths]
    merged_df = pd.concat(frames, ignore_index=True)

    # Parse the 'datetime' column; values that cannot be parsed become NaT
    # (errors='coerce') and therefore end up at the bottom after sorting.
    merged_df['datetime'] = pd.to_datetime(merged_df['datetime'], errors='coerce')

    # Use a stable sort so rows sharing a timestamp keep the order of
    # file_list instead of being shuffled by the default quicksort.
    merged_df = merged_df.sort_values(by='datetime', kind='mergesort')

    # Write the merged DataFrame to a new CSV file
    merged_df.to_csv(output_file, index=False, encoding='latin-1')

if __name__ == "__main__":
    # Destination of the combined dataset
    output_csv = 'data/final_dataset.csv'

    # Input CSV files to combine
    csv_files = [
        'data/Interpolado_jacarepagua.csv',
        'data/Interpolado_Marambaia.csv',
        'data/Interpolado_VilaMilitar.csv',
    ]

    # Merge the inputs, then report how many files were written to the output
    merge_csv_files(csv_files, output_csv)
    print(f"Merged {len(csv_files)} files into {output_csv}")


Merged 3 files into data/final_dataset.csv
