In [2]:
!pip install pandas



In [3]:
import pandas as pd
import os

In [None]:
def merge_csv_files(input_folder, output_csv_path):
    """Merge every CSV file in a folder into a single CSV file.

    Files are read in sorted filename order so the row order of the merged
    output is reproducible. Files that are empty, contain only a header, or
    cannot be parsed are skipped with a message instead of aborting the merge.
    If ``output_csv_path`` points inside ``input_folder``, that file is never
    treated as an input, so re-running the merge does not duplicate rows.

    Args:
        input_folder (str): The path to the folder containing the CSV files.
        output_csv_path (str): The full path (including filename) for the
            merged CSV output.

    Returns:
        None. The merged CSV is written to ``output_csv_path``; nothing is
        written when no usable CSV file is found.
    """
    # Normalised form of the output path, used to recognise (and skip) a
    # previously written merge result sitting in the input folder.
    output_key = os.path.normcase(os.path.abspath(output_csv_path))

    dfs = []
    # os.listdir() returns entries in arbitrary order; sort for determinism.
    for file_name in sorted(os.listdir(input_folder)):
        if not file_name.endswith('.csv'):
            continue

        file_path = os.path.join(input_folder, file_name)
        # A directory named "*.csv" cannot be read as a CSV file.
        if not os.path.isfile(file_path):
            continue
        # Never feed an earlier merged output back into the merge.
        if os.path.normcase(os.path.abspath(file_path)) == output_key:
            continue

        try:
            df = pd.read_csv(file_path)
        except (pd.errors.EmptyDataError, pd.errors.ParserError):
            # EmptyDataError: zero-byte / no-column file.
            # ParserError: the file could not be tokenised as CSV.
            print(f"Skipped empty or malformed file: {file_name}")
            continue

        # A header-only file parses fine but contributes no rows.
        if df.empty:
            print(f"Skipped empty file: {file_name}")
            continue

        dfs.append(df)

    if not dfs:
        print("No valid CSV files found to merge.")
        return

    # Stack all frames and renumber rows; the index is not written out.
    merged_df = pd.concat(dfs, ignore_index=True)
    merged_df.to_csv(output_csv_path, index=False)
    print(f"Merged CSV saved at: {output_csv_path}")

# Example usage.
# Folder that holds the individual CSV files to combine.
input_folder = '/content/drive/MyDrive/GW Semesters/Sem 2/ML by Prof Shi Feng/ML Sem Project - Fake Review Detector/FakeReviewShield/Final Datasets'
# Destination file for the combined CSV (full path, including the filename).
output_csv_path = '/content/drive/MyDrive/GW Semesters/Sem 2/ML by Prof Shi Feng/ML Sem Project - Fake Review Detector/FakeReviewShield/Final Datasets/merged_output.csv'

# Combine everything found in input_folder and write it to output_csv_path.
merge_csv_files(
    input_folder=input_folder,
    output_csv_path=output_csv_path,
)
