In [None]:
import os
import pandas as pd

# Summarise prediction files: for each numbered CSV ("001.csv" .. "100.csv")
# in `directory`, compute the percentage of rows whose 'prediction' value is
# 'positive', print it, and save one row per processed file to
# 'summary_results.csv' in the same directory.

# Directory where the CSV files are stored
directory = '/content'

# Column layout of the summary. Passed explicitly to the DataFrame below so
# the output file keeps its header row even when no input produced a result.
summary_columns = ['filename', 'positive_percentage']

# Prepare a list to collect results (one dict per processed file)
results_summary = []

# Iterate over counters "001" to "100"
for counter in range(1, 101):
    counter_str = f"{counter:03}"  # Format counter with leading zeros

    filename = f"{counter_str}.csv"
    file_path = os.path.join(directory, filename)

    if not os.path.exists(file_path):
        print(f"File {filename} does not exist.")
        continue

    # Read the CSV file
    try:
        df = pd.read_csv(file_path)
    except pd.errors.EmptyDataError:
        # A file with no parseable columns (e.g. zero bytes) is skipped like
        # any other unusable input instead of aborting the whole batch.
        print(f"File {filename} is empty, skipping file.")
        continue

    # Check if 'prediction' column exists
    if 'prediction' not in df.columns:
        print(f"'prediction' column not found in {filename}, skipping file.")
        continue

    predictions = df['prediction']

    # Count the rows labelled 'positive'. The denominator is every row of the
    # column, so rows with a missing prediction count towards the total.
    positive_count = predictions.value_counts().get('positive', 0)
    total_count = len(predictions)
    positive_percentage = (positive_count / total_count) * 100 if total_count > 0 else 0

    # Append the results to the summary list
    results_summary.append({'filename': filename, 'positive_percentage': positive_percentage})

    print(f"File: {filename}, Positive Percentage: {positive_percentage:.2f}%")

# Create a DataFrame from the summary results
summary_df = pd.DataFrame(results_summary, columns=summary_columns)

# Save the summary DataFrame to a new CSV file
summary_df.to_csv(os.path.join(directory, 'summary_results.csv'), index=False)

print("Summary results saved to 'summary_results.csv'")