In [1]:
from google.colab import drive

In [2]:
drive.mount('/content/drive')

Mounted at /content/drive


In [6]:
import os
import pandas as pd

def extract_outcome(df):
    # Find rows containing "severity" in the "Entity Group" column (case-insensitive and ignoring leading/trailing spaces)
    mask = df["Entity Group"].str.strip().str.lower() == "outcome"

    if mask.any():
        # Get the corresponding "Value" for "severity"
        outcome_values = df.loc[mask, "Value"].values.tolist()
        return outcome_values
    else:
        return []

# Initialize a list to store results
results = []

# Define the path to the input CSV files folder
input_folder_path = '/content/drive/MyDrive/MACROBATT/INPUT_PDF_FILES/'

# Get a list of all files in the folder
input_files = os.listdir(input_folder_path)

# Iterate over each file in the folder
for file_name in input_files:
    # Check if the file is a CSV file
    if file_name.endswith('.csv'):
        # Print the file name
        print("Processing file:", file_name)

        # Construct the full file path
        input_file_path = os.path.join(input_folder_path, file_name)

        # Read the input file using pandas
        df = pd.read_csv(input_file_path)

        # Check if "severity" is present and extract its values (could be multiple)
        outcome_values = extract_outcome(df)

        # Append the file name and severity values to the results list
        results.append((file_name, outcome_values))

# Create a DataFrame from the results list
results_df = pd.DataFrame(results, columns=['File Name', 'outcome'])

# Define the path for the output CSV file
output_csv_path = '/content/drive/MyDrive/MACROBATT/outcome_Results_new.csv'

# Write the results DataFrame to the output CSV file
results_df.to_csv(output_csv_path, index=False)

# Display the results DataFrame
print("Results:")
print(results_df)


Processing file: 25246819_df.csv
Processing file: 25210224_df.csv
Processing file: 25155594_df.csv
Processing file: 24957905_df.csv
Processing file: 24781756_df.csv
Processing file: 24654246_df.csv
Processing file: 24898994_df.csv
Processing file: 24294397_df.csv
Processing file: 24518095_df.csv
Processing file: 25139918_df.csv
Processing file: 24161539_df.csv
Processing file: 24043987_df.csv
Processing file: 25023062_df.csv
Processing file: 25024632_df.csv
Processing file: 23242090_df.csv
Processing file: 24526194_df.csv
Processing file: 23897372_df.csv
Processing file: 23312850_df.csv
Processing file: 23076693_df.csv
Processing file: 23124805_df.csv
Processing file: 23155491_df.csv
Processing file: 23077697_df.csv
Processing file: 23864579_df.csv
Processing file: 23678274_df.csv
Processing file: 22514576_df.csv
Processing file: 21923918_df.csv
Processing file: 22520024_df.csv
Processing file: 22218279_df.csv
Processing file: 23468586_df.csv
Processing file: 23033875_df.csv
Processing