# Eikon DS Loans: Filtering Excel Data Based on Sector
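This script reads the Excel files in a specified directory, splits the rows of each file into financial and non-financial firms based on the “TRBC Economic Sector Name” field, and writes each subset to a new Excel file next to the original (with `_financials` or `_non_financials` appended to the file name).
The script only processes files whose names start with `_eikon DS loans` and end with `.xlsx`, and it expects each file to contain a “TRBC Economic Sector Name” column.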

In [4]:
import pandas as pd
import os

# Directory where your Excel files are located
directory = 'C:/Users/GODLEWSKI/OneDrive - unistra.fr/DATA/THOMSON REUTERS/NEW 2022 + 2024/Loans/eikon DS loans/excel files'

# Column holding the sector label used to split the rows
sector_column = 'TRBC Economic Sector Name'

# Suffixes of the files this script itself writes. They also match the input
# naming pattern, so they must be skipped explicitly; otherwise re-running the
# script would split its own outputs again ("..._financials_financials.xlsx").
generated_suffixes = ('_financials.xlsx', '_non_financials.xlsx')

# Loop over the files in the directory
for filename in os.listdir(directory):
    # Only source workbooks following the expected naming convention
    if not (filename.startswith("_eikon DS loans") and filename.endswith(".xlsx")):
        continue
    if filename.endswith(generated_suffixes):
        continue

    # Construct the full file path
    file_path = os.path.join(directory, filename)
    print(f"Processing file: {file_path}")

    # Read the Excel file
    df = pd.read_excel(file_path)

    # Detect missing sectors BEFORE casting to str: astype(str) turns NaN into
    # the literal string 'nan', after which notna() can no longer find them.
    sector = df[sector_column]
    sector_text = sector.astype(str)
    has_sector = sector.notna() & (sector_text.str.strip() != '')
    was_collected = ~sector_text.str.startswith('Unable to collect data')

    # Keep only rows with a usable sector; copy so the assignment below does
    # not operate on a view of the original frame.
    df = df[has_sector & was_collected].copy()

    # Ensure 'TRBC Economic Sector Name' is of type string in the output
    df[sector_column] = df[sector_column].astype(str)

    # Split the data into financial and non-financial firms
    is_financial = df[sector_column] == 'Financials'
    financials_df = df[is_financial]
    non_financials_df = df[~is_financial]

    # Write the filtered data to new Excel files next to the source file.
    # splitext strips the extension without assuming its length.
    base_path, _ = os.path.splitext(file_path)
    financials_df.to_excel(f"{base_path}_financials.xlsx", index=False)
    non_financials_df.to_excel(f"{base_path}_non_financials.xlsx", index=False)

    # Print out some information about each file as it's processed
    print(f"Number of financial firms: {len(financials_df)}")
    print(f"Number of non-financial firms: {len(non_financials_df)}")


Processing file: C:/Users/GODLEWSKI/OneDrive - unistra.fr/DATA/THOMSON REUTERS/NEW 2022 + 2024/Loans/eikon DS loans/excel files\_eikon DS loans 2020 identification info.xlsx
Number of financial firms: 1097
Number of non-financial firms: 7195
Processing file: C:/Users/GODLEWSKI/OneDrive - unistra.fr/DATA/THOMSON REUTERS/NEW 2022 + 2024/Loans/eikon DS loans/excel files\_eikon DS loans 2021 identification info.xlsx
Number of financial firms: 1649
Number of non-financial firms: 8581
Processing file: C:/Users/GODLEWSKI/OneDrive - unistra.fr/DATA/THOMSON REUTERS/NEW 2022 + 2024/Loans/eikon DS loans/excel files\_eikon DS loans 2022 identification info.xlsx
Number of financial firms: 1709
Number of non-financial firms: 8839
Processing file: C:/Users/GODLEWSKI/OneDrive - unistra.fr/DATA/THOMSON REUTERS/NEW 2022 + 2024/Loans/eikon DS loans/excel files\_eikon DS loans 2023 identification info.xlsx
Number of financial firms: 1498
Number of non-financial firms: 7509
Processing file: C:/Users/GODLEW