In [2]:
import pandas as pd
import os
import glob

# =========================
# FOLDER PATH
# =========================
input_folder = "fundamental_data"      # folder containing raw CSVs
output_folder = "clean_fundamental_data"

# Create output folder if not exists
os.makedirs(output_folder, exist_ok=True)

# =========================
# INDICATORS TO KEEP
# =========================
relevant_indicators = [
    "Net Sales/Income from operations",
    "Total Income From Operations",
    "Net Profit/(Loss) For the Period",
    "P/L Before Tax",
    "Interest",
    "Depreciation",
    "Basic EPS",
    "Equity Share Capital",
]


# =========================
# HELPERS
# =========================
def clean_fundamentals(df, indicators):
    """Return the rows of *df* named in *indicators*, transposed.

    Column names are stripped of surrounding whitespace first. The rows whose
    "Indicators" value is in *indicators* are kept, then the table is
    transposed so that each original column label becomes one row (stored in
    a "Quarter" column) and each kept indicator becomes one column.

    Args:
        df: Raw table with an "Indicators" column and one column per period.
        indicators: Indicator labels to keep (exact match).

    Returns:
        A new DataFrame; *df* itself is not modified.

    Raises:
        KeyError: If *df* has no "Indicators" column after stripping.
    """
    # rename() returns a new frame, so the caller's DataFrame is left intact.
    table = df.rename(
        columns=lambda name: name.strip() if isinstance(name, str) else name
    )

    if "Indicators" not in table.columns:
        raise KeyError("missing required column 'Indicators'")

    selected = table.loc[table["Indicators"].isin(indicators)]

    # Non-mutating chain: avoids in-place edits on a filtered slice.
    return (
        selected.set_index("Indicators")
        .T
        .rename_axis("Quarter")
        .reset_index()
    )


def build_output_path(input_file, output_folder):
    """Return the path in *output_folder* for the cleaned copy of *input_file*.

    "_clean" is inserted before the final extension only, so a name that
    contains ".csv" more than once, or ends in ".CSV", is still handled.
    """
    stem, ext = os.path.splitext(os.path.basename(input_file))
    return os.path.join(output_folder, stem + "_clean" + ext)


# =========================
# PROCESS ALL CSV FILES
# =========================
# Sorted so the processing order does not depend on the file system.
files = sorted(glob.glob(os.path.join(input_folder, "*.csv")))
skipped = []

for input_file in files:

    print("Processing:", input_file)

    try:
        df = pd.read_csv(input_file)
        clean_df = clean_fundamentals(df, relevant_indicators)
    except (KeyError, pd.errors.EmptyDataError) as err:
        # One unusable file should not abort the rest of the batch.
        print("Skipped:", input_file, "-", err.args[0] if err.args else err)
        skipped.append(input_file)
        continue

    # =========================
    # OUTPUT FILE NAME
    # =========================
    output_file = build_output_path(input_file, output_folder)

    clean_df.to_csv(output_file, index=False)

    print("✅ Saved:", output_file)

# Only claim success when something was processed and nothing was skipped.
if not files:
    print("\nNo CSV files found in:", input_folder)
elif skipped:
    print("\nFinished with", len(skipped), "file(s) skipped:", ", ".join(skipped))
else:
    print("\n🎉 All files processed successfully!")


Processing: fundamental_data\reliance_fundamentals.csv
✅ Saved: clean_fundamental_data\reliance_fundamentals_clean.csv

🎉 All files processed successfully!
