In [1]:
# Importing necessary packages
import numpy as np 
import pandas as pd
import os
import warnings

# Silence every Python warning for the rest of the session. Note that this is
# global: it also hides warnings raised by pandas/numpy in later cells.
warnings.filterwarnings('ignore')

In [5]:

# Preprocess the raw CSV files of every category: keep only the rows whose
# 'Series' column equals 'EQ' (when that column exists), drop every row that
# contains a missing value, and write the result under the same file name in
# the matching destination folder.

# Source and destination root folders. These are relative paths, so they are
# resolved against the current working directory at run time.
source_root = '../data'
destination_root = '../Preprocessed_Data'

# The three category sub-folders expected under the source root
categories = ['Large_Cap', 'Mid_Cap', 'Small_Cap']

for category in categories:
    source_path = os.path.join(source_root, category)
    destination_path = os.path.join(destination_root, category)

    # Skip the category when its source folder is missing (or is not a
    # directory at all, which would make os.listdir() fail below).
    if not os.path.isdir(source_path):
        print(f"Source folder not found: {source_path}")
        continue

    # Create destination directory if it doesn't exist
    os.makedirs(destination_path, exist_ok=True)

    # os.listdir() returns entries in arbitrary order; sort them so the files
    # are processed (and logged) in the same order on every run and platform.
    for file_name in sorted(os.listdir(source_path)):
        full_file_path = os.path.join(source_path, file_name)

        # Only regular files ending in '.csv' are inputs; the isfile() check
        # keeps a sub-directory named like '*.csv' from crashing read_csv.
        if not (file_name.endswith('.csv') and os.path.isfile(full_file_path)):
            continue

        # Read the CSV file
        df = pd.read_csv(full_file_path)

        # Keep only the rows where the Series column is 'EQ'; files without
        # that column are passed through unfiltered.
        if 'Series' in df.columns:
            df = df[df['Series'] == 'EQ']

        # Drop rows with any missing value. Rebind instead of using
        # inplace=True: mutating a filtered frame in place can trigger pandas'
        # SettingWithCopyWarning, which the global warnings filter would hide.
        df = df.dropna()

        # Save the preprocessed file under the same name, without the index
        output_file_path = os.path.join(destination_path, file_name)
        df.to_csv(output_file_path, index=False)

        print(f"Processed and saved: {output_file_path}")


Processed and saved: ../Preprocessed_Data\Large_Cap\ADANIPORTS.csv
Processed and saved: ../Preprocessed_Data\Large_Cap\ASIANPAINT.csv
Processed and saved: ../Preprocessed_Data\Large_Cap\AXISBANK.csv
Processed and saved: ../Preprocessed_Data\Large_Cap\BAJFINANCE.csv
Processed and saved: ../Preprocessed_Data\Large_Cap\BPCL.csv
Processed and saved: ../Preprocessed_Data\Large_Cap\CIPLA.csv
Processed and saved: ../Preprocessed_Data\Large_Cap\DRREDDY.csv
Processed and saved: ../Preprocessed_Data\Large_Cap\EICHERMOT.csv
Processed and saved: ../Preprocessed_Data\Large_Cap\GAIL.csv
Processed and saved: ../Preprocessed_Data\Large_Cap\HDFC.csv
Processed and saved: ../Preprocessed_Data\Large_Cap\HDFCBANK.csv
Processed and saved: ../Preprocessed_Data\Large_Cap\HEROMOTOCO.csv
Processed and saved: ../Preprocessed_Data\Large_Cap\HINDALCO.csv
Processed and saved: ../Preprocessed_Data\Large_Cap\HINDUNILVR.csv
Processed and saved: ../Preprocessed_Data\Large_Cap\INFRATEL.csv
Processed and saved: ../Prepro