# Feature Engineering for Epileptic Seizure Recognition Dataset

# In [None]:

import pandas as pd

def load_and_preprocess(file_path):
    """Load the dataset, z-score its features and drop IQR-outlier rows.

    Processing steps, in order:

    1. Read ``file_path`` with ``pandas.read_csv``.
    2. Discard every column whose name starts with ``"Unnamed"``. These are
       the ID-like columns pandas produces for a blank header cell
       (``"Unnamed: 0"``) as well as a column literally named ``"Unnamed"``.
    3. Split off the target column ``y``; all remaining columns are features.
    4. Standardize each feature column to ``(x - mean) / std`` using the
       sample standard deviation. Columns with zero (or undefined) spread
       are divided by 1 instead, so they become all zeros rather than NaN.
    5. Remove every row in which at least one standardized feature lies
       outside ``[Q1 - 1.5 * IQR, Q3 + 1.5 * IQR]`` for its column.

    Note that the mean and standard deviation are computed *before* the
    outlier rows are removed, so the returned features are not exactly
    zero-mean / unit-variance.

    Args:
        file_path: Path of the CSV file (anything ``pandas.read_csv``
            accepts).

    Returns:
        A ``(X_filtered, y_filtered)`` tuple: the standardized feature
        ``DataFrame`` restricted to non-outlier rows, and the ``y`` values
        for the same rows (same index labels as ``X_filtered``).

    Raises:
        KeyError: If the CSV has no ``y`` column.
    """
    df = pd.read_csv(file_path)

    # Match by prefix rather than the exact name 'Unnamed': a blank header
    # cell is read back as "Unnamed: 0", and leaving that string-valued ID
    # column in the features would break the arithmetic below.
    id_like_columns = [
        col for col in df.columns if str(col).startswith("Unnamed")
    ]
    df = df.drop(columns=id_like_columns)

    # Separate features and target
    X = df.drop(columns=["y"])
    y = df["y"]

    # Standardize numerical features manually. A constant column has
    # std == 0 and a single-row frame has std == NaN; dividing by either
    # would fill the column with NaN/inf, so fall back to a divisor of 1.
    std = X.std()
    safe_std = std.where(std > 0, 1.0)
    X_scaled = (X - X.mean()) / safe_std

    # Remove outliers using the IQR method (per-column fences)
    q1 = X_scaled.quantile(0.25)
    q3 = X_scaled.quantile(0.75)
    iqr = q3 - q1
    lower_fence = q1 - 1.5 * iqr
    upper_fence = q3 + 1.5 * iqr
    is_outlier = (X_scaled < lower_fence) | (X_scaled > upper_fence)

    # A row is dropped as soon as any single feature is flagged.
    X_filtered = X_scaled[~is_outlier.any(axis=1)]
    y_filtered = y.loc[X_filtered.index]

    return X_filtered, y_filtered

# Location of the raw dataset CSV
file_path = "Epileptic_Seizure_Recognition.csv"

# Run the preprocessing pipeline on the raw file
X_processed, y_processed = load_and_preprocess(file_path)

# Write features and target to separate CSV files, omitting the index column
for _frame, _destination in (
    (X_processed, "processed_features.csv"),
    (y_processed, "processed_target.csv"),
):
    _frame.to_csv(_destination, index=False)

print("Feature engineering complete. Processed data saved.")
