# In [None]:

# Generalized Code for Surrogate Models

# 1. Importing Libraries
import numpy as np
import pandas as pd
from sklearn.ensemble import RandomForestClassifier, RandomForestRegressor
from sklearn.tree import DecisionTreeClassifier, plot_tree
from sklearn.model_selection import train_test_split

# 2. Loading Dataset Function
def load_dataset(file_path):
    """Read the CSV at ``file_path`` and return its contents as a DataFrame.

    ``file_path`` is forwarded unchanged to ``pandas.read_csv``.
    """
    dataset = pd.read_csv(file_path)
    return dataset

# 3. Preprocessing Function
def preprocess_data(df, target_col, test_size=0.2, random_state=42):
    """Split a DataFrame into train/test features and target.

    Column names are lower-cased on a copy of ``df`` (the caller's frame is
    left untouched), the target column is separated from the features, and
    the rows are split with ``train_test_split``.

    Args:
        df: Input DataFrame containing the features and the target column.
        target_col: Name of the target column. Matched case-insensitively,
            because all column names are lower-cased before the lookup.
        test_size: Forwarded to ``train_test_split`` (default 0.2).
        random_state: Forwarded to ``train_test_split`` (default 42).

    Returns:
        Tuple ``(X_train, X_test, y_train, y_test)``.

    Raises:
        KeyError: If the lower-cased target column is not present in ``df``.
    """
    df = df.copy()
    df.columns = df.columns.str.lower()

    # The columns were just lower-cased, so the lookup key must be normalized
    # the same way; otherwise a name such as "Label" would never match.
    target_col = target_col.lower()
    if target_col not in df.columns:
        raise KeyError(
            f"Target column {target_col!r} not found; "
            f"available columns: {list(df.columns)}"
        )

    X = df.drop(columns=[target_col])
    y = df[target_col]
    X_train, X_test, y_train, y_test = train_test_split(
        X, y, test_size=test_size, random_state=random_state
    )

    return X_train, X_test, y_train, y_test

# 4. Model Training
def train_model(X_train, y_train, n_estimators=100, random_state=None):
    """Fit a ``RandomForestClassifier`` on the training data and return it.

    Args:
        X_train: Training features.
        y_train: Training target labels.
        n_estimators: Number of trees in the forest (default 100).
        random_state: Seed forwarded to the classifier. The default ``None``
            leaves the forest unseeded; pass an int to make the fitted model
            (and any surrogate derived from its predictions) reproducible.

    Returns:
        The fitted ``RandomForestClassifier``.
    """
    model = RandomForestClassifier(
        n_estimators=n_estimators, random_state=random_state
    )
    model.fit(X_train, y_train)
    return model

# 5. Surrogate Model Training and Visualization
def train_and_plot_surrogate(X_train, model_predictions, max_depth=4):
    """Fit a decision-tree surrogate on model predictions and plot it.

    The tree is trained to reproduce ``model_predictions`` from ``X_train``
    and is then drawn with ``plot_tree`` in a 20x10 figure.

    Args:
        X_train: DataFrame of features; its column names label the tree splits.
        model_predictions: Predictions of the model being explained, one per
            row of ``X_train``. These are the surrogate's training labels.
        max_depth: Maximum depth of the surrogate tree (default 4).
    """
    # Imported locally: the file's top-level imports do not provide ``plt``.
    import matplotlib.pyplot as plt

    surrogate = DecisionTreeClassifier(max_depth=max_depth)
    surrogate.fit(X_train, model_predictions)

    plt.figure(figsize=(20, 10))
    plot_tree(
        surrogate,
        filled=True,
        # Plain lists of strings: raw class labels may be ints or other
        # non-string values, and column names arrive as a pandas Index.
        feature_names=[str(column) for column in X_train.columns],
        class_names=[str(label) for label in surrogate.classes_],
        rounded=True,
    )
    plt.show()

# 6. Main Execution
if __name__ == "__main__":
    # End-to-end run: load data, fit the forest, then fit and plot a surrogate.
    # The CSV path and the target column name below are placeholders to replace.
    df = load_dataset('path_to_your_dataset.csv')
    # X_test / y_test are produced by the split but not used in this block.
    X_train, X_test, y_train, y_test = preprocess_data(df, target_col='your_target_column')
    model = train_model(X_train, y_train)
    # The surrogate is trained on the forest's predictions for the training
    # rows, not on the true labels in y_train.
    model_predictions = model.predict(X_train)
    train_and_plot_surrogate(X_train, model_predictions)
