# In [None]:  (Jupyter notebook cell marker left over from export)

# Generalized Code for LightGBM

# 1. Importing Libraries
import numpy as np
import pandas as pd
import lightgbm as lgb
from sklearn.model_selection import train_test_split
from sklearn.metrics import mean_absolute_error, r2_score, mean_squared_error

# 2. Loading Dataset Function
def load_dataset(file_path):
    """Read a CSV source into a pandas DataFrame.

    Args:
        file_path: Anything accepted by ``pandas.read_csv`` as its first
            argument (it is passed through unchanged).

    Returns:
        The ``pandas.DataFrame`` produced by ``pandas.read_csv`` with its
        default options.
    """
    dataset = pd.read_csv(file_path)
    return dataset

# 3. Preprocessing Function
def preprocess_data(df, target_col, drop_columns=None):
    """Drop unwanted columns, lower-case column names and split train/test.

    The columns named in ``drop_columns`` are removed first (names that are
    not present are ignored), the remaining column names are lower-cased,
    and the data is split 80/20 with ``random_state=42``.

    Args:
        df: Input ``pandas.DataFrame``. The caller's object is left untouched
            because ``DataFrame.drop`` returns a new frame.
        target_col: Name of the target column. A string name is matched
            case-insensitively, since the column names are lower-cased
            before the lookup.
        drop_columns: Optional column name(s) to drop, matched against the
            original (pre-lower-casing) names. ``None`` means drop nothing.

    Returns:
        Tuple ``(X_train, X_test, y_train, y_test)`` as returned by
        ``train_test_split``.

    Raises:
        KeyError: If the target column is absent after preprocessing.
    """
    # A ``None`` default avoids sharing one mutable list between calls.
    to_drop = [] if drop_columns is None else drop_columns

    df = df.drop(columns=to_drop, errors='ignore')
    df.columns = df.columns.str.lower()

    # The columns were just lower-cased, so the target name must be lower-cased
    # too; otherwise a name such as "Price" could never be found.
    target_key = target_col.lower() if isinstance(target_col, str) else target_col
    if isinstance(target_key, str) and target_key not in df.columns:
        raise KeyError(
            f"target column {target_col!r} not found; "
            f"available columns: {list(df.columns)}"
        )

    X = df.drop(columns=target_key, errors='ignore')
    y = df[target_key]
    X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.2, random_state=42)

    return X_train, X_test, y_train, y_test

# 4. Model Training and Prediction Function
def train_and_predict(X_train, y_train, X_test=None):
    """Fit a LightGBM regressor and predict on the train and test features.

    Args:
        X_train: Training features passed to ``LGBMRegressor.fit``.
        y_train: Training target passed to ``LGBMRegressor.fit``.
        X_test: Features to produce test predictions for. When omitted, a
            module-level ``X_test`` is used if one exists, which keeps
            existing two-argument callers working.

    Returns:
        Tuple ``(model, y_train_pred, y_test_pred)``: the fitted model and
        its predictions on ``X_train`` and ``X_test``.

    Raises:
        ValueError: If no test features are passed and no module-level
            ``X_test`` is defined.
    """
    if X_test is None:
        # Earlier versions read ``X_test`` implicitly from module scope;
        # fall back to it so legacy call sites keep behaving the same.
        X_test = globals().get("X_test")
    if X_test is None:
        # Fail before the training work instead of after it.
        raise ValueError(
            "X_test was not provided and no module-level X_test is defined"
        )

    model = lgb.LGBMRegressor(n_estimators=100, learning_rate=0.1, max_depth=3)
    model.fit(X_train, y_train)
    y_train_pred = model.predict(X_train)
    y_test_pred = model.predict(X_test)
    return model, y_train_pred, y_test_pred

# 5. Evaluation Function
def evaluate_model(true, predicted):
    """Compute regression metrics for a set of predictions.

    Args:
        true: Ground-truth target values.
        predicted: Predicted target values.

    Returns:
        Tuple ``(mae, mse, rmse, r2)`` where ``rmse`` is the square root of
        ``mse``.
    """
    abs_error = mean_absolute_error(true, predicted)
    squared_error = mean_squared_error(true, predicted)
    return abs_error, squared_error, np.sqrt(squared_error), r2_score(true, predicted)

# 6. Main Execution
if __name__ == "__main__":
    # Load the raw data and split it into train/test features and targets.
    # These names stay at module level on purpose: train_and_predict is
    # called without the test features and looks X_test up from module scope.
    df = load_dataset('path_to_your_dataset.csv')
    X_train, X_test, y_train, y_test = preprocess_data(
        df,
        target_col='your_target_column',
        drop_columns=['columns_to_drop'],
    )

    # Fit the model and collect predictions for both splits.
    model, y_train_pred, y_test_pred = train_and_predict(X_train, y_train)

    # Score the train split and report it.
    train_mae, train_mse, train_rmse, train_r2 = evaluate_model(y_train, y_train_pred)
    print(f'Train set evaluation:\nMAE={train_mae}, MSE={train_mse}, RMSE={train_rmse}, R2={train_r2}')

    # Score the test split and report it.
    test_mae, test_mse, test_rmse, test_r2 = evaluate_model(y_test, y_test_pred)
    print(f'Test set evaluation:\nMAE={test_mae}, MSE={test_mse}, RMSE={test_rmse}, R2={test_r2}')
