In [None]:
from sklearn.ensemble import AdaBoostRegressor
from sklearn.model_selection import GridSearchCV, KFold, train_test_split
from sklearn.preprocessing import StandardScaler
from sklearn.metrics import mean_squared_error, r2_score, mean_absolute_percentage_error
import pandas as pd
import numpy as np

# Load dataset
df = pd.read_excel('/content/T5.xlsx')

# Features and target
X = df.drop(columns=['putting marks'])
y = df['putting marks']

# Split the data
X_train_full, X_test, y_train_full, y_test = train_test_split(X, y, test_size=0.2, random_state=42)

# Normalize the data
scaler = StandardScaler()
X_train_full_scaled = scaler.fit_transform(X_train_full)
X_test_scaled = scaler.transform(X_test)

# Define parameter grid for GridSearchCV
param_grid = {
    'n_estimators': [50, 100, 200],
    'learning_rate': [0.01, 0.1, 0.5, 1.0]
}

# Initialize AdaBoost Regressor
model = AdaBoostRegressor(random_state=42)

# Set up K-Fold cross-validation
kf = KFold(n_splits=10, shuffle=True, random_state=42)

# Initialize GridSearchCV
grid_search = GridSearchCV(estimator=model, param_grid=param_grid, cv=kf, scoring='neg_mean_squared_error', n_jobs=-1)

# Fit the model with GridSearchCV
grid_search.fit(X_train_full_scaled, y_train_full)

# Get the best estimator
best_model = grid_search.best_estimator_
print(f"Best Parameters for AdaBoost: {grid_search.best_params_}\n")

# Predict on both training and test sets with the best model
y_train_pred = best_model.predict(X_train_full_scaled)
y_test_pred = best_model.predict(X_test_scaled)

# Calculate metrics for the training set
mse_train = mean_squared_error(y_train_full, y_train_pred)
rmse_train = np.sqrt(mse_train)
r2_train = r2_score(y_train_full, y_train_pred)
mape_train = mean_absolute_percentage_error(y_train_full, y_train_pred) * 100

# Print training set metrics
print("Training Set Metrics for AdaBoost:")
print(f"MSE: {mse_train}")
print(f"RMSE: {rmse_train}")
print(f"R2: {r2_train}")
print(f"MAPE: {mape_train}\n")

# Calculate metrics for the test set
mse_test = mean_squared_error(y_test, y_test_pred)
rmse_test = np.sqrt(mse_test)
r2_test = r2_score(y_test, y_test_pred)
mape_test = mean_absolute_percentage_error(y_test, y_test_pred) * 100

# Print test set metrics
print("Test Set Metrics for AdaBoost:")
print(f"MSE: {mse_test}")
print(f"RMSE: {rmse_test}")
print(f"R2: {r2_test}")
print(f"MAPE: {mape_test}\n")


Best Parameters for AdaBoost: {'learning_rate': 0.1, 'n_estimators': 200}

Training Set Metrics for AdaBoost:
MSE: 0.9835039412839814
RMSE: 0.9917176721648059
R2: 0.7316737861565025
MAPE: 1.1786059758027426e+17

Test Set Metrics for AdaBoost:
MSE: 1.7250156022941823
RMSE: 1.3133984933348226
R2: 0.47527096106443134
MAPE: 1.2628860331504637e+17



In [1]:
from sklearn.ensemble import AdaBoostRegressor
from sklearn.model_selection import GridSearchCV, KFold, train_test_split
from sklearn.preprocessing import StandardScaler
from sklearn.metrics import mean_squared_error, r2_score, mean_absolute_percentage_error
import pandas as pd
import numpy as np

# Load dataset
df = pd.read_excel('/content/drive/MyDrive/ML Files/Codebert (1).xlsx')

# Features and target
X = df.drop(columns=['putting marks'])
y = df['putting marks']

# Split the data
X_train_full, X_test, y_train_full, y_test = train_test_split(X, y, test_size=0.2, random_state=42)

# Normalize the data
scaler = StandardScaler()
X_train_full_scaled = scaler.fit_transform(X_train_full)
X_test_scaled = scaler.transform(X_test)

# Define parameter grid for GridSearchCV
param_grid = {
    'n_estimators': [50, 100, 200],
    'learning_rate': [0.01, 0.1, 0.5, 1.0]
}

# Initialize AdaBoost Regressor
model = AdaBoostRegressor(random_state=42)

# Set up K-Fold cross-validation
kf = KFold(n_splits=10, shuffle=True, random_state=42)

# Initialize GridSearchCV
grid_search = GridSearchCV(estimator=model, param_grid=param_grid, cv=kf, scoring='neg_mean_squared_error', n_jobs=-1)

# Fit the model with GridSearchCV
grid_search.fit(X_train_full_scaled, y_train_full)

# Get the best estimator
best_model = grid_search.best_estimator_
print(f"Best Parameters for AdaBoost: {grid_search.best_params_}\n")

# Predict on both training and test sets with the best model
y_train_pred = best_model.predict(X_train_full_scaled)
y_test_pred = best_model.predict(X_test_scaled)

# Calculate metrics for the training set
mse_train = mean_squared_error(y_train_full, y_train_pred)
rmse_train = np.sqrt(mse_train)
r2_train = r2_score(y_train_full, y_train_pred)
mape_train = mean_absolute_percentage_error(y_train_full, y_train_pred) * 100

# Print training set metrics
print("Training Set Metrics for AdaBoost:")
print(f"MSE: {mse_train}")
print(f"RMSE: {rmse_train}")
print(f"R2: {r2_train}")
print(f"MAPE: {mape_train}\n")

# Calculate metrics for the test set
mse_test = mean_squared_error(y_test, y_test_pred)
rmse_test = np.sqrt(mse_test)
r2_test = r2_score(y_test, y_test_pred)
mape_test = mean_absolute_percentage_error(y_test, y_test_pred) * 100

# Print test set metrics
print("Test Set Metrics for AdaBoost:")
print(f"MSE: {mse_test}")
print(f"RMSE: {rmse_test}")
print(f"R2: {r2_test}")
print(f"MAPE: {mape_test}\n")


Best Parameters for AdaBoost: {'learning_rate': 0.1, 'n_estimators': 200}

Training Set Metrics for AdaBoost:
MSE: 1.0208242912431644
RMSE: 1.010358496397771
R2: 0.7214917952325124
MAPE: 1.0851290065462243e+17

Test Set Metrics for AdaBoost:
MSE: 1.8653909543344314
RMSE: 1.3657931594258448
R2: 0.43257046405538435
MAPE: 1.4486210399988022e+17



In [2]:
from sklearn.ensemble import AdaBoostRegressor
from sklearn.model_selection import GridSearchCV, KFold, train_test_split
from sklearn.preprocessing import StandardScaler
from sklearn.metrics import mean_squared_error, r2_score, mean_absolute_percentage_error
import pandas as pd
import numpy as np

# Load dataset
df = pd.read_excel('/content/drive/MyDrive/ML Files/Mathbert (1).xlsx')

# Features and target
X = df.drop(columns=['putting marks'])
y = df['putting marks']

# Split the data
X_train_full, X_test, y_train_full, y_test = train_test_split(X, y, test_size=0.2, random_state=42)

# Normalize the data
scaler = StandardScaler()
X_train_full_scaled = scaler.fit_transform(X_train_full)
X_test_scaled = scaler.transform(X_test)

# Define parameter grid for GridSearchCV
param_grid = {
    'n_estimators': [50, 100, 200],
    'learning_rate': [0.01, 0.1, 0.5, 1.0]
}

# Initialize AdaBoost Regressor
model = AdaBoostRegressor(random_state=42)

# Set up K-Fold cross-validation
kf = KFold(n_splits=10, shuffle=True, random_state=42)

# Initialize GridSearchCV
grid_search = GridSearchCV(estimator=model, param_grid=param_grid, cv=kf, scoring='neg_mean_squared_error', n_jobs=-1)

# Fit the model with GridSearchCV
grid_search.fit(X_train_full_scaled, y_train_full)

# Get the best estimator
best_model = grid_search.best_estimator_
print(f"Best Parameters for AdaBoost: {grid_search.best_params_}\n")

# Predict on both training and test sets with the best model
y_train_pred = best_model.predict(X_train_full_scaled)
y_test_pred = best_model.predict(X_test_scaled)

# Calculate metrics for the training set
mse_train = mean_squared_error(y_train_full, y_train_pred)
rmse_train = np.sqrt(mse_train)
r2_train = r2_score(y_train_full, y_train_pred)
mape_train = mean_absolute_percentage_error(y_train_full, y_train_pred) * 100

# Print training set metrics
print("Training Set Metrics for AdaBoost:")
print(f"MSE: {mse_train}")
print(f"RMSE: {rmse_train}")
print(f"R2: {r2_train}")
print(f"MAPE: {mape_train}\n")

# Calculate metrics for the test set
mse_test = mean_squared_error(y_test, y_test_pred)
rmse_test = np.sqrt(mse_test)
r2_test = r2_score(y_test, y_test_pred)
mape_test = mean_absolute_percentage_error(y_test, y_test_pred) * 100

# Print test set metrics
print("Test Set Metrics for AdaBoost:")
print(f"MSE: {mse_test}")
print(f"RMSE: {rmse_test}")
print(f"R2: {r2_test}")
print(f"MAPE: {mape_test}\n")


Best Parameters for AdaBoost: {'learning_rate': 0.1, 'n_estimators': 200}

Training Set Metrics for AdaBoost:
MSE: 0.9635738424715184
RMSE: 0.981617971754551
R2: 0.7371112508492147
MAPE: 1.0472072635390595e+17

Test Set Metrics for AdaBoost:
MSE: 1.5673782284206237
RMSE: 1.251949770725896
R2: 0.5232223578999092
MAPE: 1.2402079050692106e+17

