In [1]:
# Ridge Regression Example
from sklearn.linear_model import Ridge
from sklearn.model_selection import train_test_split
from sklearn.metrics import mean_squared_error, r2_score
from sklearn.datasets import load_diabetes
import pandas as pd

# Load scikit-learn's diabetes dataset, then separate the named feature
# table (X) from the target vector (y).
data = load_diabetes()
X, y = pd.DataFrame(data=data.data, columns=data.feature_names), data.target

# Hold out 20% of the rows for evaluation; the fixed seed keeps the
# partition identical from run to run.
X_train, X_test, y_train, y_test = train_test_split(
    X,
    y,
    test_size=0.2,
    random_state=42,
)

# Construct and fit the Ridge model in one expression
# (fit() hands back the fitted estimator itself).
ridge = Ridge(alpha=1.0).fit(X_train, y_train)

# Predict targets for the held-out rows.
y_pred = ridge.predict(X_test)

# Report goodness of fit, error, and the learned per-feature weights.
for label, value in (
    ("R^2 Score:", r2_score(y_test, y_pred)),
    ("MSE:", mean_squared_error(y_test, y_pred)),
    ("Coefficients:", ridge.coef_),
):
    print(label, value)

R^2 Score: 0.41915292635986545
MSE: 3077.41593882723
Coefficients: [  45.36737726  -76.66608563  291.33883165  198.99581745   -0.53030959
  -28.57704987 -144.51190505  119.26006559  230.22160832  112.14983004]


In [2]:
# Ridge Regression Example with California Housing (used in place of Boston Housing)
from sklearn.linear_model import Ridge
from sklearn.model_selection import train_test_split
from sklearn.metrics import mean_squared_error, r2_score
from sklearn.datasets import fetch_california_housing  # alternative to Boston
import pandas as pd

# Load the California housing data and wrap the feature matrix in a
# DataFrame so that every column carries its feature name.
data = fetch_california_housing()
feature_columns = data.feature_names
X = pd.DataFrame(data.data, columns=feature_columns)
y = data.target

# 80/20 train/test partition with a fixed seed for repeatability.
split_options = {"test_size": 0.2, "random_state": 42}
X_train, X_test, y_train, y_test = train_test_split(X, y, **split_options)

# Build the Ridge estimator, then fit it on the training portion only.
ridge = Ridge(alpha=1.0)
ridge.fit(X_train, y_train)

# Predict targets for the held-out rows.
y_pred = ridge.predict(X_test)

# Compute the metrics first, then report them together with the weights.
r2 = r2_score(y_test, y_pred)
mse = mean_squared_error(y_test, y_pred)
print("R^2 Score:", r2)
print("MSE:", mse)
print("Coefficients:", ridge.coef_)


R^2 Score: 0.5758549611440126
MSE: 0.5558034669932211
Coefficients: [ 4.48510924e-01  9.72596535e-03 -1.23014157e-01  7.81416761e-01
 -2.02581346e-06 -3.52585878e-03 -4.19786908e-01 -4.33680793e-01]


In [4]:
# Ridge Regression on a selectable sklearn regression dataset (choices are the keys of `regression_datasets`)
from sklearn.linear_model import Ridge
from sklearn.model_selection import train_test_split
from sklearn.metrics import mean_squared_error, r2_score
from sklearn import datasets
import pandas as pd

# ===== Registry: dataset name -> sklearn loader callable =====
# Add an entry here to make another dataset selectable; the loader's return
# value must expose `.data`, `.feature_names` and `.target`, which is what
# the pipeline below reads.
regression_datasets = {
    "diabetes": datasets.load_diabetes,
    "california_housing": datasets.fetch_california_housing,
}

# ===== Settings (edit here rather than inside the pipeline) =====
print("Available datasets:", list(regression_datasets.keys()))
dataset_choice = "california_housing"  # must be a key of regression_datasets
ALPHA = 1.0        # regularisation strength passed to Ridge
TEST_SIZE = 0.2    # fraction of rows held out for evaluation
RANDOM_STATE = 42  # seed so the train/test split is repeatable

# Fail early, and say which name was rejected and what the valid names are,
# so a typo in `dataset_choice` is obvious from the traceback alone.
if dataset_choice not in regression_datasets:
    raise ValueError(
        f"Dataset {dataset_choice!r} not available; "
        f"choose one of {list(regression_datasets)}"
    )

# ===== Load the selected dataset =====
data_func = regression_datasets[dataset_choice]
data = data_func()

# Wrap the features in a DataFrame so each column carries its feature name.
X = pd.DataFrame(data.data, columns=data.feature_names)
y = data.target

# ===== Split =====
X_train, X_test, y_train, y_test = train_test_split(
    X, y, test_size=TEST_SIZE, random_state=RANDOM_STATE
)

# ===== Train =====
ridge = Ridge(alpha=ALPHA)
ridge.fit(X_train, y_train)

# ===== Predict on the held-out rows =====
y_pred = ridge.predict(X_test)

# ===== Evaluate =====
print(f"\nDataset: {dataset_choice}")
print("R^2 Score:", r2_score(y_test, y_pred))
print("MSE:", mean_squared_error(y_test, y_pred))
print("Coefficients:", ridge.coef_)

Available datasets: ['diabetes', 'california_housing']

Dataset: california_housing
R^2 Score: 0.5758549611440126
MSE: 0.5558034669932211
Coefficients: [ 4.48510924e-01  9.72596535e-03 -1.23014157e-01  7.81416761e-01
 -2.02581346e-06 -3.52585878e-03 -4.19786908e-01 -4.33680793e-01]
