In [1]:
!pip install git+https://github.com/thierrymoudiki/unifiedbooster.git --upgrade

Collecting git+https://github.com/thierrymoudiki/unifiedbooster.git
  Cloning https://github.com/thierrymoudiki/unifiedbooster.git to /tmp/pip-req-build-bfnp1r_b
  Running command git clone --filter=blob:none --quiet https://github.com/thierrymoudiki/unifiedbooster.git /tmp/pip-req-build-bfnp1r_b
  Resolved https://github.com/thierrymoudiki/unifiedbooster.git to commit e45d844a6745f244a88f5979c70924ed1afe3860
  Preparing metadata (setup.py) ... [?25l[?25hdone
Collecting catboost (from unifiedbooster==0.1.2)
  Downloading catboost-1.2.5-cp310-cp310-manylinux2014_x86_64.whl.metadata (1.2 kB)
Collecting nvidia-nccl-cu12 (from xgboost->unifiedbooster==0.1.2)
  Downloading nvidia_nccl_cu12-2.22.3-py3-none-manylinux2014_x86_64.whl.metadata (1.8 kB)
Downloading catboost-1.2.5-cp310-cp310-manylinux2014_x86_64.whl (98.2 MB)
[2K   [90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━[0m [32m98.2/98.2 MB[0m [31m5.7 MB/s[0m eta [36m0:00:00[0m
[?25hDownloading nvidia_nccl_cu12-2.22.3-py3-none-ma

In [2]:
import unifiedbooster as ub
from sklearn.datasets import load_iris, load_breast_cancer, load_wine
from sklearn.model_selection import train_test_split
from sklearn.metrics import accuracy_score

# Classification datasets used for the comparison.
datasets = [load_iris(), load_breast_cancer(), load_wine()]

# Gradient-boosting backends compared through the single GBDTClassifier wrapper.
model_types = ('xgboost', 'catboost', 'lightgbm')

for dataset in datasets:

  X, y = dataset.data, dataset.target
  # Hold out 20% of the rows for evaluation; the fixed random_state keeps the
  # split identical across runs and across backends.
  X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.2, random_state=42)

  for model_type in model_types:
    # Same wrapper class for every backend; only `model_type` changes.
    classifier = ub.GBDTClassifier(model_type=model_type)

    # Fit on the training split
    classifier.fit(X_train, y_train)

    # Predict on the held-out test split
    y_pred = classifier.predict(X_test)

    # Report the fraction of correctly classified test samples
    accuracy = accuracy_score(y_test, y_pred)
    print(f"Classification Accuracy {model_type}: {accuracy:.2f}")

Dask dataframe query planning is disabled because dask-expr is not installed.

You can install it with `pip install dask[dataframe]` or `conda install dask`.
This will raise in a future version.



Classification Accuracy xgboost: 1.00
Classification Accuracy catboost: 1.00
Classification Accuracy lightgbm: 1.00
Classification Accuracy xgboost: 0.96
Classification Accuracy catboost: 0.97
Classification Accuracy lightgbm: 0.96
Classification Accuracy xgboost: 0.97
Classification Accuracy catboost: 1.00
Classification Accuracy lightgbm: 1.00


In [3]:
import numpy as np

In [4]:
import unifiedbooster as ub
from sklearn.datasets import fetch_california_housing, load_diabetes
from sklearn.model_selection import train_test_split
from sklearn.metrics import mean_squared_error


# Regression datasets used for the comparison.
datasets = [fetch_california_housing(), load_diabetes()]

# Gradient-boosting backends compared through the single GBDTRegressor wrapper.
model_types = ('xgboost', 'catboost', 'lightgbm')

for dataset in datasets:

  # Load dataset
  X, y = dataset.data, dataset.target

  # Split dataset into training and testing sets (20% held out, fixed seed so
  # every backend is evaluated on the same rows)
  X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.2, random_state=42)

  for model_type in model_types:
    # Same wrapper class for every backend; only `model_type` changes.
    regressor = ub.GBDTRegressor(model_type=model_type)

    # Fit on the training split
    regressor.fit(X_train, y_train)

    # Predict on the held-out test split
    y_pred = regressor.predict(X_test)

    # Square root of the mean squared error, i.e. the RMSE that the message
    # below reports.
    rmse = np.sqrt(mean_squared_error(y_test, y_pred))
    print(f"Regression Root Mean Squared Error {model_type}: {rmse:.2f}")

Regression Root Mean Squared Error xgboost: 0.54
Regression Root Mean Squared Error catboost: 0.58
Regression Root Mean Squared Error lightgbm: 0.54
Regression Root Mean Squared Error xgboost: 54.40
Regression Root Mean Squared Error catboost: 51.72
Regression Root Mean Squared Error lightgbm: 53.19
