# AutoML & Optimization

Let MKYZ find the best model for your data.

In [1]:
import mkyz
mkyz.init()

mkyz package initialized. Version: 0.2.0
mkyz package initialized. Version: 0.2.0


## 1. Load Diabetes Data

A standard classification dataset.

In [2]:
df = mkyz.load_data('data/diabetes.csv')
X = df.drop('outcome', axis=1)
y = df['outcome']

KeyError: "['outcome'] not found in axis"

## 2. Auto Train

Automatically train and compare multiple models.

In [None]:
# Run models and get leaderboard
results = mkyz.auto_train(X, y, task='classification', timeout=30)

print(f"Best Model: {results['best_model_name']}")
print(f"Score: {results['best_score']:.4f}")

## 3. Hyperparameter Optimization

Optimize a specific model using Grid Search or Bayesian Optimization.

In [None]:
from sklearn.ensemble import RandomForestClassifier

base_model = RandomForestClassifier()
param_grid = {
    'n_estimators': [50, 100, 200],
    'max_depth': [3, 5, 10]
}

# Note: 'method' can be 'grid', 'random', or 'bayesian'
opt_model, best_params = mkyz.optimize_model(
    base_model, 
    X, y, 
    param_grid=param_grid, 
    method='random', 
    n_trials=10
)

print("Best Params:", best_params)