In [3]:
import pandas as pd
import numpy as np
import xgboost as xgb
from sklearn.model_selection import RandomizedSearchCV, StratifiedKFold
from sklearn.metrics import classification_report

# Load transformed data
X_train = pd.read_csv('data/training_data_transformed.csv')
y_train = pd.read_csv('data/y_train_transformed.csv').values.ravel()
X_test = pd.read_csv('data/test_data_transformed.csv')

# Drop non-numeric columns
for col in X_train.columns:
    if X_train[col].dtype == 'object':
        print(f"Dropping column: {col}")
        X_train = X_train.drop(columns=[col])
        X_test = X_test.drop(columns=[col])

# Define parameter grid for random search
param_dist = {
    'n_estimators': [100, 200, 300],
    'max_depth': [3, 5, 7, 10],
    'learning_rate': [0.01, 0.05, 0.1, 0.2],
    'subsample': [0.7, 0.8, 1.0],
    'colsample_bytree': [0.7, 0.8, 1.0],
    'gamma': [0, 0.1, 0.2, 0.5]
}

# Set up cross-validation
cv = StratifiedKFold(n_splits=5, shuffle=True, random_state=42)

# Randomized search
xgb_clf = xgb.XGBClassifier(use_label_encoder=False, eval_metric='mlogloss', random_state=42)
random_search = RandomizedSearchCV(
    xgb_clf,
    param_distributions=param_dist,
    n_iter=20,
    scoring='accuracy',
    cv=cv,
    verbose=2,
    n_jobs=-1
)
random_search.fit(X_train, y_train)

print("Best parameters found:", random_search.best_params_)
print("Best cross-validation score:", random_search.best_score_)

# Train best model on all data
best_model = random_search.best_estimator_
best_model.fit(X_train, y_train)

# Predict on test data
y_pred = best_model.predict(X_test)

# Convert predictions back to original labels
from sklearn.preprocessing import OrdinalEncoder
target_order = ['None_Existent', 'Low', 'Medium', 'High', 'Very_High']
oe_target = OrdinalEncoder(categories=[target_order])
oe_target.fit(np.array(target_order).reshape(-1, 1))
y_pred_labels = oe_target.inverse_transform(y_pred.reshape(-1, 1))

# Save submission CSV with ID column
submission = pd.DataFrame({
    'RowId': np.arange(1, len(y_pred_labels) + 1),
    'AVERAGE_SPEED_DIFF': y_pred_labels.ravel()
})
submission['AVERAGE_SPEED_DIFF'] = submission['AVERAGE_SPEED_DIFF'].replace('None_Existent', 'None')
submission.to_csv('submission.csv', index=False)
print('✅ Submission file with ID saved as submission.csv')

Dropping column: record_date
Fitting 5 folds for each of 20 candidates, totalling 100 fits


Parameters: { "use_label_encoder" } are not used.

  bst.update(dtrain, iteration=i, fobj=obj)
Parameters: { "use_label_encoder" } are not used.

  bst.update(dtrain, iteration=i, fobj=obj)
Parameters: { "use_label_encoder" } are not used.

  bst.update(dtrain, iteration=i, fobj=obj)
Parameters: { "use_label_encoder" } are not used.

  bst.update(dtrain, iteration=i, fobj=obj)
Parameters: { "use_label_encoder" } are not used.

  bst.update(dtrain, iteration=i, fobj=obj)
Parameters: { "use_label_encoder" } are not used.

  bst.update(dtrain, iteration=i, fobj=obj)
Parameters: { "use_label_encoder" } are not used.

  bst.update(dtrain, iteration=i, fobj=obj)
Parameters: { "use_label_encoder" } are not used.

  bst.update(dtrain, iteration=i, fobj=obj)


[CV] END colsample_bytree=0.7, gamma=0.5, learning_rate=0.1, max_depth=10, n_estimators=200, subsample=0.7; total time=   2.5s


Parameters: { "use_label_encoder" } are not used.

  bst.update(dtrain, iteration=i, fobj=obj)


[CV] END colsample_bytree=0.7, gamma=0.5, learning_rate=0.1, max_depth=10, n_estimators=200, subsample=0.7; total time=   2.8s
[CV] END colsample_bytree=0.7, gamma=0.5, learning_rate=0.1, max_depth=10, n_estimators=200, subsample=0.7; total time=   2.8s


Parameters: { "use_label_encoder" } are not used.

  bst.update(dtrain, iteration=i, fobj=obj)
Parameters: { "use_label_encoder" } are not used.

  bst.update(dtrain, iteration=i, fobj=obj)


[CV] END colsample_bytree=0.7, gamma=0.5, learning_rate=0.1, max_depth=10, n_estimators=200, subsample=0.7; total time=   3.2s
[CV] END colsample_bytree=0.7, gamma=0.5, learning_rate=0.1, max_depth=10, n_estimators=200, subsample=0.7; total time=   3.3s


Parameters: { "use_label_encoder" } are not used.

  bst.update(dtrain, iteration=i, fobj=obj)
Parameters: { "use_label_encoder" } are not used.

  bst.update(dtrain, iteration=i, fobj=obj)


[CV] END colsample_bytree=1.0, gamma=0.5, learning_rate=0.01, max_depth=5, n_estimators=300, subsample=0.8; total time=   4.2s
[CV] END colsample_bytree=1.0, gamma=0.5, learning_rate=0.01, max_depth=5, n_estimators=300, subsample=0.8; total time=   4.3s


Parameters: { "use_label_encoder" } are not used.

  bst.update(dtrain, iteration=i, fobj=obj)
Parameters: { "use_label_encoder" } are not used.

  bst.update(dtrain, iteration=i, fobj=obj)


[CV] END colsample_bytree=0.7, gamma=0.1, learning_rate=0.1, max_depth=3, n_estimators=200, subsample=0.8; total time=   1.7s


Parameters: { "use_label_encoder" } are not used.

  bst.update(dtrain, iteration=i, fobj=obj)


[CV] END colsample_bytree=1.0, gamma=0.5, learning_rate=0.01, max_depth=5, n_estimators=300, subsample=0.8; total time=   4.8s


Parameters: { "use_label_encoder" } are not used.

  bst.update(dtrain, iteration=i, fobj=obj)


[CV] END colsample_bytree=0.7, gamma=0.1, learning_rate=0.1, max_depth=3, n_estimators=200, subsample=0.8; total time=   2.2s
[CV] END colsample_bytree=0.7, gamma=0.1, learning_rate=0.1, max_depth=3, n_estimators=200, subsample=0.8; total time=   2.2s


Parameters: { "use_label_encoder" } are not used.

  bst.update(dtrain, iteration=i, fobj=obj)
Parameters: { "use_label_encoder" } are not used.

  bst.update(dtrain, iteration=i, fobj=obj)


[CV] END colsample_bytree=0.7, gamma=0.1, learning_rate=0.1, max_depth=3, n_estimators=200, subsample=0.8; total time=   1.6s
[CV] END colsample_bytree=0.7, gamma=0.1, learning_rate=0.1, max_depth=3, n_estimators=200, subsample=0.8; total time=   1.7s


Parameters: { "use_label_encoder" } are not used.

  bst.update(dtrain, iteration=i, fobj=obj)
Parameters: { "use_label_encoder" } are not used.

  bst.update(dtrain, iteration=i, fobj=obj)


[CV] END colsample_bytree=1.0, gamma=0.5, learning_rate=0.01, max_depth=5, n_estimators=300, subsample=0.8; total time=   3.5s
[CV] END colsample_bytree=1.0, gamma=0, learning_rate=0.01, max_depth=3, n_estimators=200, subsample=0.8; total time=   1.6s


Parameters: { "use_label_encoder" } are not used.

  bst.update(dtrain, iteration=i, fobj=obj)
Parameters: { "use_label_encoder" } are not used.

  bst.update(dtrain, iteration=i, fobj=obj)


[CV] END colsample_bytree=1.0, gamma=0, learning_rate=0.01, max_depth=3, n_estimators=200, subsample=0.8; total time=   1.8s


Parameters: { "use_label_encoder" } are not used.

  bst.update(dtrain, iteration=i, fobj=obj)


[CV] END colsample_bytree=1.0, gamma=0.5, learning_rate=0.01, max_depth=5, n_estimators=300, subsample=0.8; total time=   4.3s


Parameters: { "use_label_encoder" } are not used.

  bst.update(dtrain, iteration=i, fobj=obj)


[CV] END colsample_bytree=1.0, gamma=0, learning_rate=0.01, max_depth=3, n_estimators=200, subsample=0.8; total time=   1.9s
[CV] END colsample_bytree=1.0, gamma=0, learning_rate=0.01, max_depth=3, n_estimators=200, subsample=0.8; total time=   2.0s
[CV] END colsample_bytree=1.0, gamma=0, learning_rate=0.01, max_depth=3, n_estimators=200, subsample=0.8; total time=   1.8s


Parameters: { "use_label_encoder" } are not used.

  bst.update(dtrain, iteration=i, fobj=obj)
Parameters: { "use_label_encoder" } are not used.

  bst.update(dtrain, iteration=i, fobj=obj)
Parameters: { "use_label_encoder" } are not used.

  bst.update(dtrain, iteration=i, fobj=obj)


[CV] END colsample_bytree=0.8, gamma=0.1, learning_rate=0.1, max_depth=5, n_estimators=300, subsample=0.8; total time=   3.4s
[CV] END colsample_bytree=0.8, gamma=0.1, learning_rate=0.1, max_depth=5, n_estimators=300, subsample=0.8; total time=   3.4s
[CV] END colsample_bytree=0.8, gamma=0, learning_rate=0.01, max_depth=7, n_estimators=100, subsample=0.8; total time=   2.1s


Parameters: { "use_label_encoder" } are not used.

  bst.update(dtrain, iteration=i, fobj=obj)
Parameters: { "use_label_encoder" } are not used.

  bst.update(dtrain, iteration=i, fobj=obj)
Parameters: { "use_label_encoder" } are not used.

  bst.update(dtrain, iteration=i, fobj=obj)


[CV] END colsample_bytree=0.8, gamma=0, learning_rate=0.01, max_depth=7, n_estimators=100, subsample=0.8; total time=   2.3s
[CV] END colsample_bytree=0.8, gamma=0.1, learning_rate=0.1, max_depth=5, n_estimators=300, subsample=0.8; total time=   3.3s
[CV] END colsample_bytree=0.8, gamma=0, learning_rate=0.01, max_depth=7, n_estimators=100, subsample=0.8; total time=   2.3s


Parameters: { "use_label_encoder" } are not used.

  bst.update(dtrain, iteration=i, fobj=obj)
Parameters: { "use_label_encoder" } are not used.

  bst.update(dtrain, iteration=i, fobj=obj)
Parameters: { "use_label_encoder" } are not used.

  bst.update(dtrain, iteration=i, fobj=obj)


[CV] END colsample_bytree=0.8, gamma=0.1, learning_rate=0.1, max_depth=5, n_estimators=300, subsample=0.8; total time=   4.6s
[CV] END colsample_bytree=0.8, gamma=0.1, learning_rate=0.1, max_depth=5, n_estimators=300, subsample=0.8; total time=   3.6s


Parameters: { "use_label_encoder" } are not used.

  bst.update(dtrain, iteration=i, fobj=obj)
Parameters: { "use_label_encoder" } are not used.

  bst.update(dtrain, iteration=i, fobj=obj)


[CV] END colsample_bytree=0.8, gamma=0, learning_rate=0.01, max_depth=7, n_estimators=100, subsample=0.8; total time=   2.1s


Parameters: { "use_label_encoder" } are not used.

  bst.update(dtrain, iteration=i, fobj=obj)


[CV] END colsample_bytree=0.8, gamma=0, learning_rate=0.01, max_depth=7, n_estimators=100, subsample=0.8; total time=   2.9s


Parameters: { "use_label_encoder" } are not used.

  bst.update(dtrain, iteration=i, fobj=obj)


[CV] END colsample_bytree=0.8, gamma=0.5, learning_rate=0.2, max_depth=10, n_estimators=200, subsample=0.7; total time=   2.1s
[CV] END colsample_bytree=1.0, gamma=0.2, learning_rate=0.1, max_depth=7, n_estimators=200, subsample=0.7; total time=   3.5s


Parameters: { "use_label_encoder" } are not used.

  bst.update(dtrain, iteration=i, fobj=obj)
Parameters: { "use_label_encoder" } are not used.

  bst.update(dtrain, iteration=i, fobj=obj)


[CV] END colsample_bytree=1.0, gamma=0.2, learning_rate=0.1, max_depth=7, n_estimators=200, subsample=0.7; total time=   3.3s


Parameters: { "use_label_encoder" } are not used.

  bst.update(dtrain, iteration=i, fobj=obj)


[CV] END colsample_bytree=0.8, gamma=0.5, learning_rate=0.2, max_depth=10, n_estimators=200, subsample=0.7; total time=   2.2s
[CV] END colsample_bytree=1.0, gamma=0.2, learning_rate=0.1, max_depth=7, n_estimators=200, subsample=0.7; total time=   3.2s


Parameters: { "use_label_encoder" } are not used.

  bst.update(dtrain, iteration=i, fobj=obj)
Parameters: { "use_label_encoder" } are not used.

  bst.update(dtrain, iteration=i, fobj=obj)


[CV] END colsample_bytree=1.0, gamma=0.2, learning_rate=0.1, max_depth=7, n_estimators=200, subsample=0.7; total time=   4.0s
[CV] END colsample_bytree=1.0, gamma=0.2, learning_rate=0.1, max_depth=7, n_estimators=200, subsample=0.7; total time=   4.0s


Parameters: { "use_label_encoder" } are not used.

  bst.update(dtrain, iteration=i, fobj=obj)
Parameters: { "use_label_encoder" } are not used.

  bst.update(dtrain, iteration=i, fobj=obj)


[CV] END colsample_bytree=0.8, gamma=0.5, learning_rate=0.2, max_depth=10, n_estimators=200, subsample=0.7; total time=   2.3s


Parameters: { "use_label_encoder" } are not used.

  bst.update(dtrain, iteration=i, fobj=obj)


[CV] END colsample_bytree=0.8, gamma=0.5, learning_rate=0.2, max_depth=10, n_estimators=200, subsample=0.7; total time=   2.0s
[CV] END colsample_bytree=0.7, gamma=0.5, learning_rate=0.05, max_depth=3, n_estimators=200, subsample=1.0; total time=   1.4s


Parameters: { "use_label_encoder" } are not used.

  bst.update(dtrain, iteration=i, fobj=obj)
Parameters: { "use_label_encoder" } are not used.

  bst.update(dtrain, iteration=i, fobj=obj)


[CV] END colsample_bytree=0.7, gamma=0.5, learning_rate=0.05, max_depth=3, n_estimators=200, subsample=1.0; total time=   1.4s
[CV] END colsample_bytree=0.7, gamma=0.5, learning_rate=0.05, max_depth=3, n_estimators=200, subsample=1.0; total time=   2.4s
[CV] END colsample_bytree=0.7, gamma=0.5, learning_rate=0.05, max_depth=3, n_estimators=200, subsample=1.0; total time=   1.7s


Parameters: { "use_label_encoder" } are not used.

  bst.update(dtrain, iteration=i, fobj=obj)
Parameters: { "use_label_encoder" } are not used.

  bst.update(dtrain, iteration=i, fobj=obj)
Parameters: { "use_label_encoder" } are not used.

  bst.update(dtrain, iteration=i, fobj=obj)


[CV] END colsample_bytree=0.7, gamma=0.5, learning_rate=0.05, max_depth=3, n_estimators=200, subsample=1.0; total time=   1.6s
[CV] END colsample_bytree=0.8, gamma=0.5, learning_rate=0.2, max_depth=10, n_estimators=200, subsample=0.7; total time=   2.8s


Parameters: { "use_label_encoder" } are not used.

  bst.update(dtrain, iteration=i, fobj=obj)
Parameters: { "use_label_encoder" } are not used.

  bst.update(dtrain, iteration=i, fobj=obj)


[CV] END colsample_bytree=0.8, gamma=0.2, learning_rate=0.05, max_depth=10, n_estimators=100, subsample=0.7; total time=   3.0s
[CV] END colsample_bytree=0.8, gamma=0.2, learning_rate=0.05, max_depth=10, n_estimators=100, subsample=0.7; total time=   2.9s


Parameters: { "use_label_encoder" } are not used.

  bst.update(dtrain, iteration=i, fobj=obj)
Parameters: { "use_label_encoder" } are not used.

  bst.update(dtrain, iteration=i, fobj=obj)


[CV] END colsample_bytree=0.8, gamma=0.2, learning_rate=0.05, max_depth=10, n_estimators=100, subsample=0.7; total time=   3.8s


Parameters: { "use_label_encoder" } are not used.

  bst.update(dtrain, iteration=i, fobj=obj)


[CV] END colsample_bytree=1.0, gamma=0, learning_rate=0.05, max_depth=7, n_estimators=300, subsample=1.0; total time=   5.2s


Parameters: { "use_label_encoder" } are not used.

  bst.update(dtrain, iteration=i, fobj=obj)


[CV] END colsample_bytree=1.0, gamma=0, learning_rate=0.05, max_depth=7, n_estimators=300, subsample=1.0; total time=   5.1s
[CV] END colsample_bytree=1.0, gamma=0, learning_rate=0.05, max_depth=7, n_estimators=300, subsample=1.0; total time=   5.5s


Parameters: { "use_label_encoder" } are not used.

  bst.update(dtrain, iteration=i, fobj=obj)
Parameters: { "use_label_encoder" } are not used.

  bst.update(dtrain, iteration=i, fobj=obj)


[CV] END colsample_bytree=1.0, gamma=0, learning_rate=0.05, max_depth=7, n_estimators=300, subsample=1.0; total time=   5.8s


Parameters: { "use_label_encoder" } are not used.

  bst.update(dtrain, iteration=i, fobj=obj)


[CV] END colsample_bytree=1.0, gamma=0, learning_rate=0.05, max_depth=7, n_estimators=300, subsample=1.0; total time=   5.9s
[CV] END colsample_bytree=0.8, gamma=0.2, learning_rate=0.05, max_depth=10, n_estimators=100, subsample=0.7; total time=   2.8s


Parameters: { "use_label_encoder" } are not used.

  bst.update(dtrain, iteration=i, fobj=obj)
Parameters: { "use_label_encoder" } are not used.

  bst.update(dtrain, iteration=i, fobj=obj)


[CV] END colsample_bytree=0.8, gamma=0.2, learning_rate=0.05, max_depth=10, n_estimators=100, subsample=0.7; total time=   3.6s


Parameters: { "use_label_encoder" } are not used.

  bst.update(dtrain, iteration=i, fobj=obj)


[CV] END colsample_bytree=0.7, gamma=0.1, learning_rate=0.05, max_depth=5, n_estimators=100, subsample=0.7; total time=   1.3s
[CV] END colsample_bytree=0.7, gamma=0.1, learning_rate=0.05, max_depth=5, n_estimators=100, subsample=0.7; total time=   1.3s


Parameters: { "use_label_encoder" } are not used.

  bst.update(dtrain, iteration=i, fobj=obj)
Parameters: { "use_label_encoder" } are not used.

  bst.update(dtrain, iteration=i, fobj=obj)


[CV] END colsample_bytree=0.7, gamma=0.2, learning_rate=0.2, max_depth=7, n_estimators=300, subsample=0.7; total time=   3.0s


Parameters: { "use_label_encoder" } are not used.

  bst.update(dtrain, iteration=i, fobj=obj)


[CV] END colsample_bytree=0.7, gamma=0.2, learning_rate=0.2, max_depth=7, n_estimators=300, subsample=0.7; total time=   3.1s
[CV] END colsample_bytree=0.7, gamma=0.2, learning_rate=0.2, max_depth=7, n_estimators=300, subsample=0.7; total time=   4.3s
[CV] END colsample_bytree=0.7, gamma=0.2, learning_rate=0.2, max_depth=7, n_estimators=300, subsample=0.7; total time=   2.9s


Parameters: { "use_label_encoder" } are not used.

  bst.update(dtrain, iteration=i, fobj=obj)
Parameters: { "use_label_encoder" } are not used.

  bst.update(dtrain, iteration=i, fobj=obj)
Parameters: { "use_label_encoder" } are not used.

  bst.update(dtrain, iteration=i, fobj=obj)
Parameters: { "use_label_encoder" } are not used.

  bst.update(dtrain, iteration=i, fobj=obj)


[CV] END colsample_bytree=0.7, gamma=0.2, learning_rate=0.2, max_depth=7, n_estimators=300, subsample=0.7; total time=   4.1s
[CV] END colsample_bytree=0.7, gamma=0.1, learning_rate=0.05, max_depth=5, n_estimators=100, subsample=0.7; total time=   1.3s


Parameters: { "use_label_encoder" } are not used.

  bst.update(dtrain, iteration=i, fobj=obj)


[CV] END colsample_bytree=0.7, gamma=0.1, learning_rate=0.05, max_depth=5, n_estimators=100, subsample=0.7; total time=   2.9s


Parameters: { "use_label_encoder" } are not used.

  bst.update(dtrain, iteration=i, fobj=obj)


[CV] END colsample_bytree=0.7, gamma=0.1, learning_rate=0.05, max_depth=5, n_estimators=100, subsample=0.7; total time=   2.7s


Parameters: { "use_label_encoder" } are not used.

  bst.update(dtrain, iteration=i, fobj=obj)
Parameters: { "use_label_encoder" } are not used.

  bst.update(dtrain, iteration=i, fobj=obj)


[CV] END colsample_bytree=1.0, gamma=0.5, learning_rate=0.2, max_depth=7, n_estimators=300, subsample=0.8; total time=   2.3s
[CV] END colsample_bytree=1.0, gamma=0.5, learning_rate=0.2, max_depth=7, n_estimators=300, subsample=0.8; total time=   2.3s


Parameters: { "use_label_encoder" } are not used.

  bst.update(dtrain, iteration=i, fobj=obj)


[CV] END colsample_bytree=1.0, gamma=0.5, learning_rate=0.2, max_depth=7, n_estimators=300, subsample=0.8; total time=   2.3s
[CV] END colsample_bytree=0.8, gamma=0.1, learning_rate=0.01, max_depth=5, n_estimators=200, subsample=0.7; total time=   2.4s


Parameters: { "use_label_encoder" } are not used.

  bst.update(dtrain, iteration=i, fobj=obj)
Parameters: { "use_label_encoder" } are not used.

  bst.update(dtrain, iteration=i, fobj=obj)


[CV] END colsample_bytree=1.0, gamma=0.5, learning_rate=0.2, max_depth=7, n_estimators=300, subsample=0.8; total time=   3.3s
[CV] END colsample_bytree=1.0, gamma=0.5, learning_rate=0.2, max_depth=7, n_estimators=300, subsample=0.8; total time=   3.4s


Parameters: { "use_label_encoder" } are not used.

  bst.update(dtrain, iteration=i, fobj=obj)
Parameters: { "use_label_encoder" } are not used.

  bst.update(dtrain, iteration=i, fobj=obj)


[CV] END colsample_bytree=0.8, gamma=0.1, learning_rate=0.01, max_depth=5, n_estimators=200, subsample=0.7; total time=   3.2s
[CV] END colsample_bytree=0.8, gamma=0.1, learning_rate=0.01, max_depth=5, n_estimators=200, subsample=0.7; total time=   2.6s


Parameters: { "use_label_encoder" } are not used.

  bst.update(dtrain, iteration=i, fobj=obj)
Parameters: { "use_label_encoder" } are not used.

  bst.update(dtrain, iteration=i, fobj=obj)


[CV] END colsample_bytree=0.8, gamma=0.1, learning_rate=0.01, max_depth=5, n_estimators=200, subsample=0.7; total time=   3.1s


Parameters: { "use_label_encoder" } are not used.

  bst.update(dtrain, iteration=i, fobj=obj)


[CV] END colsample_bytree=0.8, gamma=0.1, learning_rate=0.01, max_depth=5, n_estimators=200, subsample=0.7; total time=   4.5s


Parameters: { "use_label_encoder" } are not used.

  bst.update(dtrain, iteration=i, fobj=obj)


[CV] END colsample_bytree=0.8, gamma=0.5, learning_rate=0.2, max_depth=7, n_estimators=300, subsample=0.7; total time=   2.5s


Parameters: { "use_label_encoder" } are not used.

  bst.update(dtrain, iteration=i, fobj=obj)


[CV] END colsample_bytree=0.8, gamma=0.5, learning_rate=0.2, max_depth=7, n_estimators=300, subsample=0.7; total time=   3.0s


Parameters: { "use_label_encoder" } are not used.

  bst.update(dtrain, iteration=i, fobj=obj)


[CV] END colsample_bytree=0.8, gamma=0.5, learning_rate=0.2, max_depth=7, n_estimators=300, subsample=0.7; total time=   2.4s


Parameters: { "use_label_encoder" } are not used.

  bst.update(dtrain, iteration=i, fobj=obj)


[CV] END colsample_bytree=0.8, gamma=0.5, learning_rate=0.2, max_depth=7, n_estimators=300, subsample=0.7; total time=   4.0s


Parameters: { "use_label_encoder" } are not used.

  bst.update(dtrain, iteration=i, fobj=obj)


[CV] END colsample_bytree=0.8, gamma=0.5, learning_rate=0.2, max_depth=7, n_estimators=300, subsample=0.7; total time=   2.7s


Parameters: { "use_label_encoder" } are not used.

  bst.update(dtrain, iteration=i, fobj=obj)


[CV] END colsample_bytree=0.7, gamma=0, learning_rate=0.01, max_depth=10, n_estimators=300, subsample=0.7; total time=  11.5s
[CV] END colsample_bytree=0.7, gamma=0, learning_rate=0.01, max_depth=10, n_estimators=300, subsample=0.7; total time=  11.5s


Parameters: { "use_label_encoder" } are not used.

  bst.update(dtrain, iteration=i, fobj=obj)
Parameters: { "use_label_encoder" } are not used.

  bst.update(dtrain, iteration=i, fobj=obj)


[CV] END colsample_bytree=0.7, gamma=0, learning_rate=0.01, max_depth=10, n_estimators=300, subsample=0.7; total time=  11.5s


Parameters: { "use_label_encoder" } are not used.

  bst.update(dtrain, iteration=i, fobj=obj)


[CV] END colsample_bytree=0.7, gamma=0, learning_rate=0.01, max_depth=10, n_estimators=300, subsample=0.7; total time=  11.8s


Parameters: { "use_label_encoder" } are not used.

  bst.update(dtrain, iteration=i, fobj=obj)


[CV] END colsample_bytree=0.8, gamma=0, learning_rate=0.1, max_depth=10, n_estimators=300, subsample=0.8; total time=   7.7s


Parameters: { "use_label_encoder" } are not used.

  bst.update(dtrain, iteration=i, fobj=obj)


[CV] END colsample_bytree=0.7, gamma=0, learning_rate=0.01, max_depth=10, n_estimators=300, subsample=0.7; total time=  14.1s


Parameters: { "use_label_encoder" } are not used.

  bst.update(dtrain, iteration=i, fobj=obj)


[CV] END colsample_bytree=0.7, gamma=0.5, learning_rate=0.01, max_depth=3, n_estimators=300, subsample=0.7; total time=   2.8s


Parameters: { "use_label_encoder" } are not used.

  bst.update(dtrain, iteration=i, fobj=obj)


[CV] END colsample_bytree=0.8, gamma=0, learning_rate=0.1, max_depth=10, n_estimators=300, subsample=0.8; total time=   8.3s


Parameters: { "use_label_encoder" } are not used.

  bst.update(dtrain, iteration=i, fobj=obj)


[CV] END colsample_bytree=0.7, gamma=0.5, learning_rate=0.01, max_depth=3, n_estimators=300, subsample=0.7; total time=   2.4s


Parameters: { "use_label_encoder" } are not used.

  bst.update(dtrain, iteration=i, fobj=obj)


[CV] END colsample_bytree=0.8, gamma=0, learning_rate=0.1, max_depth=10, n_estimators=300, subsample=0.8; total time=   8.7s
[CV] END colsample_bytree=0.7, gamma=0.5, learning_rate=0.01, max_depth=3, n_estimators=300, subsample=0.7; total time=   2.7s


Parameters: { "use_label_encoder" } are not used.

  bst.update(dtrain, iteration=i, fobj=obj)
Parameters: { "use_label_encoder" } are not used.

  bst.update(dtrain, iteration=i, fobj=obj)


[CV] END colsample_bytree=0.7, gamma=0.5, learning_rate=0.01, max_depth=3, n_estimators=300, subsample=0.7; total time=   3.0s
[CV] END colsample_bytree=0.7, gamma=0.5, learning_rate=0.01, max_depth=3, n_estimators=300, subsample=0.7; total time=   2.8s


Parameters: { "use_label_encoder" } are not used.

  bst.update(dtrain, iteration=i, fobj=obj)


[CV] END colsample_bytree=0.7, gamma=0.2, learning_rate=0.1, max_depth=10, n_estimators=200, subsample=1.0; total time=   2.7s
[CV] END colsample_bytree=0.8, gamma=0, learning_rate=0.1, max_depth=10, n_estimators=300, subsample=0.8; total time=   7.4s
[CV] END colsample_bytree=0.7, gamma=0.2, learning_rate=0.1, max_depth=10, n_estimators=200, subsample=1.0; total time=   3.3s
[CV] END colsample_bytree=0.8, gamma=0, learning_rate=0.1, max_depth=10, n_estimators=300, subsample=0.8; total time=   7.8s
[CV] END colsample_bytree=0.7, gamma=0.2, learning_rate=0.1, max_depth=10, n_estimators=200, subsample=1.0; total time=   2.6s
[CV] END colsample_bytree=0.7, gamma=0.2, learning_rate=0.1, max_depth=10, n_estimators=200, subsample=1.0; total time=   2.6s
[CV] END colsample_bytree=0.7, gamma=0.2, learning_rate=0.1, max_depth=10, n_estimators=200, subsample=1.0; total time=   2.1s


Parameters: { "use_label_encoder" } are not used.

  bst.update(dtrain, iteration=i, fobj=obj)


Best parameters found: {'subsample': 0.7, 'n_estimators': 100, 'max_depth': 10, 'learning_rate': 0.05, 'gamma': 0.2, 'colsample_bytree': 0.8}
Best cross-validation score: 0.7911041011502872


Parameters: { "use_label_encoder" } are not used.

  bst.update(dtrain, iteration=i, fobj=obj)


✅ Submission file with ID saved as submission.csv


primeiro xgboost