Datos originales

In [19]:
import pandas as pd
from sklearn.model_selection import train_test_split
from sklearn.impute import SimpleImputer
from sklearn.preprocessing import StandardScaler
from sklearn.ensemble import RandomForestRegressor
from xgboost import XGBRegressor
from lightgbm import LGBMRegressor
from sklearn.neighbors import KNeighborsRegressor
from sklearn.naive_bayes import GaussianNB
from sklearn.metrics import mean_absolute_error
import numpy as np

# Cargar los datos
train_features = pd.read_csv("dengue_features_train.csv")
train_labels = pd.read_csv("dengue_labels_train.csv")

# Unir las etiquetas con las características para análisis más sencillo
data = train_features.merge(train_labels, on=["city", "year", "weekofyear"])

# Separar por ciudad
data_sj = data[data["city"] == "sj"].drop(columns=["city"])
data_iq = data[data["city"] == "iq"].drop(columns=["city"])

# Características (sin la fecha y etiquetas)
features = [col for col in data_sj.columns if col not in ["total_cases", "week_start_date"]]

# Función para evaluar los modelos
def evaluate_advanced_models(data, selected_features, imputer, scaler, transformation="log"):
    X = data[selected_features]
    y = data["total_cases"]

    # Separar en entrenamiento y prueba
    X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.2, random_state=42)

    # Imputación
    X_train = imputer.fit_transform(X_train)
    X_test = imputer.transform(X_test)

    # Aplicar transformación logarítmica
    if transformation == "log":
        X_train = np.log1p(np.abs(X_train))  # log(1 + x) para evitar problemas con ceros
        X_test = np.log1p(np.abs(X_test))

    # Escalado
    X_train = scaler.fit_transform(X_train)
    X_test = scaler.transform(X_test)

    # Modelos
    models = {
        "RandomForest": RandomForestRegressor(n_estimators=100, random_state=42),
        "XGBoost": XGBRegressor(n_estimators=100, random_state=42),
        "LightGBM": LGBMRegressor(n_estimators=100, random_state=42),
        "KNN": KNeighborsRegressor(n_neighbors=5),
        "NaiveBayes": GaussianNB()
    }

    results = {}
    for name, model in models.items():
        model.fit(X_train, y_train)
        y_pred = model.predict(X_test)
        results[name] = mean_absolute_error(y_test, y_pred)

    return results

# Imputador y escalador
imputer_sj = SimpleImputer(strategy="most_frequent")
imputer_iq = SimpleImputer(strategy="median")
scaler = StandardScaler()

# Evaluar para San Juan e Iquitos
results_sj = evaluate_advanced_models(data_sj, features, imputer_sj, scaler, "log")
results_iq = evaluate_advanced_models(data_iq, features, imputer_iq, scaler, "log")

# Crear DataFrame con los resultados
df_results = pd.DataFrame([results_sj, results_iq], index=["San Juan", "Iquitos"])

# Mostrar la tabla en el notebook
display(df_results.style.set_caption("Resultados de Modelos DengAI"))




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000405 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3816
[LightGBM] [Info] Number of data points in the train set: 748, number of used features: 22
[LightGBM] [Info] Start training from score 34.330214
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000277 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2398
[LightGBM] [Info] Number of data points in the train set: 416, number of used features: 22
[LightGBM] [Info] Start training from score 7.685096




Unnamed: 0,RandomForest,XGBoost,LightGBM,KNN,NaiveBayes
San Juan,14.809947,11.873291,14.610059,24.335106,32.819149
Iquitos,5.700673,5.525403,5.960778,7.571154,9.259615


Datos clean

In [21]:
import pandas as pd
from sklearn.model_selection import train_test_split
from sklearn.impute import SimpleImputer
from sklearn.preprocessing import StandardScaler
from sklearn.ensemble import RandomForestRegressor
from xgboost import XGBRegressor
from lightgbm import LGBMRegressor
from sklearn.neighbors import KNeighborsRegressor
from sklearn.naive_bayes import GaussianNB
from sklearn.metrics import mean_absolute_error
import numpy as np
from IPython.display import display

# Cargar los datos LIMPIOS
data_sj = pd.read_csv("analisis/train_sj_clean.csv")
data_iq = pd.read_csv("analisis/train_iq_clean.csv")

# Características (sin la fecha y etiquetas)
features_sj = [col for col in data_sj.columns if col not in ["total_cases", "week_start_date"]]
features_iq = [col for col in data_iq.columns if col not in ["total_cases", "week_start_date"]]

# Función para evaluar los modelos
def evaluate_advanced_models(data, selected_features, imputer, scaler, transformation="log"):
    X = data[selected_features]
    y = data["total_cases"]

    # Separar en entrenamiento y prueba
    X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.2, random_state=42)

    # Imputación
    X_train = imputer.fit_transform(X_train)
    X_test = imputer.transform(X_test)

    # Aplicar transformación logarítmica
    if transformation == "log":
        X_train = np.log1p(np.abs(X_train))  # log(1 + x) para evitar problemas con ceros
        X_test = np.log1p(np.abs(X_test))

    # Escalado
    X_train = scaler.fit_transform(X_train)
    X_test = scaler.transform(X_test)

    # Modelos
    models = {
        "RandomForest": RandomForestRegressor(n_estimators=100, random_state=42),
        "XGBoost": XGBRegressor(n_estimators=100, random_state=42),
        "LightGBM": LGBMRegressor(n_estimators=100, random_state=42),
        "KNN": KNeighborsRegressor(n_neighbors=5),
        "NaiveBayes": GaussianNB()
    }

    results = {}
    for name, model in models.items():
        model.fit(X_train, y_train)
        y_pred = model.predict(X_test)
        results[name] = mean_absolute_error(y_test, y_pred)

    return results

# Imputador y escalador
imputer_sj = SimpleImputer(strategy="most_frequent")
imputer_iq = SimpleImputer(strategy="median")
scaler = StandardScaler()

# Evaluar para San Juan e Iquitos usando los datos LIMPIOS
results_sj = evaluate_advanced_models(data_sj, features_sj, imputer_sj, scaler, "log")
results_iq = evaluate_advanced_models(data_iq, features_iq, imputer_iq, scaler, "log")

# Crear DataFrame con los resultados
df_results = pd.DataFrame([results_sj, results_iq], index=["San Juan", "Iquitos"])

# Mostrar la tabla en el notebook
display(df_results)




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000159 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3839
[LightGBM] [Info] Number of data points in the train set: 748, number of used features: 22
[LightGBM] [Info] Start training from score 34.330214
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000161 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2420
[LightGBM] [Info] Number of data points in the train set: 416, number of used features: 22
[LightGBM] [Info] Start training from score 7.685096




Unnamed: 0,RandomForest,XGBoost,LightGBM,KNN,NaiveBayes
San Juan,15.322181,12.1365,16.724204,23.8,32.62766
Iquitos,5.751442,5.510869,5.644914,7.344231,9.5


Clean 2

In [23]:
import pandas as pd
from sklearn.model_selection import train_test_split
from sklearn.impute import SimpleImputer
from sklearn.preprocessing import StandardScaler
from sklearn.ensemble import RandomForestRegressor
from xgboost import XGBRegressor
from lightgbm import LGBMRegressor
from sklearn.neighbors import KNeighborsRegressor
from sklearn.naive_bayes import GaussianNB
from sklearn.metrics import mean_absolute_error
import numpy as np
from IPython.display import display

# Cargar los datos LIMPIOS
data_sj = pd.read_csv("analisis/train_sj_clean2.csv")
data_iq = pd.read_csv("analisis/train_iq_clean2.csv")

# Características (sin la fecha y etiquetas)
features_sj = [col for col in data_sj.columns if col not in ["total_cases", "week_start_date"]]
features_iq = [col for col in data_iq.columns if col not in ["total_cases", "week_start_date"]]

# Función para evaluar los modelos
def evaluate_advanced_models(data, selected_features, imputer, scaler, transformation="log"):
    X = data[selected_features]
    y = data["total_cases"]

    # Separar en entrenamiento y prueba
    X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.2, random_state=42)

    # Imputación
    X_train = imputer.fit_transform(X_train)
    X_test = imputer.transform(X_test)

    # Aplicar transformación logarítmica
    if transformation == "log":
        X_train = np.log1p(np.abs(X_train))  # log(1 + x) para evitar problemas con ceros
        X_test = np.log1p(np.abs(X_test))

    # Escalado
    X_train = scaler.fit_transform(X_train)
    X_test = scaler.transform(X_test)

    # Modelos
    models = {
        "RandomForest": RandomForestRegressor(n_estimators=100, random_state=42),
        "XGBoost": XGBRegressor(n_estimators=100, random_state=42),
        "LightGBM": LGBMRegressor(n_estimators=100, random_state=42),
        "KNN": KNeighborsRegressor(n_neighbors=5),
        "NaiveBayes": GaussianNB()
    }

    results = {}
    for name, model in models.items():
        model.fit(X_train, y_train)
        y_pred = model.predict(X_test)
        results[name] = mean_absolute_error(y_test, y_pred)

    return results

# Imputador y escalador
imputer_sj = SimpleImputer(strategy="most_frequent")
imputer_iq = SimpleImputer(strategy="median")
scaler = StandardScaler()

# Evaluar para San Juan e Iquitos usando los datos LIMPIOS
results_sj = evaluate_advanced_models(data_sj, features_sj, imputer_sj, scaler, "log")
results_iq = evaluate_advanced_models(data_iq, features_iq, imputer_iq, scaler, "log")

# Crear DataFrame con los resultados
df_results = pd.DataFrame([results_sj, results_iq], index=["San Juan", "Iquitos"])

# Mostrar la tabla en el notebook
display(df_results)




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000164 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3839
[LightGBM] [Info] Number of data points in the train set: 748, number of used features: 22
[LightGBM] [Info] Start training from score 34.330214
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000119 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2420
[LightGBM] [Info] Number of data points in the train set: 416, number of used features: 22
[LightGBM] [Info] Start training from score 7.685096




Unnamed: 0,RandomForest,XGBoost,LightGBM,KNN,NaiveBayes
San Juan,15.322181,12.1365,16.724204,23.8,32.62766
Iquitos,5.751442,5.510869,5.644914,7.344231,9.5


XGBoost y LightGBM

In [28]:
import pandas as pd
from sklearn.model_selection import train_test_split, GridSearchCV
from sklearn.impute import SimpleImputer
from sklearn.preprocessing import StandardScaler
from xgboost import XGBRegressor
from lightgbm import LGBMRegressor
from sklearn.metrics import mean_absolute_error
import numpy as np

# Cargar los datos procesados
train_sj = pd.read_csv("analisis/train_sj_clean.csv")
train_iq = pd.read_csv("analisis/train_iq_clean.csv")

# Características (sin la fecha y etiquetas)
features = [col for col in train_sj.columns if col not in ["total_cases", "week_start_date"]]

# Preparar los datos
X_sj = train_sj[features]
y_sj = train_sj["total_cases"]
X_iq = train_iq[features]
y_iq = train_iq["total_cases"]

# Imputación y escalado
imputer_sj = SimpleImputer(strategy="most_frequent")
imputer_iq = SimpleImputer(strategy="median")
scaler = StandardScaler()

# Dividir en entrenamiento y prueba
X_train_sj, X_test_sj, y_train_sj, y_test_sj = train_test_split(X_sj, y_sj, test_size=0.2, random_state=42)
X_train_iq, X_test_iq, y_train_iq, y_test_iq = train_test_split(X_iq, y_iq, test_size=0.2, random_state=42)

# Preprocesar los datos
X_train_sj = imputer_sj.fit_transform(X_train_sj)
X_test_sj = imputer_sj.transform(X_test_sj)
X_train_iq = imputer_iq.fit_transform(X_train_iq)
X_test_iq = imputer_iq.transform(X_test_iq)

X_train_sj = scaler.fit_transform(X_train_sj)
X_test_sj = scaler.transform(X_test_sj)
X_train_iq = scaler.fit_transform(X_train_iq)
X_test_iq = scaler.transform(X_test_iq)

# Definir el espacio de búsqueda para XGBoost
xgb_param_grid = {
    'n_estimators': [100, 200],
    'learning_rate': [0.01, 0.1, 0.2],
    'max_depth': [3, 5, 7],
    'subsample': [0.8, 1.0]
}

# Definir el espacio de búsqueda para LightGBM
lgb_param_grid = {
    'n_estimators': [100, 200],
    'learning_rate': [0.01, 0.1, 0.2],
    'max_depth': [3, 5, 7],
    'num_leaves': [31, 50]
}

# Función para optimizar los modelos
def optimize_model(model, param_grid, X_train, y_train):
    grid_search = GridSearchCV(estimator=model, param_grid=param_grid, scoring='neg_mean_absolute_error', cv=5)
    grid_search.fit(X_train, y_train)
    return grid_search.best_params_, grid_search.best_score_

# Optimización de XGBoost y LightGBM para San Juan
best_params_xgb_sj, best_score_xgb_sj = optimize_model(XGBRegressor(random_state=42), xgb_param_grid, X_train_sj, y_train_sj)
best_params_lgb_sj, best_score_lgb_sj = optimize_model(LGBMRegressor(random_state=42), lgb_param_grid, X_train_sj, y_train_sj)

# Optimización de XGBoost y LightGBM para Iquitos
best_params_xgb_iq, best_score_xgb_iq = optimize_model(XGBRegressor(random_state=42), xgb_param_grid, X_train_iq, y_train_iq)
best_params_lgb_iq, best_score_lgb_iq = optimize_model(LGBMRegressor(random_state=42), lgb_param_grid, X_train_iq, y_train_iq)

# Función para evaluar los modelos
def evaluate_advanced_models(data, selected_features, imputer, scaler, transformation="log"):
    X = data[selected_features]
    y = data["total_cases"]

    # Separar en entrenamiento y prueba
    X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.2, random_state=42)

    # Imputación
    X_train = imputer.fit_transform(X_train)
    X_test = imputer.transform(X_test)

    # Aplicar transformación logarítmica
    if transformation == "log":
        X_train = np.log1p(np.abs(X_train))  # log(1 + x) para evitar problemas con ceros
        X_test = np.log1p(np.abs(X_test))

    # Escalado
    X_train = scaler.fit_transform(X_train)
    X_test = scaler.transform(X_test)

    # Modelos
    models = {
        "XGBoost": XGBRegressor(n_estimators=100, random_state=42),
        "LightGBM": LGBMRegressor(n_estimators=100, random_state=42)
    }

    results = {}
    for name, model in models.items():
        model.fit(X_train, y_train)
        y_pred = model.predict(X_test)
        results[name] = mean_absolute_error(y_test, y_pred)

    return results

# Evaluar los modelos optimizados para San Juan e Iquitos
sj_results = evaluate_advanced_models(train_sj, features, imputer_sj, scaler, "log")
iq_results = evaluate_advanced_models(train_iq, features, imputer_iq, scaler, "log")

# Imprimir los resultados
print("Resultados optimizados para San Juan:", sj_results)
print("Resultados optimizados para Iquitos:", iq_results)




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000258 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3210
[LightGBM] [Info] Number of data points in the train set: 598, number of used features: 22
[LightGBM] [Info] Start training from score 33.170569
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000258 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3210
[LightGBM] [Info] Number of data points in the train set: 598, number of used features: 22
[LightGBM] [Info] Start training from score 34.541806
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000257 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3219
[LightGBM] [Info] Number of data points in the train set: 598, number of used features: 22
[LightGBM] [Info] Start trainin



[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000257 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3210
[LightGBM] [Info] Number of data points in the train set: 598, number of used features: 22
[LightGBM] [Info] Start training from score 33.170569
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000241 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3210
[LightGBM] [Info] Number of data points in the train set: 598, number of used features: 22
[LightGBM] [Info] Start training from score 34.541806
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000242 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3219
[LightGBM] [Info] Number of data points in the train set: 598, number of used features: 22
[LightGBM] [Info] Start trainin



[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000382 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3214
[LightGBM] [Info] Number of data points in the train set: 599, number of used features: 22
[LightGBM] [Info] Start training from score 35.113523
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000235 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3227
[LightGBM] [Info] Number of data points in the train set: 599, number of used features: 22
[LightGBM] [Info] Start training from score 35.217028
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000226 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3210
[LightGBM] [Info] Number of data points in the train set: 598, number of used features: 22
[LightGBM] [Info] Start trainin



[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000566 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3210
[LightGBM] [Info] Number of data points in the train set: 598, number of used features: 22
[LightGBM] [Info] Start training from score 34.541806
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000380 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3219
[LightGBM] [Info] Number of data points in the train set: 598, number of used features: 22
[LightGBM] [Info] Start training from score 33.605351




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000593 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3214
[LightGBM] [Info] Number of data points in the train set: 599, number of used features: 22
[LightGBM] [Info] Start training from score 35.113523
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000223 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3227
[LightGBM] [Info] Number of data points in the train set: 599, number of used features: 22
[LightGBM] [Info] Start training from score 35.217028
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000593 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3210
[LightGBM] [Info] Number of data points in the train set: 598, number of used features: 22
[LightGBM] [Info] Start trainin



[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000230 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3210
[LightGBM] [Info] Number of data points in the train set: 598, number of used features: 22
[LightGBM] [Info] Start training from score 34.541806
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000302 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3219
[LightGBM] [Info] Number of data points in the train set: 598, number of used features: 22
[LightGBM] [Info] Start training from score 33.605351
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000220 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3214
[LightGBM] [Info] Number of data points in the train set: 599, number of used features: 22
[LightGBM] [Info] Start trainin



[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000574 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3227
[LightGBM] [Info] Number of data points in the train set: 599, number of used features: 22
[LightGBM] [Info] Start training from score 35.217028
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000245 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3210
[LightGBM] [Info] Number of data points in the train set: 598, number of used features: 22
[LightGBM] [Info] Start training from score 33.170569




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000233 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3210
[LightGBM] [Info] Number of data points in the train set: 598, number of used features: 22
[LightGBM] [Info] Start training from score 34.541806
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000241 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3219
[LightGBM] [Info] Number of data points in the train set: 598, number of used features: 22
[LightGBM] [Info] Start training from score 33.605351
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000914 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3214
[LightGBM] [Info] Number of data points in the train set: 599, number of used features: 22
[LightGBM] [Info] Start trainin



[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000264 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3227
[LightGBM] [Info] Number of data points in the train set: 599, number of used features: 22
[LightGBM] [Info] Start training from score 35.217028
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000242 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3210
[LightGBM] [Info] Number of data points in the train set: 598, number of used features: 22
[LightGBM] [Info] Start training from score 33.170569




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000381 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3210
[LightGBM] [Info] Number of data points in the train set: 598, number of used features: 22
[LightGBM] [Info] Start training from score 34.541806
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000288 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3219
[LightGBM] [Info] Number of data points in the train set: 598, number of used features: 22
[LightGBM] [Info] Start training from score 33.605351
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000556 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3214
[LightGBM] [Info] Number of data points in the train set: 599, number of used features: 22
[LightGBM] [Info] Start trainin



[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000282 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3227
[LightGBM] [Info] Number of data points in the train set: 599, number of used features: 22
[LightGBM] [Info] Start training from score 35.217028




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000860 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3210
[LightGBM] [Info] Number of data points in the train set: 598, number of used features: 22
[LightGBM] [Info] Start training from score 33.170569
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000580 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3210
[LightGBM] [Info] Number of data points in the train set: 598, number of used features: 22
[LightGBM] [Info] Start training from score 34.541806




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000590 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3219
[LightGBM] [Info] Number of data points in the train set: 598, number of used features: 22
[LightGBM] [Info] Start training from score 33.605351
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000344 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3214
[LightGBM] [Info] Number of data points in the train set: 599, number of used features: 22
[LightGBM] [Info] Start training from score 35.113523
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000215 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3227
[LightGBM] [Info] Number of data points in the train set: 599, number of used features: 22
[LightGBM] [Info] Start trainin



[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000231 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3210
[LightGBM] [Info] Number of data points in the train set: 598, number of used features: 22
[LightGBM] [Info] Start training from score 33.170569
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000335 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3210
[LightGBM] [Info] Number of data points in the train set: 598, number of used features: 22
[LightGBM] [Info] Start training from score 34.541806




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000209 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3219
[LightGBM] [Info] Number of data points in the train set: 598, number of used features: 22
[LightGBM] [Info] Start training from score 33.605351
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000560 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3214
[LightGBM] [Info] Number of data points in the train set: 599, number of used features: 22
[LightGBM] [Info] Start training from score 35.113523




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000584 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3227
[LightGBM] [Info] Number of data points in the train set: 599, number of used features: 22
[LightGBM] [Info] Start training from score 35.217028




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.001120 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 3210
[LightGBM] [Info] Number of data points in the train set: 598, number of used features: 22
[LightGBM] [Info] Start training from score 33.170569
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000592 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3210
[LightGBM] [Info] Number of data points in the train set: 598, number of used features: 22
[LightGBM] [Info] Start training from score 34.541806
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000229 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3219
[LightGBM] [Info] Number of data points in the train set: 



[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000574 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3227
[LightGBM] [Info] Number of data points in the train set: 599, number of used features: 22
[LightGBM] [Info] Start training from score 35.217028
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000238 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3210
[LightGBM] [Info] Number of data points in the train set: 598, number of used features: 22
[LightGBM] [Info] Start training from score 33.170569




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000231 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3210
[LightGBM] [Info] Number of data points in the train set: 598, number of used features: 22
[LightGBM] [Info] Start training from score 34.541806
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000382 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3219
[LightGBM] [Info] Number of data points in the train set: 598, number of used features: 22
[LightGBM] [Info] Start training from score 33.605351




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000563 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3214
[LightGBM] [Info] Number of data points in the train set: 599, number of used features: 22
[LightGBM] [Info] Start training from score 35.113523
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000219 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3227
[LightGBM] [Info] Number of data points in the train set: 599, number of used features: 22
[LightGBM] [Info] Start training from score 35.217028




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000229 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3210
[LightGBM] [Info] Number of data points in the train set: 598, number of used features: 22
[LightGBM] [Info] Start training from score 33.170569
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000263 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3210
[LightGBM] [Info] Number of data points in the train set: 598, number of used features: 22
[LightGBM] [Info] Start training from score 34.541806




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000236 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3219
[LightGBM] [Info] Number of data points in the train set: 598, number of used features: 22
[LightGBM] [Info] Start training from score 33.605351




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000534 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3214
[LightGBM] [Info] Number of data points in the train set: 599, number of used features: 22
[LightGBM] [Info] Start training from score 35.113523
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000404 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3227
[LightGBM] [Info] Number of data points in the train set: 599, number of used features: 22
[LightGBM] [Info] Start training from score 35.217028
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000256 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3210
[LightGBM] [Info] Number of data points in the train set: 598, number of used features: 22
[LightGBM] [Info] Start trainin



[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000223 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3210
[LightGBM] [Info] Number of data points in the train set: 598, number of used features: 22
[LightGBM] [Info] Start training from score 34.541806
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000221 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3219
[LightGBM] [Info] Number of data points in the train set: 598, number of used features: 22
[LightGBM] [Info] Start training from score 33.605351
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000363 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3214
[LightGBM] [Info] Number of data points in the train set: 599, number of used features: 22
[LightGBM] [Info] Start trainin



[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.007876 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3210
[LightGBM] [Info] Number of data points in the train set: 598, number of used features: 22
[LightGBM] [Info] Start training from score 34.541806
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000251 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3219
[LightGBM] [Info] Number of data points in the train set: 598, number of used features: 22
[LightGBM] [Info] Start training from score 33.605351




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000584 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3214
[LightGBM] [Info] Number of data points in the train set: 599, number of used features: 22
[LightGBM] [Info] Start training from score 35.113523
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000279 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3227
[LightGBM] [Info] Number of data points in the train set: 599, number of used features: 22
[LightGBM] [Info] Start training from score 35.217028
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000381 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3210
[LightGBM] [Info] Number of data points in the train set: 598, number of used features: 22
[LightGBM] [Info] Start trainin



[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000406 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3210
[LightGBM] [Info] Number of data points in the train set: 598, number of used features: 22
[LightGBM] [Info] Start training from score 34.541806
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000255 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3219
[LightGBM] [Info] Number of data points in the train set: 598, number of used features: 22
[LightGBM] [Info] Start training from score 33.605351




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000423 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3214
[LightGBM] [Info] Number of data points in the train set: 599, number of used features: 22
[LightGBM] [Info] Start training from score 35.113523
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000218 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3227
[LightGBM] [Info] Number of data points in the train set: 599, number of used features: 22
[LightGBM] [Info] Start training from score 35.217028
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000261 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3210
[LightGBM] [Info] Number of data points in the train set: 598, number of used features: 22
[LightGBM] [Info] Start trainin



[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000581 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3210
[LightGBM] [Info] Number of data points in the train set: 598, number of used features: 22
[LightGBM] [Info] Start training from score 34.541806
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000237 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3219
[LightGBM] [Info] Number of data points in the train set: 598, number of used features: 22
[LightGBM] [Info] Start training from score 33.605351
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000575 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3214
[LightGBM] [Info] Number of data points in the train set: 599, number of used features: 22
[LightGBM] [Info] Start trainin



[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000232 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3227
[LightGBM] [Info] Number of data points in the train set: 599, number of used features: 22
[LightGBM] [Info] Start training from score 35.217028
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000230 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3210
[LightGBM] [Info] Number of data points in the train set: 598, number of used features: 22
[LightGBM] [Info] Start training from score 33.170569
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000399 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3210
[LightGBM] [Info] Number of data points in the train set: 598, number of used features: 22
[LightGBM] [Info] Start trainin



[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000241 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3219
[LightGBM] [Info] Number of data points in the train set: 598, number of used features: 22
[LightGBM] [Info] Start training from score 33.605351
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000216 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3214
[LightGBM] [Info] Number of data points in the train set: 599, number of used features: 22
[LightGBM] [Info] Start training from score 35.113523
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.013136 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 3227
[LightGBM] [Info] Number of data points in the train set: 



[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000252 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3210
[LightGBM] [Info] Number of data points in the train set: 598, number of used features: 22
[LightGBM] [Info] Start training from score 33.170569
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000253 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3210
[LightGBM] [Info] Number of data points in the train set: 598, number of used features: 22
[LightGBM] [Info] Start training from score 34.541806




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000385 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3219
[LightGBM] [Info] Number of data points in the train set: 598, number of used features: 22
[LightGBM] [Info] Start training from score 33.605351




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000394 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3214
[LightGBM] [Info] Number of data points in the train set: 599, number of used features: 22
[LightGBM] [Info] Start training from score 35.113523
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000351 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3227
[LightGBM] [Info] Number of data points in the train set: 599, number of used features: 22
[LightGBM] [Info] Start training from score 35.217028




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000244 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3210
[LightGBM] [Info] Number of data points in the train set: 598, number of used features: 22
[LightGBM] [Info] Start training from score 33.170569




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000251 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3210
[LightGBM] [Info] Number of data points in the train set: 598, number of used features: 22
[LightGBM] [Info] Start training from score 34.541806
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000641 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3219
[LightGBM] [Info] Number of data points in the train set: 598, number of used features: 22
[LightGBM] [Info] Start training from score 33.605351
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000236 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3214
[LightGBM] [Info] Number of data points in the train set: 599, number of used features: 22
[LightGBM] [Info] Start trainin



[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000222 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3210
[LightGBM] [Info] Number of data points in the train set: 598, number of used features: 22
[LightGBM] [Info] Start training from score 33.170569
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000220 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3210
[LightGBM] [Info] Number of data points in the train set: 598, number of used features: 22
[LightGBM] [Info] Start training from score 34.541806




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000559 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3219
[LightGBM] [Info] Number of data points in the train set: 598, number of used features: 22
[LightGBM] [Info] Start training from score 33.605351
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000570 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3214
[LightGBM] [Info] Number of data points in the train set: 599, number of used features: 22
[LightGBM] [Info] Start training from score 35.113523
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000219 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3227
[LightGBM] [Info] Number of data points in the train set: 599, number of used features: 22
[LightGBM] [Info] Start trainin



[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000412 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3210
[LightGBM] [Info] Number of data points in the train set: 598, number of used features: 22
[LightGBM] [Info] Start training from score 33.170569




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000593 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3210
[LightGBM] [Info] Number of data points in the train set: 598, number of used features: 22
[LightGBM] [Info] Start training from score 34.541806
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000632 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3219
[LightGBM] [Info] Number of data points in the train set: 598, number of used features: 22
[LightGBM] [Info] Start training from score 33.605351




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000416 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3214
[LightGBM] [Info] Number of data points in the train set: 599, number of used features: 22
[LightGBM] [Info] Start training from score 35.113523
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000264 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3227
[LightGBM] [Info] Number of data points in the train set: 599, number of used features: 22
[LightGBM] [Info] Start training from score 35.217028




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000255 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3210
[LightGBM] [Info] Number of data points in the train set: 598, number of used features: 22
[LightGBM] [Info] Start training from score 33.170569
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000233 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3210
[LightGBM] [Info] Number of data points in the train set: 598, number of used features: 22
[LightGBM] [Info] Start training from score 34.541806




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000255 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3219
[LightGBM] [Info] Number of data points in the train set: 598, number of used features: 22
[LightGBM] [Info] Start training from score 33.605351




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000616 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3214
[LightGBM] [Info] Number of data points in the train set: 599, number of used features: 22
[LightGBM] [Info] Start training from score 35.113523
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000242 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3227
[LightGBM] [Info] Number of data points in the train set: 599, number of used features: 22
[LightGBM] [Info] Start training from score 35.217028




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000750 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3210
[LightGBM] [Info] Number of data points in the train set: 598, number of used features: 22
[LightGBM] [Info] Start training from score 33.170569
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002162 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3210
[LightGBM] [Info] Number of data points in the train set: 598, number of used features: 22
[LightGBM] [Info] Start training from score 34.541806




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000570 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3219
[LightGBM] [Info] Number of data points in the train set: 598, number of used features: 22
[LightGBM] [Info] Start training from score 33.605351




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000527 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3214
[LightGBM] [Info] Number of data points in the train set: 599, number of used features: 22
[LightGBM] [Info] Start training from score 35.113523
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000234 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3227
[LightGBM] [Info] Number of data points in the train set: 599, number of used features: 22
[LightGBM] [Info] Start training from score 35.217028




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000630 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3210
[LightGBM] [Info] Number of data points in the train set: 598, number of used features: 22
[LightGBM] [Info] Start training from score 33.170569




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000281 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3210
[LightGBM] [Info] Number of data points in the train set: 598, number of used features: 22
[LightGBM] [Info] Start training from score 34.541806
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.001123 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 3219
[LightGBM] [Info] Number of data points in the train set: 598, number of used features: 22
[LightGBM] [Info] Start training from score 33.605351
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000251 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3214
[LightGBM] [Info] Number of data points in the train set: 



[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000264 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3227
[LightGBM] [Info] Number of data points in the train set: 599, number of used features: 22
[LightGBM] [Info] Start training from score 35.217028
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000513 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3210
[LightGBM] [Info] Number of data points in the train set: 598, number of used features: 22
[LightGBM] [Info] Start training from score 33.170569
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000243 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3210
[LightGBM] [Info] Number of data points in the train set: 598, number of used features: 22
[LightGBM] [Info] Start trainin



[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000399 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3219
[LightGBM] [Info] Number of data points in the train set: 598, number of used features: 22
[LightGBM] [Info] Start training from score 33.605351
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000233 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3214
[LightGBM] [Info] Number of data points in the train set: 599, number of used features: 22
[LightGBM] [Info] Start training from score 35.113523
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000236 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3227
[LightGBM] [Info] Number of data points in the train set: 599, number of used features: 22
[LightGBM] [Info] Start trainin



[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000267 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3210
[LightGBM] [Info] Number of data points in the train set: 598, number of used features: 22
[LightGBM] [Info] Start training from score 33.170569




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000532 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3210
[LightGBM] [Info] Number of data points in the train set: 598, number of used features: 22
[LightGBM] [Info] Start training from score 34.541806
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000252 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3219
[LightGBM] [Info] Number of data points in the train set: 598, number of used features: 22
[LightGBM] [Info] Start training from score 33.605351
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000262 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3214
[LightGBM] [Info] Number of data points in the train set: 599, number of used features: 22
[LightGBM] [Info] Start trainin



[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000259 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3227
[LightGBM] [Info] Number of data points in the train set: 599, number of used features: 22
[LightGBM] [Info] Start training from score 35.217028
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000255 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3210
[LightGBM] [Info] Number of data points in the train set: 598, number of used features: 22
[LightGBM] [Info] Start training from score 33.170569




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000228 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3210
[LightGBM] [Info] Number of data points in the train set: 598, number of used features: 22
[LightGBM] [Info] Start training from score 34.541806
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000464 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3219
[LightGBM] [Info] Number of data points in the train set: 598, number of used features: 22
[LightGBM] [Info] Start training from score 33.605351
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000640 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3214
[LightGBM] [Info] Number of data points in the train set: 599, number of used features: 22
[LightGBM] [Info] Start trainin



[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000255 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3210
[LightGBM] [Info] Number of data points in the train set: 598, number of used features: 22
[LightGBM] [Info] Start training from score 34.541806
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000618 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3219
[LightGBM] [Info] Number of data points in the train set: 598, number of used features: 22
[LightGBM] [Info] Start training from score 33.605351
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000238 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3214
[LightGBM] [Info] Number of data points in the train set: 599, number of used features: 22
[LightGBM] [Info] Start trainin



[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000396 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3210
[LightGBM] [Info] Number of data points in the train set: 598, number of used features: 22
[LightGBM] [Info] Start training from score 33.170569
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000382 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3210
[LightGBM] [Info] Number of data points in the train set: 598, number of used features: 22
[LightGBM] [Info] Start training from score 34.541806




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000790 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3219
[LightGBM] [Info] Number of data points in the train set: 598, number of used features: 22
[LightGBM] [Info] Start training from score 33.605351




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000297 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3214
[LightGBM] [Info] Number of data points in the train set: 599, number of used features: 22
[LightGBM] [Info] Start training from score 35.113523




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000604 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3227
[LightGBM] [Info] Number of data points in the train set: 599, number of used features: 22
[LightGBM] [Info] Start training from score 35.217028
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000260 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3210
[LightGBM] [Info] Number of data points in the train set: 598, number of used features: 22
[LightGBM] [Info] Start training from score 33.170569
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000606 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3210
[LightGBM] [Info] Number of data points in the train set: 598, number of used features: 22
[LightGBM] [Info] Start trainin



[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000241 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3214
[LightGBM] [Info] Number of data points in the train set: 599, number of used features: 22
[LightGBM] [Info] Start training from score 35.113523




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000236 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3227
[LightGBM] [Info] Number of data points in the train set: 599, number of used features: 22
[LightGBM] [Info] Start training from score 35.217028
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000246 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3210
[LightGBM] [Info] Number of data points in the train set: 598, number of used features: 22
[LightGBM] [Info] Start training from score 33.170569
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000597 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3210
[LightGBM] [Info] Number of data points in the train set: 598, number of used features: 22
[LightGBM] [Info] Start trainin



[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000244 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3219
[LightGBM] [Info] Number of data points in the train set: 598, number of used features: 22
[LightGBM] [Info] Start training from score 33.605351
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000231 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3214
[LightGBM] [Info] Number of data points in the train set: 599, number of used features: 22
[LightGBM] [Info] Start training from score 35.113523




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002979 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3227
[LightGBM] [Info] Number of data points in the train set: 599, number of used features: 22
[LightGBM] [Info] Start training from score 35.217028




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000264 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3210
[LightGBM] [Info] Number of data points in the train set: 598, number of used features: 22
[LightGBM] [Info] Start training from score 33.170569
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000237 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3210
[LightGBM] [Info] Number of data points in the train set: 598, number of used features: 22
[LightGBM] [Info] Start training from score 34.541806
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000272 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3219
[LightGBM] [Info] Number of data points in the train set: 598, number of used features: 22
[LightGBM] [Info] Start trainin



[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000247 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3210
[LightGBM] [Info] Number of data points in the train set: 598, number of used features: 22
[LightGBM] [Info] Start training from score 33.170569




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000242 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3210
[LightGBM] [Info] Number of data points in the train set: 598, number of used features: 22
[LightGBM] [Info] Start training from score 34.541806
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000250 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3219
[LightGBM] [Info] Number of data points in the train set: 598, number of used features: 22
[LightGBM] [Info] Start training from score 33.605351
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000218 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3214
[LightGBM] [Info] Number of data points in the train set: 599, number of used features: 22
[LightGBM] [Info] Start trainin



[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000552 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3227
[LightGBM] [Info] Number of data points in the train set: 599, number of used features: 22
[LightGBM] [Info] Start training from score 35.217028
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000384 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3210
[LightGBM] [Info] Number of data points in the train set: 598, number of used features: 22
[LightGBM] [Info] Start training from score 33.170569




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000327 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3210
[LightGBM] [Info] Number of data points in the train set: 598, number of used features: 22
[LightGBM] [Info] Start training from score 34.541806




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000242 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3219
[LightGBM] [Info] Number of data points in the train set: 598, number of used features: 22
[LightGBM] [Info] Start training from score 33.605351
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000623 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3214
[LightGBM] [Info] Number of data points in the train set: 599, number of used features: 22
[LightGBM] [Info] Start training from score 35.113523




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000254 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3227
[LightGBM] [Info] Number of data points in the train set: 599, number of used features: 22
[LightGBM] [Info] Start training from score 35.217028




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000300 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3956
[LightGBM] [Info] Number of data points in the train set: 748, number of used features: 22
[LightGBM] [Info] Start training from score 34.330214




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000176 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1994
[LightGBM] [Info] Number of data points in the train set: 332, number of used features: 22
[LightGBM] [Info] Start training from score 7.846386
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000437 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2003
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training from score 7.357357
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000455 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2004
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training 



[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000396 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2003
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training from score 7.357357
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000415 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2004
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training from score 7.534535
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000335 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1997
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training 



[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000408 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1995
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training from score 8.012012
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000172 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1994
[LightGBM] [Info] Number of data points in the train set: 332, number of used features: 22
[LightGBM] [Info] Start training from score 7.846386
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000428 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2003
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training 



[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000276 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2004
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training from score 7.534535
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000431 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1997
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training from score 7.675676
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000167 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1995
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training 



[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.000203 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 1994
[LightGBM] [Info] Number of data points in the train set: 332, number of used features: 22
[LightGBM] [Info] Start training from score 7.846386
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000167 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2003
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training from score 7.357357
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000290 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2004
[LightGBM] [Info] Number of data points in the train set: 33



[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000168 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1997
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training from score 7.675676
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.001032 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1995
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training from score 8.012012




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000272 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1994
[LightGBM] [Info] Number of data points in the train set: 332, number of used features: 22
[LightGBM] [Info] Start training from score 7.846386
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000181 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2003
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training from score 7.357357
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000175 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2004
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training 



[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000178 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1995
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training from score 8.012012
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000161 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1994
[LightGBM] [Info] Number of data points in the train set: 332, number of used features: 22
[LightGBM] [Info] Start training from score 7.846386
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000425 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2003
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training 



[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000170 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1995
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training from score 8.012012
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000403 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1994
[LightGBM] [Info] Number of data points in the train set: 332, number of used features: 22
[LightGBM] [Info] Start training from score 7.846386




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000171 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2003
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training from score 7.357357
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000163 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2004
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training from score 7.534535
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000163 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1997
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training 



[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000269 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2003
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training from score 7.357357
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000422 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2004
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training from score 7.534535
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000389 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1997
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training 



[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000251 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1994
[LightGBM] [Info] Number of data points in the train set: 332, number of used features: 22
[LightGBM] [Info] Start training from score 7.846386




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000186 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2003
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training from score 7.357357
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000438 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2004
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training from score 7.534535
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000173 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1997
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training 



[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000202 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1995
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training from score 8.012012
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000305 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1994
[LightGBM] [Info] Number of data points in the train set: 332, number of used features: 22
[LightGBM] [Info] Start training from score 7.846386
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000170 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2003
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training 



[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000173 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1995
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training from score 8.012012
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000161 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1994
[LightGBM] [Info] Number of data points in the train set: 332, number of used features: 22
[LightGBM] [Info] Start training from score 7.846386




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.005460 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2003
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training from score 7.357357




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000586 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2004
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training from score 7.534535
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000221 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1997
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training from score 7.675676




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000256 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1995
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training from score 8.012012




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.007436 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1994
[LightGBM] [Info] Number of data points in the train set: 332, number of used features: 22
[LightGBM] [Info] Start training from score 7.846386
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000290 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2003
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training from score 7.357357
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000182 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2004
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training 



[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000423 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1995
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training from score 8.012012
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000419 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1994
[LightGBM] [Info] Number of data points in the train set: 332, number of used features: 22
[LightGBM] [Info] Start training from score 7.846386
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000169 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2003
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training 



[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000409 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1997
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training from score 7.675676




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000905 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1995
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training from score 8.012012
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000170 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1994
[LightGBM] [Info] Number of data points in the train set: 332, number of used features: 22
[LightGBM] [Info] Start training from score 7.846386
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000211 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2003
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training 



[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000182 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2004
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training from score 7.534535




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000271 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1997
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training from score 7.675676
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000420 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1995
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training from score 8.012012
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000437 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1994
[LightGBM] [Info] Number of data points in the train set: 332, number of used features: 22
[LightGBM] [Info] Start training 



[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000156 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1994
[LightGBM] [Info] Number of data points in the train set: 332, number of used features: 22
[LightGBM] [Info] Start training from score 7.846386
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000302 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2003
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training from score 7.357357
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002316 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2004
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training 



[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000816 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1997
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training from score 7.675676
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000232 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1995
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training from score 8.012012
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000181 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1994
[LightGBM] [Info] Number of data points in the train set: 332, number of used features: 22
[LightGBM] [Info] Start training 



[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000258 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2003
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training from score 7.357357
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000263 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2004
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training from score 7.534535




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000397 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1997
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training from score 7.675676




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000186 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1995
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training from score 8.012012
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000435 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1994
[LightGBM] [Info] Number of data points in the train set: 332, number of used features: 22
[LightGBM] [Info] Start training from score 7.846386
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000438 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2003
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training 



[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000269 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1995
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training from score 8.012012




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.013945 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1994
[LightGBM] [Info] Number of data points in the train set: 332, number of used features: 22
[LightGBM] [Info] Start training from score 7.846386
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000335 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2003
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training from score 7.357357
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000177 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2004
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training 



[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000263 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1997
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training from score 7.675676
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000236 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1995
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training from score 8.012012
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000172 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1994
[LightGBM] [Info] Number of data points in the train set: 332, number of used features: 22
[LightGBM] [Info] Start training 



[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000429 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1997
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training from score 7.675676
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000178 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1995
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training from score 8.012012
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000390 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1994
[LightGBM] [Info] Number of data points in the train set: 332, number of used features: 22
[LightGBM] [Info] Start training 



[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000410 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2003
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training from score 7.357357




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000297 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2004
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training from score 7.534535
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000277 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1997
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training from score 7.675676




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000181 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1995
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training from score 8.012012




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000314 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1994
[LightGBM] [Info] Number of data points in the train set: 332, number of used features: 22
[LightGBM] [Info] Start training from score 7.846386
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000190 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2003
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22




[LightGBM] [Info] Start training from score 7.357357
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000359 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2004
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training from score 7.534535




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000459 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1997
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training from score 7.675676




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000183 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1995
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training from score 8.012012
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.000352 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 1994
[LightGBM] [Info] Number of data points in the train set: 332, number of used features: 22
[LightGBM] [Info] Start training from score 7.846386




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000264 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2003
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training from score 7.357357
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000176 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2004
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training from score 7.534535
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000173 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1997
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training 



[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000322 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1994
[LightGBM] [Info] Number of data points in the train set: 332, number of used features: 22
[LightGBM] [Info] Start training from score 7.846386
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000430 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2003
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training from score 7.357357
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000185 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2004
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training 



[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.039180 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 1995
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training from score 8.012012
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000450 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1994
[LightGBM] [Info] Number of data points in the train set: 332, number of used features: 22
[LightGBM] [Info] Start training from score 7.846386
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000179 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2003
[LightGBM] [Info] Number of data points in the train set: 33



[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000324 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2004
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training from score 7.534535
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000231 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1997
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training from score 7.675676
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000452 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1995
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training 



[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.018156 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 1994
[LightGBM] [Info] Number of data points in the train set: 332, number of used features: 22
[LightGBM] [Info] Start training from score 7.846386




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000458 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2003
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training from score 7.357357
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000430 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2004
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training from score 7.534535
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000452 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1997
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training 



[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000162 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1994
[LightGBM] [Info] Number of data points in the train set: 332, number of used features: 22
[LightGBM] [Info] Start training from score 7.846386
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000268 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2003
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training from score 7.357357
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000251 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2004
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training 



[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000165 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1994
[LightGBM] [Info] Number of data points in the train set: 332, number of used features: 22
[LightGBM] [Info] Start training from score 7.846386
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000181 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2003
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training from score 7.357357




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000192 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2004
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training from score 7.534535
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000275 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1997
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training from score 7.675676
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000420 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1995
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training 



[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000459 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1994
[LightGBM] [Info] Number of data points in the train set: 332, number of used features: 22
[LightGBM] [Info] Start training from score 7.846386
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.010960 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2003
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training from score 7.357357




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000349 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2004
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training from score 7.534535




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000473 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1997
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training from score 7.675676
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000448 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1995
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training from score 8.012012




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000187 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1994
[LightGBM] [Info] Number of data points in the train set: 332, number of used features: 22
[LightGBM] [Info] Start training from score 7.846386




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000186 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2003
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training from score 7.357357
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000465 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2004
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training from score 7.534535
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000428 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1997
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training 



[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000183 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1994
[LightGBM] [Info] Number of data points in the train set: 332, number of used features: 22
[LightGBM] [Info] Start training from score 7.846386
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000281 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2003
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training from score 7.357357
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000191 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2004
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training 



[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000432 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1997
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training from score 7.675676
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000576 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1995
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training from score 8.012012




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000284 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1994
[LightGBM] [Info] Number of data points in the train set: 332, number of used features: 22
[LightGBM] [Info] Start training from score 7.846386
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000269 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2003
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training from score 7.357357




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000182 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2004
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training from score 7.534535
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.007722 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1997
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training from score 7.675676




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000362 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1995
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training from score 8.012012
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000572 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1994
[LightGBM] [Info] Number of data points in the train set: 332, number of used features: 22
[LightGBM] [Info] Start training from score 7.846386




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000189 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2003
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training from score 7.357357
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000324 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2004
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training from score 7.534535




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000186 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1997
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training from score 7.675676
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000455 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1995
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training from score 8.012012




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000178 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1994
[LightGBM] [Info] Number of data points in the train set: 332, number of used features: 22
[LightGBM] [Info] Start training from score 7.846386
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000423 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2003
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training from score 7.357357
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000443 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2004
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training 



[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000179 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1997
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training from score 7.675676




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000176 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1995
[LightGBM] [Info] Number of data points in the train set: 333, number of used features: 22
[LightGBM] [Info] Start training from score 8.012012




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000349 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2437
[LightGBM] [Info] Number of data points in the train set: 416, number of used features: 22
[LightGBM] [Info] Start training from score 7.685096




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000347 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3839
[LightGBM] [Info] Number of data points in the train set: 748, number of used features: 22
[LightGBM] [Info] Start training from score 34.330214
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000300 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2420
[LightGBM] [Info] Number of data points in the train set: 416, number of used features: 22
[LightGBM] [Info] Start training from score 7.685096
Resultados optimizados para San Juan: {'XGBoost': 12.136500358581543, 'LightGBM': 16.72420415587116}
Resultados optimizados para Iquitos: {'XGBoost': 5.510868549346924, 'LightGBM': 5.644913590452571}




Optimizar LightGBM

In [29]:
import pandas as pd
import lightgbm as lgb
import os
from sklearn.impute import SimpleImputer
from sklearn.preprocessing import StandardScaler

# Crear carpeta para resultados
os.makedirs("resultado", exist_ok=True)

# Cargar datos preprocesados
train_sj = pd.read_csv("analisis/train_sj_clean.csv")
train_iq = pd.read_csv("analisis/train_iq_clean.csv")
test_features = pd.read_csv("dengue_features_test.csv")
submission_format = pd.read_csv("submission_format.csv")

# Definir características
features = [col for col in train_sj.columns if col not in ["total_cases", "week_start_date"]]

# Preparar conjuntos de entrenamiento
X_sj, y_sj = train_sj[features], train_sj["total_cases"]
X_iq, y_iq = train_iq[features], train_iq["total_cases"]

# Imputadores y escalador
imputer_sj = SimpleImputer(strategy="most_frequent")
imputer_iq = SimpleImputer(strategy="median")
scaler = StandardScaler()

# Aplicar preprocesamiento
X_sj = scaler.fit_transform(imputer_sj.fit_transform(X_sj))
X_iq = scaler.fit_transform(imputer_iq.fit_transform(X_iq))

# Separar test por ciudad
test_sj = test_features[test_features["city"] == "sj"][features]
test_iq = test_features[test_features["city"] == "iq"][features]

# Aplicar preprocesamiento a test
test_sj = scaler.transform(imputer_sj.transform(test_sj))
test_iq = scaler.transform(imputer_iq.transform(test_iq))

# Parámetros optimizados para LightGBM
params_sj = {
    "feature_fraction": 1.0, "lambda_l1": 0.0, "lambda_l2": 0.0, "learning_rate": 0.05,
    "max_depth": 7, "min_data_in_leaf": 20, "min_split_gain": 0.0,
    "n_estimators": 100, "num_leaves": 31
}
params_iq = {
    "feature_fraction": 1.0, "lambda_l1": 0.0, "lambda_l2": 0.2, "learning_rate": 0.05,
    "max_depth": 5, "min_data_in_leaf": 20, "min_split_gain": 0.2,
    "n_estimators": 100, "num_leaves": 31
}

# Entrenar modelos LightGBM
model_sj = lgb.LGBMRegressor(**params_sj)
model_sj.fit(X_sj, y_sj)

model_iq = lgb.LGBMRegressor(**params_iq)
model_iq.fit(X_iq, y_iq)

# Hacer predicciones
pred_sj = model_sj.predict(test_sj).round().astype(int)
pred_iq = model_iq.predict(test_iq).round().astype(int)

# Evitar valores negativos
pred_sj = pred_sj.clip(min=0)
pred_iq = pred_iq.clip(min=0)

# Crear archivo de submission
submission = submission_format.copy()
submission.loc[submission["city"] == "sj", "total_cases"] = pred_sj
submission.loc[submission["city"] == "iq", "total_cases"] = pred_iq

# Guardar submission en la carpeta "resultado"
submission_path = "resultado/submission_lightgbm.csv"
submission.to_csv(submission_path, index=False)

print(f"Archivo guardado en: {submission_path}")

[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000176 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 4087
[LightGBM] [Info] Number of data points in the train set: 936, number of used features: 22
[LightGBM] [Info] Start training from score 34.180556
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000287 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3002
[LightGBM] [Info] Number of data points in the train set: 520, number of used features: 22
[LightGBM] [Info] Start training from score 7.565385
Archivo guardado en: resultado/submission_lightgbm.csv




Optimizar XGBoost

In [30]:
import pandas as pd
import xgboost as xgb
import os
from sklearn.impute import SimpleImputer
from sklearn.preprocessing import StandardScaler

# Crear carpeta para resultados
os.makedirs("resultado", exist_ok=True)

# Cargar datos preprocesados
train_sj = pd.read_csv("analisis/train_sj_clean.csv")
train_iq = pd.read_csv("analisis/train_iq_clean.csv")
test_features = pd.read_csv("dengue_features_test.csv")
submission_format = pd.read_csv("submission_format.csv")

# Definir características
features = [col for col in train_sj.columns if col not in ["total_cases", "week_start_date"]]

# Preparar conjuntos de entrenamiento
X_sj, y_sj = train_sj[features], train_sj["total_cases"]
X_iq, y_iq = train_iq[features], train_iq["total_cases"]

# Imputadores y escalador
imputer_sj = SimpleImputer(strategy="most_frequent")
imputer_iq = SimpleImputer(strategy="median")
scaler = StandardScaler()

# Aplicar preprocesamiento
X_sj = scaler.fit_transform(imputer_sj.fit_transform(X_sj))
X_iq = scaler.fit_transform(imputer_iq.fit_transform(X_iq))

# Separar test por ciudad
test_sj = test_features[test_features["city"] == "sj"][features]
test_iq = test_features[test_features["city"] == "iq"][features]

# Aplicar preprocesamiento a test
test_sj = scaler.transform(imputer_sj.transform(test_sj))
test_iq = scaler.transform(imputer_iq.transform(test_iq))

# Parámetros óptimos para XGBoost
params_sj = {
    "objective": "reg:squarederror",
    "learning_rate": 0.05,
    "max_depth": 7,
    "n_estimators": 200,
    "subsample": 0.8,
    "colsample_bytree": 0.8
}
params_iq = {
    "objective": "reg:squarederror",
    "learning_rate": 0.05,
    "max_depth": 5,
    "n_estimators": 200,
    "subsample": 0.8,
    "colsample_bytree": 0.8
}

# Entrenar modelos XGBoost
model_sj = xgb.XGBRegressor(**params_sj)
model_sj.fit(X_sj, y_sj)

model_iq = xgb.XGBRegressor(**params_iq)
model_iq.fit(X_iq, y_iq)

# Hacer predicciones
pred_sj = model_sj.predict(test_sj).round().astype(int)
pred_iq = model_iq.predict(test_iq).round().astype(int)

# Evitar valores negativos
pred_sj = pred_sj.clip(min=0)
pred_iq = pred_iq.clip(min=0)

# Crear archivo de submission
submission = submission_format.copy()
submission.loc[submission["city"] == "sj", "total_cases"] = pred_sj
submission.loc[submission["city"] == "iq", "total_cases"] = pred_iq

# Guardar submission en la carpeta "resultado"
submission_path = "resultado/submission_xgboost.csv"
submission.to_csv(submission_path, index=False)

print(f"Archivo guardado en: {submission_path}")

Archivo guardado en: resultado/submission_xgboost.csv


Mejorar MAE XGBoost 1

In [31]:
import pandas as pd
import xgboost as xgb
from sklearn.impute import SimpleImputer
from sklearn.preprocessing import StandardScaler
from sklearn.model_selection import train_test_split
from sklearn.metrics import mean_absolute_error

# Cargar datos preprocesados
train_sj = pd.read_csv("analisis/train_sj_clean.csv")
train_iq = pd.read_csv("analisis/train_iq_clean.csv")

# Definir características
features = [col for col in train_sj.columns if col not in ["total_cases", "week_start_date"]]

# Preparar conjuntos de entrenamiento
X_sj, y_sj = train_sj[features], train_sj["total_cases"]
X_iq, y_iq = train_iq[features], train_iq["total_cases"]

# Imputadores y escalador
imputer_sj = SimpleImputer(strategy="most_frequent")
imputer_iq = SimpleImputer(strategy="median")
scaler = StandardScaler()

# Aplicar preprocesamiento
X_sj = scaler.fit_transform(imputer_sj.fit_transform(X_sj))
X_iq = scaler.fit_transform(imputer_iq.fit_transform(X_iq))

# Dividir en entrenamiento (80%) y validación (20%)
X_train_sj, X_val_sj, y_train_sj, y_val_sj = train_test_split(X_sj, y_sj, test_size=0.2, random_state=42)
X_train_iq, X_val_iq, y_train_iq, y_val_iq = train_test_split(X_iq, y_iq, test_size=0.2, random_state=42)

# 🚀 **Nuevos hiperparámetros ajustados para XGBoost**
params_sj = {
    "objective": "reg:squarederror",
    "learning_rate": 0.03,  
    "max_depth": 6,  
    "n_estimators": 300,  
    "subsample": 0.8,
    "colsample_bytree": 0.8
}
params_iq = {
    "objective": "reg:squarederror",
    "learning_rate": 0.03,
    "max_depth": 5,  
    "n_estimators": 300,
    "subsample": 0.8,
    "colsample_bytree": 0.8
}

# Entrenar modelos XGBoost con los nuevos hiperparámetros
model_sj = xgb.XGBRegressor(**params_sj)
model_sj.fit(X_train_sj, y_train_sj)

model_iq = xgb.XGBRegressor(**params_iq)
model_iq.fit(X_train_iq, y_train_iq)

# Hacer predicciones en validación
pred_val_sj = model_sj.predict(X_val_sj).round().astype(int)
pred_val_iq = model_iq.predict(X_val_iq).round().astype(int)

# Evitar valores negativos
pred_val_sj = pred_val_sj.clip(min=0)
pred_val_iq = pred_val_iq.clip(min=0)

# Calcular MAE en validación
mae_sj = mean_absolute_error(y_val_sj, pred_val_sj)
mae_iq = mean_absolute_error(y_val_iq, pred_val_iq)

# MAE total promedio
mae_total = (mae_sj + mae_iq) / 2

print(f"MAE en validación para San Juan: {mae_sj}")
print(f"MAE en validación para Iquitos: {mae_iq}")
print(f"MAE total promedio: {mae_total}")

MAE en validación para San Juan: 13.148936170212766
MAE en validación para Iquitos: 5.076923076923077
MAE total promedio: 9.112929623567922
