In [None]:
! pip install mlflow awscli boto3 optuna imbalanced-learn lightgbm

In [None]:
! aws configure

In [3]:
import mlflow
mlflow.set_tracking_uri('http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/')

In [4]:
mlflow.set_experiment('E LightGBM HP Tuning')

<Experiment: artifact_location='s3://om-mlflow-bucket/621100004064027216', creation_time=1741370223256, experiment_id='621100004064027216', last_update_time=1741370223256, lifecycle_stage='active', name='E LightGBM HP Tuning', tags={}>

In [5]:
import pandas as pd
df=pd.read_csv('/content/reddit_processed.csv').dropna()

In [6]:
import pandas as pd
import mlflow
import mlflow.sklearn
import optuna
from sklearn.feature_extraction.text import TfidfVectorizer
from sklearn.model_selection import train_test_split
from sklearn.metrics import accuracy_score,classification_report
from imblearn.over_sampling import SMOTE
from lightgbm import LGBMClassifier
import matplotlib.pyplot as plt



In [7]:
# Remap the Class Labels
df['category']=df['category'].map({-1:2,0:0,1:1})

df=df.dropna(subset=['category'])

In [8]:
# Train Test Split
X=df['clean_comment']
y=df['category']
X_train,X_test,y_train,y_test=train_test_split(X ,y,test_size=0.2,random_state=42,stratify=y)

In [9]:
# TfidfVectorizer Setup
ngram_range=(1,3)
max_features=10000

vectorizer=TfidfVectorizer(ngram_range=ngram_range,max_features=max_features)
X_train=vectorizer.fit_transform(X_train)
X_test=vectorizer.transform(X_test)


In [10]:
# Apply SMOTE to handle inbalanced data
smote=SMOTE(random_state=42)
X_train,y_train=smote.fit_resample(X_train,y_train)



In [11]:
# Function to log results in MLflow
def log_mlflow(model_name, model, X_train, X_test, y_train, y_test, params, trial_number):
    with mlflow.start_run():
        # Log model type and trial number
        mlflow.set_tag("mlflow.runName", f"Trial_{trial_number}_{model_name}_SMOTE_TFIDF_Trigrams")
        mlflow.set_tag("experiment_type", "algorithm_comparison")

        # Log algorithm name as a parameter
        mlflow.log_param("algo_name", model_name)

        # Log hyperparameters
        for key, value in params.items():
            mlflow.log_param(key, value)

        # Train model
        model.fit(X_train, y_train)
        y_pred = model.predict(X_test)

        # Log accuracy
        accuracy = accuracy_score(y_test, y_pred)
        mlflow.log_metric("accuracy", accuracy)

        # Log classification report
        classification_rep = classification_report(y_test, y_pred, output_dict=True)
        for label, metrics in classification_rep.items():
            if isinstance(metrics, dict):
                for metric, value in metrics.items():
                    mlflow.log_metric(f"{label}_{metric}", value)

        # Log the model
        mlflow.sklearn.log_model(model, f"{model_name}_model")

        return accuracy




In [12]:
# Step 6: Optuna objective function for LightGBM
def objective_lightgbm(trial):
    # Hyperparameter space to explore
    n_estimators = trial.suggest_int('n_estimators', 100, 1000)
    learning_rate = trial.suggest_float('learning_rate', 1e-4, 1e-1, log=True)
    max_depth = trial.suggest_int('max_depth', 3, 15)
    num_leaves = trial.suggest_int('num_leaves', 20, 150)
    min_child_samples = trial.suggest_int('min_child_samples', 10, 100)
    colsample_bytree = trial.suggest_float('colsample_bytree', 0.5, 1.0)
    subsample = trial.suggest_float('subsample', 0.5, 1.0)
    reg_alpha = trial.suggest_float('reg_alpha', 1e-4, 10.0, log=True)  # L1 regularization
    reg_lambda = trial.suggest_float('reg_lambda', 1e-4, 10.0, log=True)  # L2 regularization

    # Log trial parameters
    params = {
        'n_estimators': n_estimators,
        'learning_rate': learning_rate,
        'max_depth': max_depth,
        'num_leaves': num_leaves,
        'min_child_samples': min_child_samples,
        'colsample_bytree': colsample_bytree,
        'subsample': subsample,
        'reg_alpha': reg_alpha,
        'reg_lambda': reg_lambda
    }

    # Create LightGBM model
    model = LGBMClassifier(n_estimators=n_estimators,
                           learning_rate=learning_rate,
                           max_depth=max_depth,
                           num_leaves=num_leaves,
                           min_child_samples=min_child_samples,
                           colsample_bytree=colsample_bytree,
                           subsample=subsample,
                           reg_alpha=reg_alpha,
                           reg_lambda=reg_lambda,
                           random_state=42)

    # Log each trial as a separate run in MLflow
    accuracy = log_mlflow("LightGBM", model, X_train, X_test, y_train, y_test, params, trial.number)

    return accuracy




In [13]:
# Step 7: Run Optuna for LightGBM, log the best model, and plot the importance of each parameter
def run_optuna_experiment():
    study = optuna.create_study(direction="maximize")
    study.optimize(objective_lightgbm, n_trials=100)  # Increased to 100 trials

    # Get the best parameters
    best_params = study.best_params
    best_model = LGBMClassifier(n_estimators=best_params['n_estimators'],
                                learning_rate=best_params['learning_rate'],
                                max_depth=best_params['max_depth'],
                                num_leaves=best_params['num_leaves'],
                                min_child_samples=best_params['min_child_samples'],
                                colsample_bytree=best_params['colsample_bytree'],
                                subsample=best_params['subsample'],
                                reg_alpha=best_params['reg_alpha'],
                                reg_lambda=best_params['reg_lambda'],
                                random_state=42)

    # Log the best model with MLflow and print the classification report
    log_mlflow("LightGBM", best_model, X_train, X_test, y_train, y_test, best_params, "Best")

    # Plot parameter importance
    optuna.visualization.plot_param_importances(study).show()

    # Plot optimization history
    optuna.visualization.plot_optimization_history(study).show()

In [14]:
# Run the experiment for LightGBM
run_optuna_experiment()

[I 2025-03-08 03:03:03,996] A new study created in memory with name: no-name-8546ca5c-9ad8-4c4a-9e53-2ae94547065b


[LightGBM] [Info] Number of positive: 12616, number of negative: 12616
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.120613 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 57101
[LightGBM] [Info] Number of data points in the train set: 25232, number of used features: 693
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.500000 -> initscore=0.000000


[I 2025-03-08 03:03:28,707] Trial 0 finished with value: 0.8265000879816998 and parameters: {'n_estimators': 407, 'learning_rate': 0.006637439113100485, 'max_depth': 14, 'num_leaves': 23, 'min_child_samples': 98, 'colsample_bytree': 0.8616128055513101, 'subsample': 0.6435849625319907, 'reg_alpha': 0.2214017224090471, 'reg_lambda': 0.41216201180141243}. Best is trial 0 with value: 0.8265000879816998.


🏃 View run Trial_0_LightGBM_SMOTE_TFIDF_Trigrams at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216/runs/1616e6b222284ea7b5648c28a8ffec0a
🧪 View experiment at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216




[LightGBM] [Info] Number of positive: 12616, number of negative: 12616
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.666916 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 92752
[LightGBM] [Info] Number of data points in the train set: 25232, number of used features: 2939
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.500000 -> initscore=0.000000


[I 2025-03-08 03:03:59,789] Trial 1 finished with value: 0.7232095724089389 and parameters: {'n_estimators': 427, 'learning_rate': 0.00030737890282591827, 'max_depth': 9, 'num_leaves': 33, 'min_child_samples': 23, 'colsample_bytree': 0.8432086073316514, 'subsample': 0.5749082223136656, 'reg_alpha': 0.013274329277211831, 'reg_lambda': 0.14558172886634305}. Best is trial 0 with value: 0.8265000879816998.


🏃 View run Trial_1_LightGBM_SMOTE_TFIDF_Trigrams at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216/runs/0d999d46105542298916cfeab06063de
🧪 View experiment at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216




[LightGBM] [Info] Number of positive: 12616, number of negative: 12616
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 1.270776 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 98233
[LightGBM] [Info] Number of data points in the train set: 25232, number of used features: 3607
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.500000 -> initscore=0.000000


[I 2025-03-08 03:04:48,334] Trial 2 finished with value: 0.8265000879816998 and parameters: {'n_estimators': 709, 'learning_rate': 0.008401519849374246, 'max_depth': 6, 'num_leaves': 75, 'min_child_samples': 19, 'colsample_bytree': 0.558248703164719, 'subsample': 0.9255680211734657, 'reg_alpha': 0.0010778858472904056, 'reg_lambda': 0.38415915908964376}. Best is trial 0 with value: 0.8265000879816998.


🏃 View run Trial_2_LightGBM_SMOTE_TFIDF_Trigrams at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216/runs/2f27db0673154a4c916daf55fc1cafd1
🧪 View experiment at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216




[LightGBM] [Info] Number of positive: 12616, number of negative: 12616
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.115625 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 57101
[LightGBM] [Info] Number of data points in the train set: 25232, number of used features: 693
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.500000 -> initscore=0.000000


[I 2025-03-08 03:05:12,435] Trial 3 finished with value: 0.8356501847615696 and parameters: {'n_estimators': 475, 'learning_rate': 0.007008795935965904, 'max_depth': 15, 'num_leaves': 111, 'min_child_samples': 98, 'colsample_bytree': 0.974323397184466, 'subsample': 0.8441046271457853, 'reg_alpha': 0.04381667699683568, 'reg_lambda': 4.077643527922316}. Best is trial 3 with value: 0.8356501847615696.


🏃 View run Trial_3_LightGBM_SMOTE_TFIDF_Trigrams at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216/runs/dd112cf65f1146ca92a320d3c2abfdc1
🧪 View experiment at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216




[LightGBM] [Info] Number of positive: 12616, number of negative: 12616
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.141725 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 62345
[LightGBM] [Info] Number of data points in the train set: 25232, number of used features: 866
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.500000 -> initscore=0.000000


[I 2025-03-08 03:05:28,616] Trial 4 finished with value: 0.7696639099067394 and parameters: {'n_estimators': 114, 'learning_rate': 0.0025046522302895153, 'max_depth': 9, 'num_leaves': 115, 'min_child_samples': 79, 'colsample_bytree': 0.6440787456690594, 'subsample': 0.5566852890851488, 'reg_alpha': 0.0005047262281184057, 'reg_lambda': 0.0007518223323492491}. Best is trial 3 with value: 0.8356501847615696.


🏃 View run Trial_4_LightGBM_SMOTE_TFIDF_Trigrams at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216/runs/b3bc9f67fd614540bb7ab51ee1bfa64f
🧪 View experiment at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216




[LightGBM] [Info] Number of positive: 12616, number of negative: 12616
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 1.691612 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 113733
[LightGBM] [Info] Number of data points in the train set: 25232, number of used features: 6244
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.500000 -> initscore=0.000000


[I 2025-03-08 03:05:53,175] Trial 5 finished with value: 0.8294914657751188 and parameters: {'n_estimators': 366, 'learning_rate': 0.018906570646988637, 'max_depth': 6, 'num_leaves': 59, 'min_child_samples': 11, 'colsample_bytree': 0.6333373267331621, 'subsample': 0.7994950873469439, 'reg_alpha': 4.206150250632513, 'reg_lambda': 0.044073448387256305}. Best is trial 3 with value: 0.8356501847615696.


🏃 View run Trial_5_LightGBM_SMOTE_TFIDF_Trigrams at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216/runs/96e47e183a84483a8c917f7be2b4a9e4
🧪 View experiment at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216




[LightGBM] [Info] Number of positive: 12616, number of negative: 12616
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.138241 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 59095
[LightGBM] [Info] Number of data points in the train set: 25232, number of used features: 755
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.500000 -> initscore=0.000000


[I 2025-03-08 03:06:12,429] Trial 6 finished with value: 0.7920112616575752 and parameters: {'n_estimators': 234, 'learning_rate': 0.005462706503944479, 'max_depth': 11, 'num_leaves': 146, 'min_child_samples': 90, 'colsample_bytree': 0.7575061047092468, 'subsample': 0.6691688247529343, 'reg_alpha': 0.00801959958788121, 'reg_lambda': 0.000364988369576835}. Best is trial 3 with value: 0.8356501847615696.


🏃 View run Trial_6_LightGBM_SMOTE_TFIDF_Trigrams at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216/runs/327caf125a0a475785808bd0cdcf611e
🧪 View experiment at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216




[LightGBM] [Info] Number of positive: 12616, number of negative: 12616
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.294162 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 77457
[LightGBM] [Info] Number of data points in the train set: 25232, number of used features: 1607
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.500000 -> initscore=0.000000


[I 2025-03-08 03:06:33,844] Trial 7 finished with value: 0.6616223825444307 and parameters: {'n_estimators': 529, 'learning_rate': 0.00014952361954017726, 'max_depth': 5, 'num_leaves': 39, 'min_child_samples': 43, 'colsample_bytree': 0.8570085966772144, 'subsample': 0.8893444625051268, 'reg_alpha': 7.616135794258522, 'reg_lambda': 1.2576816003555031}. Best is trial 3 with value: 0.8356501847615696.


🏃 View run Trial_7_LightGBM_SMOTE_TFIDF_Trigrams at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216/runs/47aef558063f418994e023c82e96b5d1
🧪 View experiment at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216




[LightGBM] [Info] Number of positive: 12616, number of negative: 12616
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.184055 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 68219
[LightGBM] [Info] Number of data points in the train set: 25232, number of used features: 1106
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.500000 -> initscore=0.000000


[I 2025-03-08 03:07:00,249] Trial 8 finished with value: 0.7999296146401549 and parameters: {'n_estimators': 321, 'learning_rate': 0.00103454503026399, 'max_depth': 14, 'num_leaves': 130, 'min_child_samples': 62, 'colsample_bytree': 0.5838904802046809, 'subsample': 0.9113565223231062, 'reg_alpha': 0.003331326107288894, 'reg_lambda': 0.0024134325447191544}. Best is trial 3 with value: 0.8356501847615696.


🏃 View run Trial_8_LightGBM_SMOTE_TFIDF_Trigrams at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216/runs/a765d751568a4e80806345d762de6723
🧪 View experiment at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216




[LightGBM] [Info] Number of positive: 12616, number of negative: 12616
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.291178 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 76053
[LightGBM] [Info] Number of data points in the train set: 25232, number of used features: 1519
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.500000 -> initscore=0.000000


[I 2025-03-08 03:07:21,867] Trial 9 finished with value: 0.8238606369875066 and parameters: {'n_estimators': 264, 'learning_rate': 0.009135777239847688, 'max_depth': 15, 'num_leaves': 53, 'min_child_samples': 46, 'colsample_bytree': 0.7813725730133199, 'subsample': 0.9046366783943558, 'reg_alpha': 2.2470583994822735, 'reg_lambda': 0.9898946126166325}. Best is trial 3 with value: 0.8356501847615696.


🏃 View run Trial_9_LightGBM_SMOTE_TFIDF_Trigrams at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216/runs/d2d090545d37448390ae781052e6d2f5
🧪 View experiment at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216




[LightGBM] [Info] Number of positive: 12616, number of negative: 12616
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.169569 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 65224
[LightGBM] [Info] Number of data points in the train set: 25232, number of used features: 977
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.500000 -> initscore=0.000000


[I 2025-03-08 03:07:52,093] Trial 10 finished with value: 0.8701390110856941 and parameters: {'n_estimators': 928, 'learning_rate': 0.09273190265183116, 'max_depth': 12, 'num_leaves': 99, 'min_child_samples': 71, 'colsample_bytree': 0.9970383379290503, 'subsample': 0.7893839998331489, 'reg_alpha': 0.1074513350777466, 'reg_lambda': 8.134155627587496}. Best is trial 10 with value: 0.8701390110856941.


🏃 View run Trial_10_LightGBM_SMOTE_TFIDF_Trigrams at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216/runs/083769f918be49d4be966978620403a2
🧪 View experiment at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216




[LightGBM] [Info] Number of positive: 12616, number of negative: 12616
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.166552 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 64826
[LightGBM] [Info] Number of data points in the train set: 25232, number of used features: 961
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.500000 -> initscore=0.000000


[I 2025-03-08 03:08:23,599] Trial 11 finished with value: 0.8701390110856941 and parameters: {'n_estimators': 986, 'learning_rate': 0.062243359505200796, 'max_depth': 12, 'num_leaves': 101, 'min_child_samples': 72, 'colsample_bytree': 0.9896139325560394, 'subsample': 0.7800534400676912, 'reg_alpha': 0.1347623202635132, 'reg_lambda': 8.599305069197078}. Best is trial 10 with value: 0.8701390110856941.


🏃 View run Trial_11_LightGBM_SMOTE_TFIDF_Trigrams at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216/runs/c78c675be7e94601a490341b56e2c2fb
🧪 View experiment at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216




[LightGBM] [Info] Number of positive: 12616, number of negative: 12616
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.164819 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 65763
[LightGBM] [Info] Number of data points in the train set: 25232, number of used features: 999
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.500000 -> initscore=0.000000


[I 2025-03-08 03:08:54,604] Trial 12 finished with value: 0.8741861692767904 and parameters: {'n_estimators': 919, 'learning_rate': 0.09106103903344485, 'max_depth': 12, 'num_leaves': 91, 'min_child_samples': 69, 'colsample_bytree': 0.9974844908947171, 'subsample': 0.7344432610373809, 'reg_alpha': 0.20898938790496296, 'reg_lambda': 9.336749618859171}. Best is trial 12 with value: 0.8741861692767904.


🏃 View run Trial_12_LightGBM_SMOTE_TFIDF_Trigrams at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216/runs/ab860f0f202d4e1ea4897b2ffc78e6f5
🧪 View experiment at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216




[LightGBM] [Info] Number of positive: 12616, number of negative: 12616
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.187251 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 68635
[LightGBM] [Info] Number of data points in the train set: 25232, number of used features: 1125
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.500000 -> initscore=0.000000


[I 2025-03-08 03:09:25,097] Trial 13 finished with value: 0.885095900052789 and parameters: {'n_estimators': 945, 'learning_rate': 0.07350952471078762, 'max_depth': 11, 'num_leaves': 87, 'min_child_samples': 61, 'colsample_bytree': 0.9297941825901642, 'subsample': 0.7036073603239092, 'reg_alpha': 0.6771010116432744, 'reg_lambda': 9.980180464298344}. Best is trial 13 with value: 0.885095900052789.


🏃 View run Trial_13_LightGBM_SMOTE_TFIDF_Trigrams at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216/runs/b175c71ec9724a0fa1d6d58898c0c100
🧪 View experiment at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216




[LightGBM] [Info] Number of positive: 12616, number of negative: 12616
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.222347 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 72968
[LightGBM] [Info] Number of data points in the train set: 25232, number of used features: 1342
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.500000 -> initscore=0.000000


[I 2025-03-08 03:09:54,591] Trial 14 finished with value: 0.8960056308287876 and parameters: {'n_estimators': 801, 'learning_rate': 0.029860105616152183, 'max_depth': 10, 'num_leaves': 80, 'min_child_samples': 52, 'colsample_bytree': 0.9168236662468515, 'subsample': 0.6987267814844231, 'reg_alpha': 0.6640980064788415, 'reg_lambda': 0.004310616664149432}. Best is trial 14 with value: 0.8960056308287876.


🏃 View run Trial_14_LightGBM_SMOTE_TFIDF_Trigrams at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216/runs/1a86fa9f36244201bc7cfc641d33d384
🧪 View experiment at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216




[LightGBM] [Info] Number of positive: 12616, number of negative: 12616
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.250401 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 73886
[LightGBM] [Info] Number of data points in the train set: 25232, number of used features: 1393
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.500000 -> initscore=0.000000


[I 2025-03-08 03:10:24,663] Trial 15 finished with value: 0.8930142530353686 and parameters: {'n_estimators': 725, 'learning_rate': 0.028553978603791653, 'max_depth': 8, 'num_leaves': 75, 'min_child_samples': 50, 'colsample_bytree': 0.9247026902540143, 'subsample': 0.997608931170739, 'reg_alpha': 1.0892012904121955, 'reg_lambda': 0.006005309074637286}. Best is trial 14 with value: 0.8960056308287876.


🏃 View run Trial_15_LightGBM_SMOTE_TFIDF_Trigrams at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216/runs/339ecc8bfd724ec98bbedd03a3dff890
🧪 View experiment at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216




[LightGBM] [Info] Number of positive: 12616, number of negative: 12616
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.344481 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 79942
[LightGBM] [Info] Number of data points in the train set: 25232, number of used features: 1776
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.500000 -> initscore=0.000000


[I 2025-03-08 03:10:52,765] Trial 16 finished with value: 0.8937181066338201 and parameters: {'n_estimators': 688, 'learning_rate': 0.025505452904720123, 'max_depth': 8, 'num_leaves': 70, 'min_child_samples': 39, 'colsample_bytree': 0.9077231408008698, 'subsample': 0.9713704700322661, 'reg_alpha': 1.1304774163727567, 'reg_lambda': 0.004803266736754811}. Best is trial 14 with value: 0.8960056308287876.


🏃 View run Trial_16_LightGBM_SMOTE_TFIDF_Trigrams at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216/runs/5d9bc02cbfe844428d0428d118cc1bb9
🧪 View experiment at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216




[LightGBM] [Info] Number of positive: 12616, number of negative: 12616
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.402783 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 84056
[LightGBM] [Info] Number of data points in the train set: 25232, number of used features: 2090
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.500000 -> initscore=0.000000


[I 2025-03-08 03:11:20,734] Trial 17 finished with value: 0.89248636283653 and parameters: {'n_estimators': 700, 'learning_rate': 0.024826291920570287, 'max_depth': 7, 'num_leaves': 64, 'min_child_samples': 33, 'colsample_bytree': 0.806018392567775, 'subsample': 0.6223780434251408, 'reg_alpha': 0.00013387346198035944, 'reg_lambda': 0.009256000159420076}. Best is trial 14 with value: 0.8960056308287876.


🏃 View run Trial_17_LightGBM_SMOTE_TFIDF_Trigrams at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216/runs/3eee2508adbc4d1683af8f857078c692
🧪 View experiment at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216




[LightGBM] [Info] Number of positive: 12616, number of negative: 12616
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.337413 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 80541
[LightGBM] [Info] Number of data points in the train set: 25232, number of used features: 1819
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.500000 -> initscore=0.000000


[I 2025-03-08 03:11:41,919] Trial 18 finished with value: 0.7184585606193912 and parameters: {'n_estimators': 809, 'learning_rate': 0.0017721098605243076, 'max_depth': 3, 'num_leaves': 46, 'min_child_samples': 38, 'colsample_bytree': 0.7015696606611275, 'subsample': 0.5144526428998482, 'reg_alpha': 0.835527179541313, 'reg_lambda': 0.0259254198307199}. Best is trial 14 with value: 0.8960056308287876.


🏃 View run Trial_18_LightGBM_SMOTE_TFIDF_Trigrams at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216/runs/26f960cb7f9b4e9ea2b6443a1101cb57
🧪 View experiment at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216




[LightGBM] [Info] Number of positive: 12616, number of negative: 12616
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.710908 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 84786
[LightGBM] [Info] Number of data points in the train set: 25232, number of used features: 2151
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.500000 -> initscore=0.000000


[I 2025-03-08 03:12:12,513] Trial 19 finished with value: 0.9121942635931726 and parameters: {'n_estimators': 632, 'learning_rate': 0.03610350002793875, 'max_depth': 10, 'num_leaves': 72, 'min_child_samples': 32, 'colsample_bytree': 0.9118646418445241, 'subsample': 0.9895369419275302, 'reg_alpha': 0.5295243996036899, 'reg_lambda': 0.00011784316424629491}. Best is trial 19 with value: 0.9121942635931726.


🏃 View run Trial_19_LightGBM_SMOTE_TFIDF_Trigrams at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216/runs/d0be33d89cfa4957903b76b3b456c68e
🧪 View experiment at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216




[LightGBM] [Info] Number of positive: 12616, number of negative: 12616
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.230398 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 71583
[LightGBM] [Info] Number of data points in the train set: 25232, number of used features: 1269
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.500000 -> initscore=0.000000


[I 2025-03-08 03:12:38,586] Trial 20 finished with value: 0.8960056308287876 and parameters: {'n_estimators': 595, 'learning_rate': 0.04273927474276078, 'max_depth': 10, 'num_leaves': 81, 'min_child_samples': 55, 'colsample_bytree': 0.6961549978122414, 'subsample': 0.8352526465227146, 'reg_alpha': 0.05484372751615602, 'reg_lambda': 0.00011177331315867891}. Best is trial 19 with value: 0.9121942635931726.


🏃 View run Trial_20_LightGBM_SMOTE_TFIDF_Trigrams at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216/runs/3e76357accb74cb28c998dcd62b9e57b
🧪 View experiment at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216




[LightGBM] [Info] Number of positive: 12616, number of negative: 12616
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.246834 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 72514
[LightGBM] [Info] Number of data points in the train set: 25232, number of used features: 1318
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.500000 -> initscore=0.000000


[I 2025-03-08 03:13:04,196] Trial 21 finished with value: 0.8979412282245293 and parameters: {'n_estimators': 594, 'learning_rate': 0.04148649270169539, 'max_depth': 10, 'num_leaves': 82, 'min_child_samples': 53, 'colsample_bytree': 0.6943818405756852, 'subsample': 0.8498157430398939, 'reg_alpha': 0.027363949146849392, 'reg_lambda': 0.00014542666999071592}. Best is trial 19 with value: 0.9121942635931726.


🏃 View run Trial_21_LightGBM_SMOTE_TFIDF_Trigrams at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216/runs/1c32addf9a0e4b25a72196e269d422b9
🧪 View experiment at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216




[LightGBM] [Info] Number of positive: 12616, number of negative: 12616
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.456516 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 85372
[LightGBM] [Info] Number of data points in the train set: 25232, number of used features: 2200
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.500000 -> initscore=0.000000


[I 2025-03-08 03:13:34,786] Trial 22 finished with value: 0.877705437269048 and parameters: {'n_estimators': 582, 'learning_rate': 0.016306429902060552, 'max_depth': 10, 'num_leaves': 65, 'min_child_samples': 31, 'colsample_bytree': 0.7160829777555895, 'subsample': 0.7163230309381352, 'reg_alpha': 0.013717006112728556, 'reg_lambda': 0.0001056426151721643}. Best is trial 19 with value: 0.9121942635931726.


🏃 View run Trial_22_LightGBM_SMOTE_TFIDF_Trigrams at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216/runs/f97b98d2be424095bfa8d32ece190dd7
🧪 View experiment at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216




[LightGBM] [Info] Number of positive: 12616, number of negative: 12616
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.413979 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 71106
[LightGBM] [Info] Number of data points in the train set: 25232, number of used features: 1245
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.500000 -> initscore=0.000000


[I 2025-03-08 03:14:09,376] Trial 23 finished with value: 0.8945979236318846 and parameters: {'n_estimators': 829, 'learning_rate': 0.04448322670162584, 'max_depth': 10, 'num_leaves': 90, 'min_child_samples': 56, 'colsample_bytree': 0.5087050474606425, 'subsample': 0.9571113305829544, 'reg_alpha': 0.2311770663812741, 'reg_lambda': 0.0006049496229887651}. Best is trial 19 with value: 0.9121942635931726.


🏃 View run Trial_23_LightGBM_SMOTE_TFIDF_Trigrams at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216/runs/1e2b5fadbd8f495aaee3a22ee11e0029
🧪 View experiment at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216




[LightGBM] [Info] Number of positive: 12616, number of negative: 12616
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.557961 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 90630
[LightGBM] [Info] Number of data points in the train set: 25232, number of used features: 2703
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.500000 -> initscore=0.000000


[I 2025-03-08 03:14:45,391] Trial 24 finished with value: 0.8764736934717579 and parameters: {'n_estimators': 808, 'learning_rate': 0.014623602953879475, 'max_depth': 8, 'num_leaves': 102, 'min_child_samples': 25, 'colsample_bytree': 0.8212818541112854, 'subsample': 0.858670771683543, 'reg_alpha': 0.36118183743487836, 'reg_lambda': 0.001334209968199448}. Best is trial 19 with value: 0.9121942635931726.


🏃 View run Trial_24_LightGBM_SMOTE_TFIDF_Trigrams at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216/runs/13677736bafd4050aa96a50331022807
🧪 View experiment at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216




[LightGBM] [Info] Number of positive: 12616, number of negative: 12616
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.267847 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 74425
[LightGBM] [Info] Number of data points in the train set: 25232, number of used features: 1423
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.500000 -> initscore=0.000000


[I 2025-03-08 03:15:15,321] Trial 25 finished with value: 0.9019883864156255 and parameters: {'n_estimators': 646, 'learning_rate': 0.04385594101727628, 'max_depth': 13, 'num_leaves': 55, 'min_child_samples': 49, 'colsample_bytree': 0.8883910429532594, 'subsample': 0.761363713201469, 'reg_alpha': 0.027865445967002973, 'reg_lambda': 0.0002526406832958305}. Best is trial 19 with value: 0.9121942635931726.


🏃 View run Trial_25_LightGBM_SMOTE_TFIDF_Trigrams at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216/runs/fc456bca392646209ad9c80c1d74edb9
🧪 View experiment at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216




[LightGBM] [Info] Number of positive: 12616, number of negative: 12616
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.398323 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 84056
[LightGBM] [Info] Number of data points in the train set: 25232, number of used features: 2090
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.500000 -> initscore=0.000000


[I 2025-03-08 03:15:49,188] Trial 26 finished with value: 0.9181770191800106 and parameters: {'n_estimators': 630, 'learning_rate': 0.048054012220086394, 'max_depth': 13, 'num_leaves': 49, 'min_child_samples': 33, 'colsample_bytree': 0.8884437016161743, 'subsample': 0.7590814887726001, 'reg_alpha': 0.024673150443044717, 'reg_lambda': 0.00020375077355364054}. Best is trial 26 with value: 0.9181770191800106.


🏃 View run Trial_26_LightGBM_SMOTE_TFIDF_Trigrams at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216/runs/ab47913cac9342498be6c211a110cd66
🧪 View experiment at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216




[LightGBM] [Info] Number of positive: 12616, number of negative: 12616
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.441371 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 85372
[LightGBM] [Info] Number of data points in the train set: 25232, number of used features: 2200
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.500000 -> initscore=0.000000


[I 2025-03-08 03:16:26,294] Trial 27 finished with value: 0.8699630476860813 and parameters: {'n_estimators': 519, 'learning_rate': 0.011975844961047814, 'max_depth': 13, 'num_leaves': 49, 'min_child_samples': 31, 'colsample_bytree': 0.9474869134123303, 'subsample': 0.7531785602742143, 'reg_alpha': 0.003099107173059697, 'reg_lambda': 0.0002591265932836776}. Best is trial 26 with value: 0.9181770191800106.


🏃 View run Trial_27_LightGBM_SMOTE_TFIDF_Trigrams at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216/runs/06c09f270e4d46f1847e23d0ac056103
🧪 View experiment at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216




[LightGBM] [Info] Number of positive: 12616, number of negative: 12616
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.355294 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 79942
[LightGBM] [Info] Number of data points in the train set: 25232, number of used features: 1776
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.500000 -> initscore=0.000000


[I 2025-03-08 03:17:00,119] Trial 28 finished with value: 0.8236846735878938 and parameters: {'n_estimators': 635, 'learning_rate': 0.0041543825604903155, 'max_depth': 13, 'num_leaves': 26, 'min_child_samples': 39, 'colsample_bytree': 0.8856975048248965, 'subsample': 0.7645532707649981, 'reg_alpha': 0.07662354142355846, 'reg_lambda': 0.0002616515172893979}. Best is trial 26 with value: 0.9181770191800106.


🏃 View run Trial_28_LightGBM_SMOTE_TFIDF_Trigrams at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216/runs/8322d174512b4e5eb9be084cc5b71a9d
🧪 View experiment at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216




[LightGBM] [Info] Number of positive: 12616, number of negative: 12616
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 2.108737 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 116828
[LightGBM] [Info] Number of data points in the train set: 25232, number of used features: 6864
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.500000 -> initscore=0.000000


[I 2025-03-08 03:17:44,144] Trial 29 finished with value: 0.9313742741509766 and parameters: {'n_estimators': 453, 'learning_rate': 0.05539908413474968, 'max_depth': 14, 'num_leaves': 40, 'min_child_samples': 10, 'colsample_bytree': 0.8415911556969558, 'subsample': 0.6415932664171768, 'reg_alpha': 0.023761644448654876, 'reg_lambda': 0.0012876050573429048}. Best is trial 29 with value: 0.9313742741509766.


🏃 View run Trial_29_LightGBM_SMOTE_TFIDF_Trigrams at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216/runs/10c0b632c01b41ba89b6e98e7f3a9bb9
🧪 View experiment at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216




[LightGBM] [Info] Number of positive: 12616, number of negative: 12616
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 2.540482 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 113733
[LightGBM] [Info] Number of data points in the train set: 25232, number of used features: 6244
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.500000 -> initscore=0.000000


[I 2025-03-08 03:18:34,088] Trial 30 finished with value: 0.780573640682738 and parameters: {'n_estimators': 468, 'learning_rate': 0.0006120678000615081, 'max_depth': 14, 'num_leaves': 38, 'min_child_samples': 11, 'colsample_bytree': 0.8152229467077992, 'subsample': 0.6477358666349338, 'reg_alpha': 0.0049427959007781715, 'reg_lambda': 0.0013104802727713777}. Best is trial 29 with value: 0.9313742741509766.


🏃 View run Trial_30_LightGBM_SMOTE_TFIDF_Trigrams at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216/runs/3babcbb357ae4927999bce376f532464
🧪 View experiment at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216




[LightGBM] [Info] Number of positive: 12616, number of negative: 12616
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 1.420008 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 99702
[LightGBM] [Info] Number of data points in the train set: 25232, number of used features: 3817
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.500000 -> initscore=0.000000


[I 2025-03-08 03:19:12,571] Trial 31 finished with value: 0.9377089565370403 and parameters: {'n_estimators': 645, 'learning_rate': 0.0544462673025585, 'max_depth': 13, 'num_leaves': 24, 'min_child_samples': 18, 'colsample_bytree': 0.8840289021091081, 'subsample': 0.6049390013948165, 'reg_alpha': 0.024076556097195834, 'reg_lambda': 0.0004700448841300435}. Best is trial 31 with value: 0.9377089565370403.


🏃 View run Trial_31_LightGBM_SMOTE_TFIDF_Trigrams at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216/runs/56bc36a71628410599fe75032d083534
🧪 View experiment at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216




[LightGBM] [Info] Number of positive: 12616, number of negative: 12616
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.862662 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 99702
[LightGBM] [Info] Number of data points in the train set: 25232, number of used features: 3817
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.500000 -> initscore=0.000000


[I 2025-03-08 03:19:44,558] Trial 32 finished with value: 0.9343656519443956 and parameters: {'n_estimators': 412, 'learning_rate': 0.05970333530767779, 'max_depth': 15, 'num_leaves': 21, 'min_child_samples': 18, 'colsample_bytree': 0.8703589766494432, 'subsample': 0.6050161565605678, 'reg_alpha': 0.014416426253153982, 'reg_lambda': 0.0006260897668672947}. Best is trial 31 with value: 0.9377089565370403.


🏃 View run Trial_32_LightGBM_SMOTE_TFIDF_Trigrams at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216/runs/c755351642b5426aa931558b55d249a9
🧪 View experiment at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216




[LightGBM] [Info] Number of positive: 12616, number of negative: 12616
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.895157 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 99702
[LightGBM] [Info] Number of data points in the train set: 25232, number of used features: 3817
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.500000 -> initscore=0.000000


[I 2025-03-08 03:20:18,706] Trial 33 finished with value: 0.9348935421432342 and parameters: {'n_estimators': 429, 'learning_rate': 0.06047588837585985, 'max_depth': 15, 'num_leaves': 25, 'min_child_samples': 18, 'colsample_bytree': 0.8519109785685428, 'subsample': 0.6090752735839238, 'reg_alpha': 0.015448216461160185, 'reg_lambda': 0.0007854357048005045}. Best is trial 31 with value: 0.9377089565370403.


🏃 View run Trial_33_LightGBM_SMOTE_TFIDF_Trigrams at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216/runs/529fc0cc6b5542baa22e738d9997c1c3
🧪 View experiment at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216




[LightGBM] [Info] Number of positive: 12616, number of negative: 12616
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 1.689628 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 101206
[LightGBM] [Info] Number of data points in the train set: 25232, number of used features: 4032
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.500000 -> initscore=0.000000


[I 2025-03-08 03:20:54,143] Trial 34 finished with value: 0.9370051029385887 and parameters: {'n_estimators': 411, 'learning_rate': 0.06503184013876594, 'max_depth': 15, 'num_leaves': 22, 'min_child_samples': 17, 'colsample_bytree': 0.8500206339381309, 'subsample': 0.5805764268888737, 'reg_alpha': 0.0016348484027408734, 'reg_lambda': 0.0006248986855325014}. Best is trial 31 with value: 0.9377089565370403.


🏃 View run Trial_34_LightGBM_SMOTE_TFIDF_Trigrams at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216/runs/241e0c2ddfa34207b1d5baebd682f7ef
🧪 View experiment at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216




[LightGBM] [Info] Number of positive: 12616, number of negative: 12616
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.907241 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 99702
[LightGBM] [Info] Number of data points in the train set: 25232, number of used features: 3817
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.500000 -> initscore=0.000000


[I 2025-03-08 03:21:24,644] Trial 35 finished with value: 0.936653176139363 and parameters: {'n_estimators': 402, 'learning_rate': 0.07061387718986605, 'max_depth': 15, 'num_leaves': 22, 'min_child_samples': 18, 'colsample_bytree': 0.7786503689793443, 'subsample': 0.5952006922988422, 'reg_alpha': 0.0008080312914237612, 'reg_lambda': 0.00048024382565924165}. Best is trial 31 with value: 0.9377089565370403.


🏃 View run Trial_35_LightGBM_SMOTE_TFIDF_Trigrams at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216/runs/c4b6f0ca1df74b589ad3399eff37e782
🧪 View experiment at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216




[LightGBM] [Info] Number of positive: 12616, number of negative: 12616
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.813927 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 98233
[LightGBM] [Info] Number of data points in the train set: 25232, number of used features: 3607
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.500000 -> initscore=0.000000


[I 2025-03-08 03:21:53,474] Trial 36 finished with value: 0.9392926271335562 and parameters: {'n_estimators': 364, 'learning_rate': 0.09970358882010606, 'max_depth': 15, 'num_leaves': 30, 'min_child_samples': 19, 'colsample_bytree': 0.759854658218684, 'subsample': 0.5617362420205556, 'reg_alpha': 0.0009894944126514914, 'reg_lambda': 0.01631735067352786}. Best is trial 36 with value: 0.9392926271335562.


🏃 View run Trial_36_LightGBM_SMOTE_TFIDF_Trigrams at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216/runs/2f7b7cdcf1714233aacf7ed39e406d0a
🧪 View experiment at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216




[LightGBM] [Info] Number of positive: 12616, number of negative: 12616
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.632537 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 91682
[LightGBM] [Info] Number of data points in the train set: 25232, number of used features: 2820
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.500000 -> initscore=0.000000


[I 2025-03-08 03:22:20,302] Trial 37 finished with value: 0.9329579447474925 and parameters: {'n_estimators': 370, 'learning_rate': 0.09923616103753169, 'max_depth': 14, 'num_leaves': 31, 'min_child_samples': 24, 'colsample_bytree': 0.7465410189750827, 'subsample': 0.5586448677770411, 'reg_alpha': 0.0010926350509977579, 'reg_lambda': 0.10607753933882468}. Best is trial 36 with value: 0.9392926271335562.


🏃 View run Trial_37_LightGBM_SMOTE_TFIDF_Trigrams at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216/runs/56f628d4f54246fe8e9549e91edc41e5
🧪 View experiment at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216




[LightGBM] [Info] Number of positive: 12616, number of negative: 12616
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 1.027314 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 102905
[LightGBM] [Info] Number of data points in the train set: 25232, number of used features: 4275
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.500000 -> initscore=0.000000


[I 2025-03-08 03:22:44,753] Trial 38 finished with value: 0.9069153616047863 and parameters: {'n_estimators': 166, 'learning_rate': 0.07456895569101481, 'max_depth': 15, 'num_leaves': 33, 'min_child_samples': 16, 'colsample_bytree': 0.7532503434191259, 'subsample': 0.5013674356638474, 'reg_alpha': 0.00032487860759223576, 'reg_lambda': 0.013080624387454666}. Best is trial 36 with value: 0.9392926271335562.


🏃 View run Trial_38_LightGBM_SMOTE_TFIDF_Trigrams at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216/runs/67f0e80791b54824a94ca1180c892a8b
🧪 View experiment at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216




[LightGBM] [Info] Number of positive: 12616, number of negative: 12616
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.584129 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 89792
[LightGBM] [Info] Number of data points in the train set: 25232, number of used features: 2619
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.500000 -> initscore=0.000000


[I 2025-03-08 03:23:10,338] Trial 39 finished with value: 0.8768256202709837 and parameters: {'n_estimators': 290, 'learning_rate': 0.022674729456711742, 'max_depth': 14, 'num_leaves': 29, 'min_child_samples': 26, 'colsample_bytree': 0.7908975541033626, 'subsample': 0.5342831060053901, 'reg_alpha': 0.0011544814522322492, 'reg_lambda': 0.002540799415397931}. Best is trial 36 with value: 0.9392926271335562.


🏃 View run Trial_39_LightGBM_SMOTE_TFIDF_Trigrams at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216/runs/9b5e452be4454e7c9fd990572dd90248
🧪 View experiment at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216




[LightGBM] [Info] Number of positive: 12616, number of negative: 12616
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 1.138509 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 104753
[LightGBM] [Info] Number of data points in the train set: 25232, number of used features: 4583
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.500000 -> initscore=0.000000


[I 2025-03-08 03:23:40,386] Trial 40 finished with value: 0.8428646841456977 and parameters: {'n_estimators': 331, 'learning_rate': 0.010035619629312232, 'max_depth': 15, 'num_leaves': 20, 'min_child_samples': 15, 'colsample_bytree': 0.6559193979395294, 'subsample': 0.5839996567171925, 'reg_alpha': 0.00039771731967477587, 'reg_lambda': 0.07074929689965503}. Best is trial 36 with value: 0.9392926271335562.


🏃 View run Trial_40_LightGBM_SMOTE_TFIDF_Trigrams at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216/runs/3dba7cc5254b4d9194c4d520b61e0aaa
🧪 View experiment at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216




[LightGBM] [Info] Number of positive: 12616, number of negative: 12616
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.751784 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 95360
[LightGBM] [Info] Number of data points in the train set: 25232, number of used features: 3247
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.500000 -> initscore=0.000000


[I 2025-03-08 03:24:14,601] Trial 41 finished with value: 0.9345416153440085 and parameters: {'n_estimators': 490, 'learning_rate': 0.06867144775581277, 'max_depth': 15, 'num_leaves': 26, 'min_child_samples': 21, 'colsample_bytree': 0.8356833306589415, 'subsample': 0.58518477841553, 'reg_alpha': 0.0019348119739467798, 'reg_lambda': 0.0007193519778103264}. Best is trial 36 with value: 0.9392926271335562.


🏃 View run Trial_41_LightGBM_SMOTE_TFIDF_Trigrams at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216/runs/b9da4b19dabd41839308d64927dd2cb6
🧪 View experiment at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216




[LightGBM] [Info] Number of positive: 12616, number of negative: 12616
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 1.222479 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 106486
[LightGBM] [Info] Number of data points in the train set: 25232, number of used features: 4872
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.500000 -> initscore=0.000000


[I 2025-03-08 03:24:53,861] Trial 42 finished with value: 0.7812774942811895 and parameters: {'n_estimators': 375, 'learning_rate': 0.00013225202558646897, 'max_depth': 14, 'num_leaves': 35, 'min_child_samples': 14, 'colsample_bytree': 0.7772069478786287, 'subsample': 0.5475051395270646, 'reg_alpha': 0.0006601755110824347, 'reg_lambda': 0.0004350944062660251}. Best is trial 36 with value: 0.9392926271335562.


🏃 View run Trial_42_LightGBM_SMOTE_TFIDF_Trigrams at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216/runs/e7f3c782a7b74f5c93015bd64b33d2f1
🧪 View experiment at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216




[LightGBM] [Info] Number of positive: 12616, number of negative: 12616
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.769383 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 97047
[LightGBM] [Info] Number of data points in the train set: 25232, number of used features: 3458
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.500000 -> initscore=0.000000


[I 2025-03-08 03:25:18,813] Trial 43 finished with value: 0.9304944571529122 and parameters: {'n_estimators': 211, 'learning_rate': 0.09759105398336357, 'max_depth': 15, 'num_leaves': 42, 'min_child_samples': 20, 'colsample_bytree': 0.7288663630236298, 'subsample': 0.6116120614016572, 'reg_alpha': 0.00749659632760168, 'reg_lambda': 0.0023632023392390093}. Best is trial 36 with value: 0.9392926271335562.


🏃 View run Trial_43_LightGBM_SMOTE_TFIDF_Trigrams at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216/runs/16691b15cba14312aa7192fa5284066e
🧪 View experiment at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216




[LightGBM] [Info] Number of positive: 12616, number of negative: 12616
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.569434 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 89792
[LightGBM] [Info] Number of data points in the train set: 25232, number of used features: 2619
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.500000 -> initscore=0.000000


[I 2025-03-08 03:25:47,614] Trial 44 finished with value: 0.7582262889319021 and parameters: {'n_estimators': 410, 'learning_rate': 0.0002659964329627994, 'max_depth': 13, 'num_leaves': 21, 'min_child_samples': 26, 'colsample_bytree': 0.858107076850405, 'subsample': 0.6715136974465769, 'reg_alpha': 0.0001842217129233019, 'reg_lambda': 0.01970945228512842}. Best is trial 36 with value: 0.9392926271335562.


🏃 View run Trial_44_LightGBM_SMOTE_TFIDF_Trigrams at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216/runs/547416a2256f407086a83454d17c982e
🧪 View experiment at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216




[LightGBM] [Info] Number of positive: 12616, number of negative: 12616
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 1.221253 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 97047
[LightGBM] [Info] Number of data points in the train set: 25232, number of used features: 3458
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.500000 -> initscore=0.000000


[I 2025-03-08 03:26:23,723] Trial 45 finished with value: 0.9005806792187225 and parameters: {'n_estimators': 544, 'learning_rate': 0.01980542985413324, 'max_depth': 15, 'num_leaves': 27, 'min_child_samples': 20, 'colsample_bytree': 0.7813010610083189, 'subsample': 0.5692306363901107, 'reg_alpha': 0.002919668679989723, 'reg_lambda': 0.0012295645688822556}. Best is trial 36 with value: 0.9392926271335562.


🏃 View run Trial_45_LightGBM_SMOTE_TFIDF_Trigrams at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216/runs/653694befe8d4326aa44d8d55c9b4f2f
🧪 View experiment at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216




[LightGBM] [Info] Number of positive: 12616, number of negative: 12616
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.223381 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 59649
[LightGBM] [Info] Number of data points in the train set: 25232, number of used features: 773
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.500000 -> initscore=0.000000


[I 2025-03-08 03:26:45,297] Trial 46 finished with value: 0.8618687313038887 and parameters: {'n_estimators': 333, 'learning_rate': 0.06512494496300686, 'max_depth': 12, 'num_leaves': 34, 'min_child_samples': 88, 'colsample_bytree': 0.9667163930822007, 'subsample': 0.5313973472741824, 'reg_alpha': 0.0015830694473537095, 'reg_lambda': 0.18795401917667365}. Best is trial 36 with value: 0.9392926271335562.


🏃 View run Trial_46_LightGBM_SMOTE_TFIDF_Trigrams at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216/runs/784839294030456aa8409f6706d1c252
🧪 View experiment at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216




[LightGBM] [Info] Number of positive: 12616, number of negative: 12616
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 1.228501 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 106486
[LightGBM] [Info] Number of data points in the train set: 25232, number of used features: 4872
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.500000 -> initscore=0.000000


[I 2025-03-08 03:27:25,166] Trial 47 finished with value: 0.9151856413865916 and parameters: {'n_estimators': 451, 'learning_rate': 0.033664925549348634, 'max_depth': 14, 'num_leaves': 44, 'min_child_samples': 14, 'colsample_bytree': 0.8290088049231927, 'subsample': 0.5946559751398943, 'reg_alpha': 0.0069629766114962495, 'reg_lambda': 0.0004344220219526452}. Best is trial 36 with value: 0.9392926271335562.


🏃 View run Trial_47_LightGBM_SMOTE_TFIDF_Trigrams at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216/runs/8f19624815bb4967a4b39b1d9a7751df
🧪 View experiment at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216




[LightGBM] [Info] Number of positive: 12616, number of negative: 12616
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.558555 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 88903
[LightGBM] [Info] Number of data points in the train set: 25232, number of used features: 2530
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.500000 -> initscore=0.000000


[I 2025-03-08 03:27:57,862] Trial 48 finished with value: 0.9283828963575577 and parameters: {'n_estimators': 500, 'learning_rate': 0.07643833610605105, 'max_depth': 15, 'num_leaves': 150, 'min_child_samples': 27, 'colsample_bytree': 0.801975118917914, 'subsample': 0.6358446414201504, 'reg_alpha': 0.0006147175228999016, 'reg_lambda': 0.46588260866749703}. Best is trial 36 with value: 0.9392926271335562.


🏃 View run Trial_48_LightGBM_SMOTE_TFIDF_Trigrams at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216/runs/7a7e5fa7bbca467c9b66c616958b3b61
🧪 View experiment at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216




[LightGBM] [Info] Number of positive: 12616, number of negative: 12616
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.656562 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 94089
[LightGBM] [Info] Number of data points in the train set: 25232, number of used features: 3088
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.500000 -> initscore=0.000000


[I 2025-03-08 03:28:33,455] Trial 49 finished with value: 0.8141826500087982 and parameters: {'n_estimators': 277, 'learning_rate': 0.007080217172050472, 'max_depth': 13, 'num_leaves': 129, 'min_child_samples': 22, 'colsample_bytree': 0.8617971031995446, 'subsample': 0.6686658979982558, 'reg_alpha': 0.00026642874555621077, 'reg_lambda': 0.0028916238167854508}. Best is trial 36 with value: 0.9392926271335562.


🏃 View run Trial_49_LightGBM_SMOTE_TFIDF_Trigrams at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216/runs/dd7ec24c9b4445ec80dd431819f3850e
🧪 View experiment at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216




[LightGBM] [Info] Number of positive: 12616, number of negative: 12616
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 2.591197 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 116828
[LightGBM] [Info] Number of data points in the train set: 25232, number of used features: 6864
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.500000 -> initscore=0.000000


[I 2025-03-08 03:29:12,799] Trial 50 finished with value: 0.7858525426711244 and parameters: {'n_estimators': 387, 'learning_rate': 0.0027682691847588973, 'max_depth': 11, 'num_leaves': 24, 'min_child_samples': 10, 'colsample_bytree': 0.7612366564984467, 'subsample': 0.5646605521308489, 'reg_alpha': 0.000691486398838436, 'reg_lambda': 0.045977253133214276}. Best is trial 36 with value: 0.9392926271335562.


🏃 View run Trial_50_LightGBM_SMOTE_TFIDF_Trigrams at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216/runs/430c280859b941e8b3f57ef55bf75cfb
🧪 View experiment at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216




[LightGBM] [Info] Number of positive: 12616, number of negative: 12616
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.813437 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 98233
[LightGBM] [Info] Number of data points in the train set: 25232, number of used features: 3607
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.500000 -> initscore=0.000000


[I 2025-03-08 03:29:47,417] Trial 51 finished with value: 0.9348935421432342 and parameters: {'n_estimators': 480, 'learning_rate': 0.055035132217095585, 'max_depth': 15, 'num_leaves': 28, 'min_child_samples': 19, 'colsample_bytree': 0.8384814324675297, 'subsample': 0.5852483171107608, 'reg_alpha': 0.001975422049076963, 'reg_lambda': 0.0008668530289079308}. Best is trial 36 with value: 0.9392926271335562.


🏃 View run Trial_51_LightGBM_SMOTE_TFIDF_Trigrams at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216/runs/0549d35d9d894419a1fa956352d4cacb
🧪 View experiment at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216




[LightGBM] [Info] Number of positive: 12616, number of negative: 12616
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 1.053929 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 102905
[LightGBM] [Info] Number of data points in the train set: 25232, number of used features: 4275
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.500000 -> initscore=0.000000


[I 2025-03-08 03:30:21,637] Trial 52 finished with value: 0.9333098715467183 and parameters: {'n_estimators': 419, 'learning_rate': 0.05367053655759804, 'max_depth': 15, 'num_leaves': 31, 'min_child_samples': 16, 'colsample_bytree': 0.8464588965456176, 'subsample': 0.6167387330135928, 'reg_alpha': 0.0018379299739441606, 'reg_lambda': 0.0009577222725213183}. Best is trial 36 with value: 0.9392926271335562.


🏃 View run Trial_52_LightGBM_SMOTE_TFIDF_Trigrams at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216/runs/17806a0f9bcf478ea35af0496abd15a5
🧪 View experiment at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216




[LightGBM] [Info] Number of positive: 12616, number of negative: 12616
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.500463 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 87953
[LightGBM] [Info] Number of data points in the train set: 25232, number of used features: 2435
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.500000 -> initscore=0.000000


[I 2025-03-08 03:30:52,410] Trial 53 finished with value: 0.8986450818229809 and parameters: {'n_estimators': 320, 'learning_rate': 0.031898611200407025, 'max_depth': 14, 'num_leaves': 36, 'min_child_samples': 28, 'colsample_bytree': 0.8765926696218533, 'subsample': 0.5362065806378459, 'reg_alpha': 0.004357684475743806, 'reg_lambda': 0.00051283658500807}. Best is trial 36 with value: 0.9392926271335562.


🏃 View run Trial_53_LightGBM_SMOTE_TFIDF_Trigrams at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216/runs/eba55ac7d96646e690ef671887ab9bef
🧪 View experiment at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216




[LightGBM] [Info] Number of positive: 12616, number of negative: 12616
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.837733 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 98233
[LightGBM] [Info] Number of data points in the train set: 25232, number of used features: 3607
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.500000 -> initscore=0.000000


[I 2025-03-08 03:31:22,834] Trial 54 finished with value: 0.9378849199366531 and parameters: {'n_estimators': 441, 'learning_rate': 0.07799019622440423, 'max_depth': 14, 'num_leaves': 20, 'min_child_samples': 19, 'colsample_bytree': 0.8099402573238552, 'subsample': 0.598204012744061, 'reg_alpha': 0.009717710921519025, 'reg_lambda': 0.00203913246513761}. Best is trial 36 with value: 0.9392926271335562.


🏃 View run Trial_54_LightGBM_SMOTE_TFIDF_Trigrams at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216/runs/3682b42801494abbbed6b83f54b759b0
🧪 View experiment at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216




[LightGBM] [Info] Number of positive: 12616, number of negative: 12616
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 2.315223 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 108854
[LightGBM] [Info] Number of data points in the train set: 25232, number of used features: 5268
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.500000 -> initscore=0.000000


[I 2025-03-08 03:31:49,591] Trial 55 finished with value: 0.9239838113672356 and parameters: {'n_estimators': 232, 'learning_rate': 0.08153928765819832, 'max_depth': 14, 'num_leaves': 20, 'min_child_samples': 13, 'colsample_bytree': 0.8030370839662718, 'subsample': 0.6598882127230746, 'reg_alpha': 0.01198772672787817, 'reg_lambda': 0.001859503784243607}. Best is trial 36 with value: 0.9392926271335562.


🏃 View run Trial_55_LightGBM_SMOTE_TFIDF_Trigrams at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216/runs/4709fd390cb846279776d2f0b9476a89
🧪 View experiment at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216




[LightGBM] [Info] Number of positive: 12616, number of negative: 12616
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.393139 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 81757
[LightGBM] [Info] Number of data points in the train set: 25232, number of used features: 1909
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.500000 -> initscore=0.000000


[I 2025-03-08 03:32:21,717] Trial 56 finished with value: 0.9169452753827204 and parameters: {'n_estimators': 763, 'learning_rate': 0.0986797282033016, 'max_depth': 12, 'num_leaves': 25, 'min_child_samples': 36, 'colsample_bytree': 0.766811331357412, 'subsample': 0.6261534171596842, 'reg_alpha': 0.05616306323658215, 'reg_lambda': 0.006038913511641784}. Best is trial 36 with value: 0.9392926271335562.


🏃 View run Trial_56_LightGBM_SMOTE_TFIDF_Trigrams at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216/runs/2b69f4a9dff8486586a2b2e043f07ad2
🧪 View experiment at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216




[LightGBM] [Info] Number of positive: 12616, number of negative: 12616
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.337688 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 77457
[LightGBM] [Info] Number of data points in the train set: 25232, number of used features: 1607
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.500000 -> initscore=0.000000


[I 2025-03-08 03:32:41,074] Trial 57 finished with value: 0.8516628541263417 and parameters: {'n_estimators': 556, 'learning_rate': 0.03570720676662766, 'max_depth': 3, 'num_leaves': 38, 'min_child_samples': 43, 'colsample_bytree': 0.7447334026696206, 'subsample': 0.6877105749321578, 'reg_alpha': 0.009918387000990752, 'reg_lambda': 0.00017520017296625078}. Best is trial 36 with value: 0.9392926271335562.


🏃 View run Trial_57_LightGBM_SMOTE_TFIDF_Trigrams at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216/runs/fde5df4d58de4d99b82ea56052146b6c
🧪 View experiment at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216




[LightGBM] [Info] Number of positive: 12616, number of negative: 12616
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 1.030096 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 92752
[LightGBM] [Info] Number of data points in the train set: 25232, number of used features: 2939
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.500000 -> initscore=0.000000


[I 2025-03-08 03:33:09,646] Trial 58 finished with value: 0.7233855358085518 and parameters: {'n_estimators': 435, 'learning_rate': 0.0014912336604748562, 'max_depth': 5, 'num_leaves': 32, 'min_child_samples': 23, 'colsample_bytree': 0.9450912363558751, 'subsample': 0.6034109037055205, 'reg_alpha': 0.03672530893646601, 'reg_lambda': 0.003547506614920813}. Best is trial 36 with value: 0.9392926271335562.


🏃 View run Trial_58_LightGBM_SMOTE_TFIDF_Trigrams at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216/runs/dff14004c18b4290af5d56e76c04ecba
🧪 View experiment at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216




[LightGBM] [Info] Number of positive: 12616, number of negative: 12616
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.926953 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 101206
[LightGBM] [Info] Number of data points in the train set: 25232, number of used features: 4032
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.500000 -> initscore=0.000000


[I 2025-03-08 03:33:44,120] Trial 59 finished with value: 0.8921344360373042 and parameters: {'n_estimators': 359, 'learning_rate': 0.027562970693667085, 'max_depth': 13, 'num_leaves': 46, 'min_child_samples': 17, 'colsample_bytree': 0.9015563763446961, 'subsample': 0.5192278386608166, 'reg_alpha': 0.00010046854429536659, 'reg_lambda': 0.0003198525978698326}. Best is trial 36 with value: 0.9392926271335562.


🏃 View run Trial_59_LightGBM_SMOTE_TFIDF_Trigrams at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216/runs/de480a2c479f4f00b5d73be948b43d1c
🧪 View experiment at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216




[LightGBM] [Info] Number of positive: 12616, number of negative: 12616
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.523094 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 87953
[LightGBM] [Info] Number of data points in the train set: 25232, number of used features: 2435
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.500000 -> initscore=0.000000


[I 2025-03-08 03:34:07,364] Trial 60 finished with value: 0.9236318845680098 and parameters: {'n_estimators': 300, 'learning_rate': 0.06939833386728982, 'max_depth': 15, 'num_leaves': 24, 'min_child_samples': 28, 'colsample_bytree': 0.6635786022822966, 'subsample': 0.55392422004866, 'reg_alpha': 0.018641218343707255, 'reg_lambda': 0.010797336647428319}. Best is trial 36 with value: 0.9392926271335562.


🏃 View run Trial_60_LightGBM_SMOTE_TFIDF_Trigrams at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216/runs/9e302e4c72bc4843959e2536952ced2f
🧪 View experiment at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216




[LightGBM] [Info] Number of positive: 12616, number of negative: 12616
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.891620 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 99702
[LightGBM] [Info] Number of data points in the train set: 25232, number of used features: 3817
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.500000 -> initscore=0.000000


[I 2025-03-08 03:34:41,723] Trial 61 finished with value: 0.9347175787436214 and parameters: {'n_estimators': 485, 'learning_rate': 0.05137210018089143, 'max_depth': 14, 'num_leaves': 29, 'min_child_samples': 18, 'colsample_bytree': 0.8279362404298616, 'subsample': 0.5787323371986626, 'reg_alpha': 0.0055066715761329784, 'reg_lambda': 0.0007847026045135076}. Best is trial 36 with value: 0.9392926271335562.


🏃 View run Trial_61_LightGBM_SMOTE_TFIDF_Trigrams at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216/runs/6d4d0e505c6e4772b44743a949392f31
🧪 View experiment at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216




[LightGBM] [Info] Number of positive: 12616, number of negative: 12616
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.708999 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 94089
[LightGBM] [Info] Number of data points in the train set: 25232, number of used features: 3088
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.500000 -> initscore=0.000000


[I 2025-03-08 03:35:16,739] Trial 62 finished with value: 0.9340137251451698 and parameters: {'n_estimators': 518, 'learning_rate': 0.05564327917304468, 'max_depth': 15, 'num_leaves': 28, 'min_child_samples': 22, 'colsample_bytree': 0.8486918287236569, 'subsample': 0.5916710055027943, 'reg_alpha': 0.003042076906908053, 'reg_lambda': 0.0019983602576390557}. Best is trial 36 with value: 0.9392926271335562.


🏃 View run Trial_62_LightGBM_SMOTE_TFIDF_Trigrams at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216/runs/6330104b8c3048be907dcae1c0c53f37
🧪 View experiment at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216




[LightGBM] [Info] Number of positive: 12616, number of negative: 12616
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 2.015274 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 111143
[LightGBM] [Info] Number of data points in the train set: 25232, number of used features: 5726
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.500000 -> initscore=0.000000


[I 2025-03-08 03:35:59,624] Trial 63 finished with value: 0.9336617983459441 and parameters: {'n_estimators': 567, 'learning_rate': 0.0400539068921284, 'max_depth': 15, 'num_leaves': 20, 'min_child_samples': 12, 'colsample_bytree': 0.7982384052751548, 'subsample': 0.5710800098052572, 'reg_alpha': 0.0008517607757215979, 'reg_lambda': 0.0003805397506161702}. Best is trial 36 with value: 0.9392926271335562.


🏃 View run Trial_63_LightGBM_SMOTE_TFIDF_Trigrams at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216/runs/9c4db7c60992449ea4300810a5ece49f
🧪 View experiment at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216




[LightGBM] [Info] Number of positive: 12616, number of negative: 12616
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.891609 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 98233
[LightGBM] [Info] Number of data points in the train set: 25232, number of used features: 3607
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.500000 -> initscore=0.000000


[I 2025-03-08 03:36:34,056] Trial 64 finished with value: 0.9377089565370403 and parameters: {'n_estimators': 449, 'learning_rate': 0.07914048688015166, 'max_depth': 14, 'num_leaves': 56, 'min_child_samples': 19, 'colsample_bytree': 0.8156761786168271, 'subsample': 0.624700458808784, 'reg_alpha': 0.0023304205915694477, 'reg_lambda': 0.0009409165847178247}. Best is trial 36 with value: 0.9392926271335562.


🏃 View run Trial_64_LightGBM_SMOTE_TFIDF_Trigrams at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216/runs/a4e91d3318cd4f4fb65f16efedf917dd
🧪 View experiment at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216




[LightGBM] [Info] Number of positive: 12616, number of negative: 12616
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.507394 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 86087
[LightGBM] [Info] Number of data points in the train set: 25232, number of used features: 2265
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.500000 -> initscore=0.000000


[I 2025-03-08 03:37:02,525] Trial 65 finished with value: 0.9232799577687841 and parameters: {'n_estimators': 390, 'learning_rate': 0.07457569449605261, 'max_depth': 14, 'num_leaves': 61, 'min_child_samples': 30, 'colsample_bytree': 0.7240358073563318, 'subsample': 0.6255886424462215, 'reg_alpha': 0.0014249861675528965, 'reg_lambda': 0.001777558551397563}. Best is trial 36 with value: 0.9392926271335562.


🏃 View run Trial_65_LightGBM_SMOTE_TFIDF_Trigrams at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216/runs/17da52e2dd4d4b25b20ad8a3f09bf3d3
🧪 View experiment at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216




[LightGBM] [Info] Number of positive: 12616, number of negative: 12616
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.612119 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 91682
[LightGBM] [Info] Number of data points in the train set: 25232, number of used features: 2820
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.500000 -> initscore=0.000000


[I 2025-03-08 03:37:32,345] Trial 66 finished with value: 0.9326060179482668 and parameters: {'n_estimators': 429, 'learning_rate': 0.08404664976697986, 'max_depth': 13, 'num_leaves': 41, 'min_child_samples': 24, 'colsample_bytree': 0.7852592614762636, 'subsample': 0.6547151000743446, 'reg_alpha': 0.01719478647703278, 'reg_lambda': 0.006551906349895862}. Best is trial 36 with value: 0.9392926271335562.


🏃 View run Trial_66_LightGBM_SMOTE_TFIDF_Trigrams at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216/runs/30142aabf3b0474280bec886c689b048
🧪 View experiment at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216




[LightGBM] [Info] Number of positive: 12616, number of negative: 12616
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 1.251406 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 101206
[LightGBM] [Info] Number of data points in the train set: 25232, number of used features: 4032
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.500000 -> initscore=0.000000


[I 2025-03-08 03:38:21,335] Trial 67 finished with value: 0.9340137251451698 and parameters: {'n_estimators': 675, 'learning_rate': 0.04526535490759623, 'max_depth': 12, 'num_leaves': 54, 'min_child_samples': 17, 'colsample_bytree': 0.8152410549981813, 'subsample': 0.6016990830855187, 'reg_alpha': 0.0004371026482091291, 'reg_lambda': 0.0010308072363143233}. Best is trial 36 with value: 0.9392926271335562.


🏃 View run Trial_67_LightGBM_SMOTE_TFIDF_Trigrams at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216/runs/37c32dbe24384fda827a1269edc224a9
🧪 View experiment at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216




[LightGBM] [Info] Number of positive: 12616, number of negative: 12616
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.407837 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 82571
[LightGBM] [Info] Number of data points in the train set: 25232, number of used features: 1972
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.500000 -> initscore=0.000000


[I 2025-03-08 03:38:55,012] Trial 68 finished with value: 0.9162414217842688 and parameters: {'n_estimators': 452, 'learning_rate': 0.06076408845647798, 'max_depth': 14, 'num_leaves': 50, 'min_child_samples': 35, 'colsample_bytree': 0.5820015593473339, 'subsample': 0.63249035125544, 'reg_alpha': 0.004155387576551898, 'reg_lambda': 0.00019693736181471467}. Best is trial 36 with value: 0.9392926271335562.


🏃 View run Trial_68_LightGBM_SMOTE_TFIDF_Trigrams at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216/runs/5bb5ccfe1f23415ea0ce34ba33bc3f55
🧪 View experiment at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216




[LightGBM] [Info] Number of positive: 12616, number of negative: 12616
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 1.225259 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 106486
[LightGBM] [Info] Number of data points in the train set: 25232, number of used features: 4872
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.500000 -> initscore=0.000000


[I 2025-03-08 03:39:26,215] Trial 69 finished with value: 0.8660918528945979 and parameters: {'n_estimators': 254, 'learning_rate': 0.021690109562665556, 'max_depth': 14, 'num_leaves': 36, 'min_child_samples': 14, 'colsample_bytree': 0.900426091758763, 'subsample': 0.8104720790041305, 'reg_alpha': 0.10244936843780236, 'reg_lambda': 0.0005656021355529554}. Best is trial 36 with value: 0.9392926271335562.


🏃 View run Trial_69_LightGBM_SMOTE_TFIDF_Trigrams at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216/runs/a54a0b788e9049e29fe5f26f5ce61490
🧪 View experiment at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216




[LightGBM] [Info] Number of positive: 12616, number of negative: 12616
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.337029 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 68219
[LightGBM] [Info] Number of data points in the train set: 25232, number of used features: 1106
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.500000 -> initscore=0.000000


[I 2025-03-08 03:39:47,744] Trial 70 finished with value: 0.8342424775646665 and parameters: {'n_estimators': 338, 'learning_rate': 0.015693480464753003, 'max_depth': 9, 'num_leaves': 23, 'min_child_samples': 62, 'colsample_bytree': 0.8701883028515218, 'subsample': 0.5473767038153386, 'reg_alpha': 0.0002321316845730048, 'reg_lambda': 1.9097101280058952}. Best is trial 36 with value: 0.9392926271335562.


🏃 View run Trial_70_LightGBM_SMOTE_TFIDF_Trigrams at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216/runs/9e3874c2ebde4e60b762919bcd6b1459
🧪 View experiment at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216




[LightGBM] [Info] Number of positive: 12616, number of negative: 12616
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.872074 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 98233
[LightGBM] [Info] Number of data points in the train set: 25232, number of used features: 3607
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.500000 -> initscore=0.000000


[I 2025-03-08 03:40:23,410] Trial 71 finished with value: 0.9343656519443956 and parameters: {'n_estimators': 469, 'learning_rate': 0.051037797067969064, 'max_depth': 15, 'num_leaves': 28, 'min_child_samples': 19, 'colsample_bytree': 0.8203010248860562, 'subsample': 0.5808026808721579, 'reg_alpha': 0.0021482845565028545, 'reg_lambda': 0.001019451859575288}. Best is trial 36 with value: 0.9392926271335562.


🏃 View run Trial_71_LightGBM_SMOTE_TFIDF_Trigrams at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216/runs/b70804f3d3c74ddb81fee4415b73ee56
🧪 View experiment at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216




[LightGBM] [Info] Number of positive: 12616, number of negative: 12616
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.813436 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 97047
[LightGBM] [Info] Number of data points in the train set: 25232, number of used features: 3458
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.500000 -> initscore=0.000000


[I 2025-03-08 03:40:59,849] Trial 72 finished with value: 0.9378849199366531 and parameters: {'n_estimators': 511, 'learning_rate': 0.08413490179649052, 'max_depth': 15, 'num_leaves': 32, 'min_child_samples': 20, 'colsample_bytree': 0.8395929550603587, 'subsample': 0.7327190395435205, 'reg_alpha': 0.0009700589874777594, 'reg_lambda': 0.0007852844430402962}. Best is trial 36 with value: 0.9392926271335562.


🏃 View run Trial_72_LightGBM_SMOTE_TFIDF_Trigrams at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216/runs/57b60e1dd957485796e3739dbd84c2a9
🧪 View experiment at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216




[LightGBM] [Info] Number of positive: 12616, number of negative: 12616
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.689526 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 94089
[LightGBM] [Info] Number of data points in the train set: 25232, number of used features: 3088
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.500000 -> initscore=0.000000


[I 2025-03-08 03:41:32,291] Trial 73 finished with value: 0.9354214323420729 and parameters: {'n_estimators': 517, 'learning_rate': 0.08485359734039137, 'max_depth': 14, 'num_leaves': 32, 'min_child_samples': 22, 'colsample_bytree': 0.7756741095777164, 'subsample': 0.6808437440423869, 'reg_alpha': 0.0009386164032885408, 'reg_lambda': 0.0003248307583483945}. Best is trial 36 with value: 0.9392926271335562.


🏃 View run Trial_73_LightGBM_SMOTE_TFIDF_Trigrams at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216/runs/19f93d9c9c8d4a82aedf753856a3450d
🧪 View experiment at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216




[LightGBM] [Info] Number of positive: 12616, number of negative: 12616
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.738418 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 94089
[LightGBM] [Info] Number of data points in the train set: 25232, number of used features: 3088
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.500000 -> initscore=0.000000


[I 2025-03-08 03:42:08,015] Trial 74 finished with value: 0.9350695055428471 and parameters: {'n_estimators': 612, 'learning_rate': 0.08353699193490116, 'max_depth': 14, 'num_leaves': 34, 'min_child_samples': 22, 'colsample_bytree': 0.7729854576121364, 'subsample': 0.729762025460741, 'reg_alpha': 0.0009330921029531808, 'reg_lambda': 0.0001377532316085374}. Best is trial 36 with value: 0.9392926271335562.


🏃 View run Trial_74_LightGBM_SMOTE_TFIDF_Trigrams at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216/runs/339f589370424c238c6dd79e009dc34b
🧪 View experiment at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216




[LightGBM] [Info] Number of positive: 12616, number of negative: 12616
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.493212 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 86900
[LightGBM] [Info] Number of data points in the train set: 25232, number of used features: 2339
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.500000 -> initscore=0.000000


[I 2025-03-08 03:42:37,708] Trial 75 finished with value: 0.9246876649656871 and parameters: {'n_estimators': 509, 'learning_rate': 0.08485308483778922, 'max_depth': 13, 'num_leaves': 39, 'min_child_samples': 29, 'colsample_bytree': 0.7390829508474459, 'subsample': 0.6961030030473837, 'reg_alpha': 0.0004701825789933223, 'reg_lambda': 0.0003430181439537846}. Best is trial 36 with value: 0.9392926271335562.


🏃 View run Trial_75_LightGBM_SMOTE_TFIDF_Trigrams at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216/runs/a423b74cc1ad43bfb39b2e09915e5ef1
🧪 View experiment at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216




[LightGBM] [Info] Number of positive: 12616, number of negative: 12616
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.601857 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 90630
[LightGBM] [Info] Number of data points in the train set: 25232, number of used features: 2703
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.500000 -> initscore=0.000000


[I 2025-03-08 03:43:13,693] Trial 76 finished with value: 0.9245117015660742 and parameters: {'n_estimators': 581, 'learning_rate': 0.03750515054661333, 'max_depth': 13, 'num_leaves': 44, 'min_child_samples': 25, 'colsample_bytree': 0.8095995863612286, 'subsample': 0.7132743859518634, 'reg_alpha': 0.0012675184084633556, 'reg_lambda': 0.0002704278574251099}. Best is trial 36 with value: 0.9392926271335562.


🏃 View run Trial_76_LightGBM_SMOTE_TFIDF_Trigrams at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216/runs/cf8d183e595f45a5989a0112aa9b9517
🧪 View experiment at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216




[LightGBM] [Info] Number of positive: 12616, number of negative: 12616
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 1.611817 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 111143
[LightGBM] [Info] Number of data points in the train set: 25232, number of used features: 5726
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.500000 -> initscore=0.000000


[I 2025-03-08 03:43:56,999] Trial 77 finished with value: 0.9407003343304593 and parameters: {'n_estimators': 537, 'learning_rate': 0.06977583423194492, 'max_depth': 14, 'num_leaves': 31, 'min_child_samples': 12, 'colsample_bytree': 0.789186255834979, 'subsample': 0.7389368362368008, 'reg_alpha': 0.0008843887770866091, 'reg_lambda': 0.0016204967064176216}. Best is trial 77 with value: 0.9407003343304593.


🏃 View run Trial_77_LightGBM_SMOTE_TFIDF_Trigrams at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216/runs/81065b35877d4b0281fa6d0cfc5e81f8
🧪 View experiment at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216




[LightGBM] [Info] Number of positive: 12616, number of negative: 12616
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 2.561684 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 116828
[LightGBM] [Info] Number of data points in the train set: 25232, number of used features: 6864
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.500000 -> initscore=0.000000


[I 2025-03-08 03:44:49,260] Trial 78 finished with value: 0.9417561147281366 and parameters: {'n_estimators': 544, 'learning_rate': 0.06777934209189987, 'max_depth': 14, 'num_leaves': 68, 'min_child_samples': 10, 'colsample_bytree': 0.7917734009291438, 'subsample': 0.7964379744197597, 'reg_alpha': 0.0026698680408938137, 'reg_lambda': 0.0016519341007931617}. Best is trial 78 with value: 0.9417561147281366.


🏃 View run Trial_78_LightGBM_SMOTE_TFIDF_Trigrams at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216/runs/67a1850a95c047f296175f02c0e95b14
🧪 View experiment at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216




[LightGBM] [Info] Number of positive: 12616, number of negative: 12616
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 2.985009 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 116828
[LightGBM] [Info] Number of data points in the train set: 25232, number of used features: 6864
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.500000 -> initscore=0.000000


[I 2025-03-08 03:45:47,497] Trial 79 finished with value: 0.9146577511877529 and parameters: {'n_estimators': 544, 'learning_rate': 0.027793871277966304, 'max_depth': 14, 'num_leaves': 76, 'min_child_samples': 10, 'colsample_bytree': 0.788368791813413, 'subsample': 0.7765149156672173, 'reg_alpha': 0.002444575567501615, 'reg_lambda': 0.0032691803694136572}. Best is trial 78 with value: 0.9417561147281366.


🏃 View run Trial_79_LightGBM_SMOTE_TFIDF_Trigrams at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216/runs/aec569262ecc475e81fc82ee5a3c2f66
🧪 View experiment at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216




[LightGBM] [Info] Number of positive: 12616, number of negative: 12616
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 1.751205 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 111143
[LightGBM] [Info] Number of data points in the train set: 25232, number of used features: 5726
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.500000 -> initscore=0.000000


[I 2025-03-08 03:46:36,599] Trial 80 finished with value: 0.9473869435157487 and parameters: {'n_estimators': 734, 'learning_rate': 0.09996404758330076, 'max_depth': 12, 'num_leaves': 68, 'min_child_samples': 12, 'colsample_bytree': 0.7591862290578595, 'subsample': 0.8095098802101697, 'reg_alpha': 0.006603534220899986, 'reg_lambda': 0.004401248579432732}. Best is trial 80 with value: 0.9473869435157487.


🏃 View run Trial_80_LightGBM_SMOTE_TFIDF_Trigrams at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216/runs/8cce18acc6134d9fb13381d63f844811
🧪 View experiment at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216




[LightGBM] [Info] Number of positive: 12616, number of negative: 12616
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 1.326285 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 106486
[LightGBM] [Info] Number of data points in the train set: 25232, number of used features: 4872
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.500000 -> initscore=0.000000


[I 2025-03-08 03:47:25,387] Trial 81 finished with value: 0.9438676755234912 and parameters: {'n_estimators': 764, 'learning_rate': 0.09882423114574092, 'max_depth': 13, 'num_leaves': 66, 'min_child_samples': 14, 'colsample_bytree': 0.7589681225540601, 'subsample': 0.8853458003400199, 'reg_alpha': 0.0065143518889292755, 'reg_lambda': 0.0015146316076936896}. Best is trial 80 with value: 0.9473869435157487.


🏃 View run Trial_81_LightGBM_SMOTE_TFIDF_Trigrams at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216/runs/19fe3172541e4bd3a2904e8a83a309db
🧪 View experiment at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216




[LightGBM] [Info] Number of positive: 12616, number of negative: 12616
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 1.637084 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 111143
[LightGBM] [Info] Number of data points in the train set: 25232, number of used features: 5726
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.500000 -> initscore=0.000000


[I 2025-03-08 03:48:13,403] Trial 82 finished with value: 0.9463311631180714 and parameters: {'n_estimators': 740, 'learning_rate': 0.09841938015042959, 'max_depth': 12, 'num_leaves': 68, 'min_child_samples': 12, 'colsample_bytree': 0.7548864940596445, 'subsample': 0.8137774195203267, 'reg_alpha': 0.007961312196516074, 'reg_lambda': 0.004626565039695439}. Best is trial 80 with value: 0.9473869435157487.


🏃 View run Trial_82_LightGBM_SMOTE_TFIDF_Trigrams at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216/runs/afa452603a7b427099c111f9a91bedbe
🧪 View experiment at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216




[LightGBM] [Info] Number of positive: 12616, number of negative: 12616
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 1.623861 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 111143
[LightGBM] [Info] Number of data points in the train set: 25232, number of used features: 5726
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.500000 -> initscore=0.000000


[I 2025-03-08 03:49:03,084] Trial 83 finished with value: 0.9465071265176843 and parameters: {'n_estimators': 869, 'learning_rate': 0.09309321798517724, 'max_depth': 11, 'num_leaves': 68, 'min_child_samples': 12, 'colsample_bytree': 0.7158209053383676, 'subsample': 0.870076166523505, 'reg_alpha': 0.006765128082550438, 'reg_lambda': 0.0041160016694277235}. Best is trial 80 with value: 0.9473869435157487.


🏃 View run Trial_83_LightGBM_SMOTE_TFIDF_Trigrams at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216/runs/6c91e124ea6d41bd98f9125a5bab0ebb
🧪 View experiment at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216




[LightGBM] [Info] Number of positive: 12616, number of negative: 12616
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 1.633051 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 111143
[LightGBM] [Info] Number of data points in the train set: 25232, number of used features: 5726
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.500000 -> initscore=0.000000


[I 2025-03-08 03:49:53,921] Trial 84 finished with value: 0.9475629069153616 and parameters: {'n_estimators': 895, 'learning_rate': 0.09828378001350921, 'max_depth': 11, 'num_leaves': 69, 'min_child_samples': 12, 'colsample_bytree': 0.6858063002468717, 'subsample': 0.8944160724141117, 'reg_alpha': 0.010018047048982457, 'reg_lambda': 0.004287263957975249}. Best is trial 84 with value: 0.9475629069153616.


🏃 View run Trial_84_LightGBM_SMOTE_TFIDF_Trigrams at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216/runs/35c1e5d52dab472a94768d01c39056c0
🧪 View experiment at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216




[LightGBM] [Info] Number of positive: 12616, number of negative: 12616
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 1.408604 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 108854
[LightGBM] [Info] Number of data points in the train set: 25232, number of used features: 5268
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.500000 -> initscore=0.000000


[I 2025-03-08 03:50:42,464] Trial 85 finished with value: 0.9465071265176843 and parameters: {'n_estimators': 876, 'learning_rate': 0.09471306598560711, 'max_depth': 11, 'num_leaves': 68, 'min_child_samples': 13, 'colsample_bytree': 0.6868166664401362, 'subsample': 0.8765336068569968, 'reg_alpha': 0.00849242961206197, 'reg_lambda': 0.008132870507984313}. Best is trial 84 with value: 0.9475629069153616.


🏃 View run Trial_85_LightGBM_SMOTE_TFIDF_Trigrams at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216/runs/3d2ac7bc0bbc47be93b762bd1c29dcaa
🧪 View experiment at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216




[LightGBM] [Info] Number of positive: 12616, number of negative: 12616
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 2.601498 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 111143
[LightGBM] [Info] Number of data points in the train set: 25232, number of used features: 5726
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.500000 -> initscore=0.000000


[I 2025-03-08 03:51:35,824] Trial 86 finished with value: 0.9472109801161358 and parameters: {'n_estimators': 876, 'learning_rate': 0.09960142628434467, 'max_depth': 11, 'num_leaves': 69, 'min_child_samples': 12, 'colsample_bytree': 0.685446795967319, 'subsample': 0.8745247286735859, 'reg_alpha': 0.006279109007166167, 'reg_lambda': 0.016678444470603272}. Best is trial 84 with value: 0.9475629069153616.


🏃 View run Trial_86_LightGBM_SMOTE_TFIDF_Trigrams at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216/runs/fdcb302602824284b0a67335cccd563e
🧪 View experiment at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216




[LightGBM] [Info] Number of positive: 12616, number of negative: 12616
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 1.702681 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 111143
[LightGBM] [Info] Number of data points in the train set: 25232, number of used features: 5726
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.500000 -> initscore=0.000000


[I 2025-03-08 03:52:24,630] Trial 87 finished with value: 0.9477388703149745 and parameters: {'n_estimators': 857, 'learning_rate': 0.09658596309118676, 'max_depth': 11, 'num_leaves': 66, 'min_child_samples': 12, 'colsample_bytree': 0.6823042785803811, 'subsample': 0.875260206741876, 'reg_alpha': 0.00578804470654377, 'reg_lambda': 0.00847266911262021}. Best is trial 87 with value: 0.9477388703149745.


🏃 View run Trial_87_LightGBM_SMOTE_TFIDF_Trigrams at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216/runs/bd0f2499f08049dc84fe8dc5b2638792
🧪 View experiment at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216




[LightGBM] [Info] Number of positive: 12616, number of negative: 12616
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 2.196989 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 116828
[LightGBM] [Info] Number of data points in the train set: 25232, number of used features: 6864
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.500000 -> initscore=0.000000


[I 2025-03-08 03:53:21,880] Trial 88 finished with value: 0.9475629069153616 and parameters: {'n_estimators': 893, 'learning_rate': 0.09270286880745106, 'max_depth': 11, 'num_leaves': 69, 'min_child_samples': 10, 'colsample_bytree': 0.6696610534870643, 'subsample': 0.8791305848558533, 'reg_alpha': 0.006090530782770484, 'reg_lambda': 0.0078107769115813635}. Best is trial 87 with value: 0.9477388703149745.


🏃 View run Trial_88_LightGBM_SMOTE_TFIDF_Trigrams at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216/runs/a7627a955c1649f4b613a2fb6d8491e3
🧪 View experiment at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216




[LightGBM] [Info] Number of positive: 12616, number of negative: 12616
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 1.553357 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 108854
[LightGBM] [Info] Number of data points in the train set: 25232, number of used features: 5268
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.500000 -> initscore=0.000000


[I 2025-03-08 03:54:12,327] Trial 89 finished with value: 0.9445715291219426 and parameters: {'n_estimators': 882, 'learning_rate': 0.09856482736979436, 'max_depth': 11, 'num_leaves': 73, 'min_child_samples': 13, 'colsample_bytree': 0.6782791954351851, 'subsample': 0.8784896189009296, 'reg_alpha': 0.007226754673219566, 'reg_lambda': 0.008986041841056312}. Best is trial 87 with value: 0.9477388703149745.


🏃 View run Trial_89_LightGBM_SMOTE_TFIDF_Trigrams at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216/runs/bfb04d09965844dbb25acdf3b706f97a
🧪 View experiment at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216




[LightGBM] [Info] Number of positive: 12616, number of negative: 12616
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 1.614709 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 111143
[LightGBM] [Info] Number of data points in the train set: 25232, number of used features: 5726
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.500000 -> initscore=0.000000


[I 2025-03-08 03:55:01,451] Trial 90 finished with value: 0.9472109801161358 and parameters: {'n_estimators': 871, 'learning_rate': 0.09990718739093273, 'max_depth': 11, 'num_leaves': 73, 'min_child_samples': 12, 'colsample_bytree': 0.6786282417341033, 'subsample': 0.9370901277782514, 'reg_alpha': 0.01059350187263165, 'reg_lambda': 0.007717890681202928}. Best is trial 87 with value: 0.9477388703149745.


🏃 View run Trial_90_LightGBM_SMOTE_TFIDF_Trigrams at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216/runs/ed9b3121577347f694c607690145e0ed
🧪 View experiment at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216




[LightGBM] [Info] Number of positive: 12616, number of negative: 12616
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 1.651528 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 111143
[LightGBM] [Info] Number of data points in the train set: 25232, number of used features: 5726
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.500000 -> initscore=0.000000


[I 2025-03-08 03:55:52,808] Trial 91 finished with value: 0.9472109801161358 and parameters: {'n_estimators': 878, 'learning_rate': 0.09046719854486902, 'max_depth': 11, 'num_leaves': 73, 'min_child_samples': 12, 'colsample_bytree': 0.6811014571208067, 'subsample': 0.940117881903322, 'reg_alpha': 0.009739367497249777, 'reg_lambda': 0.00796611330443235}. Best is trial 87 with value: 0.9477388703149745.


🏃 View run Trial_91_LightGBM_SMOTE_TFIDF_Trigrams at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216/runs/db2195e579974585b062eea13ef8953b
🧪 View experiment at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216




[LightGBM] [Info] Number of positive: 12616, number of negative: 12616
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 1.151742 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 104753
[LightGBM] [Info] Number of data points in the train set: 25232, number of used features: 4583
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.500000 -> initscore=0.000000


[I 2025-03-08 03:57:04,449] Trial 92 finished with value: 0.786556396269576 and parameters: {'n_estimators': 874, 'learning_rate': 0.0006672875725121467, 'max_depth': 11, 'num_leaves': 78, 'min_child_samples': 15, 'colsample_bytree': 0.6266674182645665, 'subsample': 0.9293682017074434, 'reg_alpha': 0.01083502236859952, 'reg_lambda': 0.004572824514677665}. Best is trial 87 with value: 0.9477388703149745.


🏃 View run Trial_92_LightGBM_SMOTE_TFIDF_Trigrams at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216/runs/932951d3e47e4c929737a39909ce13dd
🧪 View experiment at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216




[LightGBM] [Info] Number of positive: 12616, number of negative: 12616
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 2.217762 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 111143
[LightGBM] [Info] Number of data points in the train set: 25232, number of used features: 5726
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.500000 -> initscore=0.000000


[I 2025-03-08 03:58:01,384] Trial 93 finished with value: 0.9399964807320077 and parameters: {'n_estimators': 945, 'learning_rate': 0.04557043926730073, 'max_depth': 11, 'num_leaves': 61, 'min_child_samples': 12, 'colsample_bytree': 0.7110026614133313, 'subsample': 0.9117653034555604, 'reg_alpha': 0.005250769703836534, 'reg_lambda': 0.02665218081476882}. Best is trial 87 with value: 0.9477388703149745.


🏃 View run Trial_93_LightGBM_SMOTE_TFIDF_Trigrams at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216/runs/3292ab6c367b4a8eabed369d6c018d0d
🧪 View experiment at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216




[LightGBM] [Info] Number of positive: 12616, number of negative: 12616
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 2.185243 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 116828
[LightGBM] [Info] Number of data points in the train set: 25232, number of used features: 6864
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.500000 -> initscore=0.000000


[I 2025-03-08 03:58:54,973] Trial 94 finished with value: 0.9419320781277495 and parameters: {'n_estimators': 858, 'learning_rate': 0.061347445591301175, 'max_depth': 10, 'num_leaves': 84, 'min_child_samples': 10, 'colsample_bytree': 0.638054405954124, 'subsample': 0.8702212133798224, 'reg_alpha': 0.003608203593676239, 'reg_lambda': 0.008200252861280394}. Best is trial 87 with value: 0.9477388703149745.


🏃 View run Trial_94_LightGBM_SMOTE_TFIDF_Trigrams at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216/runs/8694df8b7e444fd292a075dd5ab81829
🧪 View experiment at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216




[LightGBM] [Info] Number of positive: 12616, number of negative: 12616
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 1.193870 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 104753
[LightGBM] [Info] Number of data points in the train set: 25232, number of used features: 4583
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.500000 -> initscore=0.000000


[I 2025-03-08 03:59:48,764] Trial 95 finished with value: 0.9438676755234912 and parameters: {'n_estimators': 991, 'learning_rate': 0.09982386780624121, 'max_depth': 12, 'num_leaves': 71, 'min_child_samples': 15, 'colsample_bytree': 0.6804997188225606, 'subsample': 0.8338880431453346, 'reg_alpha': 0.00891885479861848, 'reg_lambda': 0.015216527555396282}. Best is trial 87 with value: 0.9477388703149745.


🏃 View run Trial_95_LightGBM_SMOTE_TFIDF_Trigrams at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216/runs/5611e780e12a43acaaff58fa526a2450
🧪 View experiment at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216




[LightGBM] [Info] Number of positive: 12616, number of negative: 12616
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 1.700730 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 111143
[LightGBM] [Info] Number of data points in the train set: 25232, number of used features: 5726
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.500000 -> initscore=0.000000


[I 2025-03-08 04:00:44,653] Trial 96 finished with value: 0.9443955657223297 and parameters: {'n_estimators': 917, 'learning_rate': 0.061386331402931295, 'max_depth': 11, 'num_leaves': 68, 'min_child_samples': 12, 'colsample_bytree': 0.6225445400783391, 'subsample': 0.9369396304791425, 'reg_alpha': 0.014373798836455716, 'reg_lambda': 0.0067628606799327385}. Best is trial 87 with value: 0.9477388703149745.


🏃 View run Trial_96_LightGBM_SMOTE_TFIDF_Trigrams at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216/runs/7912313186684cd3835490c16e031c3a
🧪 View experiment at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216




[LightGBM] [Info] Number of positive: 12616, number of negative: 12616
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 1.057955 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 102905
[LightGBM] [Info] Number of data points in the train set: 25232, number of used features: 4275
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.500000 -> initscore=0.000000


[I 2025-03-08 04:01:27,440] Trial 97 finished with value: 0.9415801513285237 and parameters: {'n_estimators': 834, 'learning_rate': 0.08461911657757787, 'max_depth': 10, 'num_leaves': 64, 'min_child_samples': 16, 'colsample_bytree': 0.6839731526587842, 'subsample': 0.9486721761326878, 'reg_alpha': 0.018314102126610797, 'reg_lambda': 0.020490016806279834}. Best is trial 87 with value: 0.9477388703149745.


🏃 View run Trial_97_LightGBM_SMOTE_TFIDF_Trigrams at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216/runs/2779341c1f1b4f6aa3f02b08eb7fbea8
🧪 View experiment at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216




[LightGBM] [Info] Number of positive: 12616, number of negative: 12616
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.155532 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 56695
[LightGBM] [Info] Number of data points in the train set: 25232, number of used features: 681
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.500000 -> initscore=0.000000


[I 2025-03-08 04:01:54,249] Trial 98 finished with value: 0.8572936829139539 and parameters: {'n_estimators': 900, 'learning_rate': 0.07176175718614825, 'max_depth': 11, 'num_leaves': 58, 'min_child_samples': 99, 'colsample_bytree': 0.6556951593311291, 'subsample': 0.9019000078122332, 'reg_alpha': 0.006005408513108251, 'reg_lambda': 0.011040050713003319}. Best is trial 87 with value: 0.9477388703149745.


🏃 View run Trial_98_LightGBM_SMOTE_TFIDF_Trigrams at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216/runs/ca53bb96be3d49b697d022e98ccb9e12
🧪 View experiment at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216




[LightGBM] [Info] Number of positive: 12616, number of negative: 12616
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 1.622551 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 111143
[LightGBM] [Info] Number of data points in the train set: 25232, number of used features: 5726
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.500000 -> initscore=0.000000


[I 2025-03-08 04:03:04,507] Trial 99 finished with value: 0.8310751363716347 and parameters: {'n_estimators': 954, 'learning_rate': 0.004500543910568219, 'max_depth': 9, 'num_leaves': 87, 'min_child_samples': 12, 'colsample_bytree': 0.7075268286695848, 'subsample': 0.8250470995493089, 'reg_alpha': 0.036428887830938624, 'reg_lambda': 0.040039639286588456}. Best is trial 87 with value: 0.9477388703149745.


🏃 View run Trial_99_LightGBM_SMOTE_TFIDF_Trigrams at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216/runs/436574d7924742a5b0ebfed2d6c12f34
🧪 View experiment at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216




[LightGBM] [Info] Number of positive: 12616, number of negative: 12616
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 1.765001 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 111143
[LightGBM] [Info] Number of data points in the train set: 25232, number of used features: 5726
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.500000 -> initscore=0.000000




🏃 View run Trial_Best_LightGBM_SMOTE_TFIDF_Trigrams at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216/runs/81ac30e030a04e0685dc2cdc5ed05358
🧪 View experiment at: http://ec2-100-26-36-125.compute-1.amazonaws.com:5000/#/experiments/621100004064027216
