In [29]:
import pandas as pd
import mlflow
from sklearn.model_selection import train_test_split
from sklearn.feature_extraction.text import TfidfVectorizer
import dagshub
dagshub.init(repo_owner='satyajeetrai007', repo_name='Youtube-Comment-Sentiment-Analysis', mlflow=True)
mlflow.set_experiment("Exp 8 - improving lightGBM")

<Experiment: artifact_location='mlflow-artifacts:/0f80bfb3ab1844079deb203b0e83ea1e', creation_time=1756303005428, experiment_id='8', last_update_time=1756303005428, lifecycle_stage='active', name='Exp 8 - improving lightGBM', tags={}>

In [30]:
dataset = dataset = pd.read_csv('data_preprocessed.csv')
cleaned_dataset = dataset.dropna().drop_duplicates()

In [31]:
# Separate features and target
X_cleaned = cleaned_dataset['clean_comment']
y_cleaned = cleaned_dataset['category']

In [32]:
# Split the cleaned data into train and test sets (80-20 split)
X_train_cleaned, X_test_cleaned, y_train_cleaned, y_test_cleaned = train_test_split(X_cleaned, y_cleaned, test_size=0.2, random_state=42)

In [33]:
# Apply TfidfVectorizer with trigram setting and max_features=1000
tfidf_cleaned = TfidfVectorizer(ngram_range=(1, 3), max_features=2000)

In [34]:
# Fit the vectorizer on the training data and transform both train and test sets
X_train_tfidf_cleaned = tfidf_cleaned.fit_transform(X_train_cleaned)
X_test_tfidf_cleaned = tfidf_cleaned.transform(X_test_cleaned)

In [35]:
import lightgbm as lgb
from sklearn.model_selection import train_test_split, cross_val_score
from sklearn.metrics import classification_report, accuracy_score
import optuna
import pickle

In [36]:
# Function to log results in MLflow
def log_mlflow(model_name, model, X_train, X_test, y_train, y_test, params, trial_number):
    with mlflow.start_run():
        # Log model type and trial number
        mlflow.set_tag("mlflow.runName", f"Trial_{trial_number}_{model_name}_class_weight_TFIDF_Trigrams")
        mlflow.set_tag("experiment_type", "algorithm_comparison")

        # Log algorithm name as a parameter
        mlflow.log_param("algo_name", model_name)

        # Log hyperparameters
        for key, value in params.items():
            mlflow.log_param(key, value)

        # Train model
        model.fit(X_train, y_train)
        y_pred = model.predict(X_test)

        # Log accuracy
        accuracy =  cross_val_score(model, X_train, y_train, cv=3, scoring='accuracy').mean()
        mlflow.log_metric("accuracy", accuracy)

        # Log classification report
        classification_rep = classification_report(y_test, y_pred, output_dict=True)
        for label, metrics in classification_rep.items():
            if isinstance(metrics, dict):
                for metric, value in metrics.items():
                    mlflow.log_metric(f"{label}_{metric}", value)

        # Save model artifact
        with open(f"{model_name}_model", "wb") as f:
            pickle.dump(model, f)
        mlflow.log_artifact(f"{model_name}_model", "model")
     
        return accuracy




In [37]:
# Function to optimize LightGBM hyperparameters
def objective(trial):
    # Define hyperparameters to be tuned
    param = {
        "objective": "multiclass",
        "num_class": 3,  # Assuming 3 categories (-1, 0, 1)
        "learning_rate": trial.suggest_float("learning_rate", 1e-3, 1e-1),
        "n_estimators": trial.suggest_int("n_estimators", 50, 500),
        "max_depth": trial.suggest_int("max_depth", 3, 20),
        "metric": "multi_logloss",
        "is_unbalance": True,
        "class_weight": "balanced",
    }

    # Define the LightGBM model with the trial parameters
    model = lgb.LGBMClassifier(**param)

    # Perform cross-validation
    accuracy = log_mlflow("LightGBM", model, X_train_tfidf_cleaned, X_test_tfidf_cleaned, y_train_cleaned, y_test_cleaned, param, trial.number)

    # Return the average score across folds
    return accuracy

In [38]:
# Create an Optuna study to optimize the hyperparameters
study = optuna.create_study(direction="maximize")
study.optimize(objective, n_trials=50)

[I 2025-08-28 00:12:40,320] A new study created in memory with name: no-name-e1e79383-a6be-492b-9b96-601806fe82ce


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.159890 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 102919
[LightGBM] [Info] Number of data points in the train set: 28994, number of used features: 1934
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.043942 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 72695
[LightGBM] [Info] Number of data points in the train set: 19329, number of used features: 1914
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.049363 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 73130
[LightGBM] [Info] Number of data points in the train set: 19329, number of used features: 1915
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.066311 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 72472
[LightGBM] [Info] Number of data points in the train set: 19330, number of used features: 1915
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




🏃 View run Trial_0_LightGBM_class_weight_TFIDF_Trigrams at: https://dagshub.com/satyajeetrai007/Youtube-Comment-Sentiment-Analysis.mlflow/#/experiments/8/runs/9dc018fcb65a4013b470857124b24a11
🧪 View experiment at: https://dagshub.com/satyajeetrai007/Youtube-Comment-Sentiment-Analysis.mlflow/#/experiments/8


[I 2025-08-28 00:14:09,830] Trial 0 finished with value: 0.810822847539368 and parameters: {'learning_rate': 0.07926046343658844, 'n_estimators': 171, 'max_depth': 12}. Best is trial 0 with value: 0.810822847539368.


[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.061564 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 102919
[LightGBM] [Info] Number of data points in the train set: 28994, number of used features: 1934
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.046743 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 72695
[LightGBM] [Info] Number of data points in the train set: 19329, number of used features: 1914
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.043192 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 73130
[LightGBM] [Info] Number of data points in the train set: 19329, number of used features: 1915
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.048485 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 72472
[LightGBM] [Info] Number of data points in the train set: 19330, number of used features: 1915
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




🏃 View run Trial_1_LightGBM_class_weight_TFIDF_Trigrams at: https://dagshub.com/satyajeetrai007/Youtube-Comment-Sentiment-Analysis.mlflow/#/experiments/8/runs/815a779569264da5a4c26cdbed7ec8de
🧪 View experiment at: https://dagshub.com/satyajeetrai007/Youtube-Comment-Sentiment-Analysis.mlflow/#/experiments/8


[I 2025-08-28 00:15:47,566] Trial 1 finished with value: 0.793508925237167 and parameters: {'learning_rate': 0.04473030193313525, 'n_estimators': 153, 'max_depth': 16}. Best is trial 0 with value: 0.810822847539368.


[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.315619 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 102919
[LightGBM] [Info] Number of data points in the train set: 28994, number of used features: 1934
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.174623 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 72695
[LightGBM] [Info] Number of data points in the train set: 19329, number of used features: 1914
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.188501 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 73130
[LightGBM] [Info] Number of data points in the train set: 19329, number of used features: 1915
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.189462 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 72472
[LightGBM] [Info] Number of data points in the train set: 19330, number of used features: 1915
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




🏃 View run Trial_2_LightGBM_class_weight_TFIDF_Trigrams at: https://dagshub.com/satyajeetrai007/Youtube-Comment-Sentiment-Analysis.mlflow/#/experiments/8/runs/b814d32aa28c4141a369ca07e1ce7c5e
🧪 View experiment at: https://dagshub.com/satyajeetrai007/Youtube-Comment-Sentiment-Analysis.mlflow/#/experiments/8


[I 2025-08-28 00:17:48,098] Trial 2 finished with value: 0.8015795248724089 and parameters: {'learning_rate': 0.058340491198963, 'n_estimators': 280, 'max_depth': 8}. Best is trial 0 with value: 0.810822847539368.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.294092 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 102919
[LightGBM] [Info] Number of data points in the train set: 28994, number of used features: 1934
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.210586 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 72695
[LightGBM] [Info] Number of data points in the train set: 19329, number of used features: 1914
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.174855 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 73130
[LightGBM] [Info] Number of data points in the train set: 19329, number of used features: 1915
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.179789 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 72472
[LightGBM] [Info] Number of data points in the train set: 19330, number of used features: 1915
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




🏃 View run Trial_3_LightGBM_class_weight_TFIDF_Trigrams at: https://dagshub.com/satyajeetrai007/Youtube-Comment-Sentiment-Analysis.mlflow/#/experiments/8/runs/9dd8fbe6b46f435dad518e85d3c5d0bc
🧪 View experiment at: https://dagshub.com/satyajeetrai007/Youtube-Comment-Sentiment-Analysis.mlflow/#/experiments/8


[I 2025-08-28 00:19:14,291] Trial 3 finished with value: 0.7668483854546743 and parameters: {'learning_rate': 0.09503152222272598, 'n_estimators': 169, 'max_depth': 4}. Best is trial 0 with value: 0.810822847539368.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.248297 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 102919
[LightGBM] [Info] Number of data points in the train set: 28994, number of used features: 1934
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.179452 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 72695
[LightGBM] [Info] Number of data points in the train set: 19329, number of used features: 1914
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.168440 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 73130
[LightGBM] [Info] Number of data points in the train set: 19329, number of used features: 1915
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.165934 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 72472
[LightGBM] [Info] Number of data points in the train set: 19330, number of used features: 1915
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




🏃 View run Trial_4_LightGBM_class_weight_TFIDF_Trigrams at: https://dagshub.com/satyajeetrai007/Youtube-Comment-Sentiment-Analysis.mlflow/#/experiments/8/runs/79b845cad47243c3bcbd31694fae71a6
🧪 View experiment at: https://dagshub.com/satyajeetrai007/Youtube-Comment-Sentiment-Analysis.mlflow/#/experiments/8


[I 2025-08-28 00:21:20,982] Trial 4 finished with value: 0.8177898585791795 and parameters: {'learning_rate': 0.06423936019109834, 'n_estimators': 182, 'max_depth': 18}. Best is trial 4 with value: 0.8177898585791795.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.262609 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 102919
[LightGBM] [Info] Number of data points in the train set: 28994, number of used features: 1934
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.211887 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 72695
[LightGBM] [Info] Number of data points in the train set: 19329, number of used features: 1914
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.228219 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 73130
[LightGBM] [Info] Number of data points in the train set: 19329, number of used features: 1915
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.217425 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 72472
[LightGBM] [Info] Number of data points in the train set: 19330, number of used features: 1915
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




🏃 View run Trial_5_LightGBM_class_weight_TFIDF_Trigrams at: https://dagshub.com/satyajeetrai007/Youtube-Comment-Sentiment-Analysis.mlflow/#/experiments/8/runs/5dc23e754ac84805bb7ecdcac63d0e62
🧪 View experiment at: https://dagshub.com/satyajeetrai007/Youtube-Comment-Sentiment-Analysis.mlflow/#/experiments/8


[I 2025-08-28 00:22:47,197] Trial 5 finished with value: 0.7461888268016067 and parameters: {'learning_rate': 0.06785598206163572, 'n_estimators': 216, 'max_depth': 3}. Best is trial 4 with value: 0.8177898585791795.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.286344 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 102919
[LightGBM] [Info] Number of data points in the train set: 28994, number of used features: 1934
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.207105 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 72695
[LightGBM] [Info] Number of data points in the train set: 19329, number of used features: 1914
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.214249 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 73130
[LightGBM] [Info] Number of data points in the train set: 19329, number of used features: 1915
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.204344 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 72472
[LightGBM] [Info] Number of data points in the train set: 19330, number of used features: 1915
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




🏃 View run Trial_6_LightGBM_class_weight_TFIDF_Trigrams at: https://dagshub.com/satyajeetrai007/Youtube-Comment-Sentiment-Analysis.mlflow/#/experiments/8/runs/74684ee05ce143a88197ab941ce86ff7
🧪 View experiment at: https://dagshub.com/satyajeetrai007/Youtube-Comment-Sentiment-Analysis.mlflow/#/experiments/8


[I 2025-08-28 00:24:27,762] Trial 6 finished with value: 0.789921960739977 and parameters: {'learning_rate': 0.08372333913654331, 'n_estimators': 204, 'max_depth': 6}. Best is trial 4 with value: 0.8177898585791795.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.294456 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 102919
[LightGBM] [Info] Number of data points in the train set: 28994, number of used features: 1934
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.223392 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 72695
[LightGBM] [Info] Number of data points in the train set: 19329, number of used features: 1914
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.179828 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 73130
[LightGBM] [Info] Number of data points in the train set: 19329, number of used features: 1915
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.219145 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 72472
[LightGBM] [Info] Number of data points in the train set: 19330, number of used features: 1915
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




🏃 View run Trial_7_LightGBM_class_weight_TFIDF_Trigrams at: https://dagshub.com/satyajeetrai007/Youtube-Comment-Sentiment-Analysis.mlflow/#/experiments/8/runs/8fb72e3ee3344a539d72f556ca377d61
🧪 View experiment at: https://dagshub.com/satyajeetrai007/Youtube-Comment-Sentiment-Analysis.mlflow/#/experiments/8


[I 2025-08-28 00:26:14,142] Trial 7 finished with value: 0.7861626062497645 and parameters: {'learning_rate': 0.05174425533277856, 'n_estimators': 150, 'max_depth': 12}. Best is trial 4 with value: 0.8177898585791795.


[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.284267 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 102919
[LightGBM] [Info] Number of data points in the train set: 28994, number of used features: 1934
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.227250 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 72695
[LightGBM] [Info] Number of data points in the train set: 19329, number of used features: 1914
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.221946 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 73130
[LightGBM] [Info] Number of data points in the train set: 19329, number of used features: 1915
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.244734 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 72472
[LightGBM] [Info] Number of data points in the train set: 19330, number of used features: 1915
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




🏃 View run Trial_8_LightGBM_class_weight_TFIDF_Trigrams at: https://dagshub.com/satyajeetrai007/Youtube-Comment-Sentiment-Analysis.mlflow/#/experiments/8/runs/527c76ef300041c9be1c896ee067cc28
🧪 View experiment at: https://dagshub.com/satyajeetrai007/Youtube-Comment-Sentiment-Analysis.mlflow/#/experiments/8


[I 2025-08-28 00:28:21,974] Trial 8 finished with value: 0.8146167763852867 and parameters: {'learning_rate': 0.07037961275214918, 'n_estimators': 304, 'max_depth': 9}. Best is trial 4 with value: 0.8177898585791795.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.244925 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 102919
[LightGBM] [Info] Number of data points in the train set: 28994, number of used features: 1934
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.215809 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 72695
[LightGBM] [Info] Number of data points in the train set: 19329, number of used features: 1914
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.206668 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 73130
[LightGBM] [Info] Number of data points in the train set: 19329, number of used features: 1915
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.210980 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 72472
[LightGBM] [Info] Number of data points in the train set: 19330, number of used features: 1915
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




🏃 View run Trial_9_LightGBM_class_weight_TFIDF_Trigrams at: https://dagshub.com/satyajeetrai007/Youtube-Comment-Sentiment-Analysis.mlflow/#/experiments/8/runs/48df1a7a713c4ee08583ab8f9a21ab02
🧪 View experiment at: https://dagshub.com/satyajeetrai007/Youtube-Comment-Sentiment-Analysis.mlflow/#/experiments/8


[I 2025-08-28 00:29:48,488] Trial 9 finished with value: 0.7638822925909811 and parameters: {'learning_rate': 0.08604786139713247, 'n_estimators': 77, 'max_depth': 9}. Best is trial 4 with value: 0.8177898585791795.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.333972 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 102919
[LightGBM] [Info] Number of data points in the train set: 28994, number of used features: 1934
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.238647 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 72695
[LightGBM] [Info] Number of data points in the train set: 19329, number of used features: 1914
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.250933 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 73130
[LightGBM] [Info] Number of data points in the train set: 19329, number of used features: 1915
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.196628 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 72472
[LightGBM] [Info] Number of data points in the train set: 19330, number of used features: 1915
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




🏃 View run Trial_10_LightGBM_class_weight_TFIDF_Trigrams at: https://dagshub.com/satyajeetrai007/Youtube-Comment-Sentiment-Analysis.mlflow/#/experiments/8/runs/dd971b9c038141c99913945a329344c5
🧪 View experiment at: https://dagshub.com/satyajeetrai007/Youtube-Comment-Sentiment-Analysis.mlflow/#/experiments/8


[I 2025-08-28 00:33:05,889] Trial 10 finished with value: 0.8009242573222832 and parameters: {'learning_rate': 0.016539979510507626, 'n_estimators': 410, 'max_depth': 20}. Best is trial 4 with value: 0.8177898585791795.


[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.287998 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 102919
[LightGBM] [Info] Number of data points in the train set: 28994, number of used features: 1934
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.180010 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 72695
[LightGBM] [Info] Number of data points in the train set: 19329, number of used features: 1914
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.219004 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 73130
[LightGBM] [Info] Number of data points in the train set: 19329, number of used features: 1915
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.231171 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 72472
[LightGBM] [Info] Number of data points in the train set: 19330, number of used features: 1915
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




🏃 View run Trial_11_LightGBM_class_weight_TFIDF_Trigrams at: https://dagshub.com/satyajeetrai007/Youtube-Comment-Sentiment-Analysis.mlflow/#/experiments/8/runs/0895b4d41ede4dc4b238c17d24f7a9be
🧪 View experiment at: https://dagshub.com/satyajeetrai007/Youtube-Comment-Sentiment-Analysis.mlflow/#/experiments/8


[I 2025-08-28 00:35:49,716] Trial 11 finished with value: 0.8119265396294634 and parameters: {'learning_rate': 0.031050080090692097, 'n_estimators': 344, 'max_depth': 16}. Best is trial 4 with value: 0.8177898585791795.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.307845 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 102919
[LightGBM] [Info] Number of data points in the train set: 28994, number of used features: 1934
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.219934 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 72695
[LightGBM] [Info] Number of data points in the train set: 19329, number of used features: 1914
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.204448 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 73130
[LightGBM] [Info] Number of data points in the train set: 19329, number of used features: 1915
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.350100 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 72472
[LightGBM] [Info] Number of data points in the train set: 19330, number of used features: 1915
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




🏃 View run Trial_12_LightGBM_class_weight_TFIDF_Trigrams at: https://dagshub.com/satyajeetrai007/Youtube-Comment-Sentiment-Analysis.mlflow/#/experiments/8/runs/43923c4b424d4efa84c501dd0089e1cc
🧪 View experiment at: https://dagshub.com/satyajeetrai007/Youtube-Comment-Sentiment-Analysis.mlflow/#/experiments/8


[I 2025-08-28 00:39:15,554] Trial 12 finished with value: 0.8266193203555305 and parameters: {'learning_rate': 0.06960701888815397, 'n_estimators': 465, 'max_depth': 20}. Best is trial 12 with value: 0.8266193203555305.


[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.061291 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 102919
[LightGBM] [Info] Number of data points in the train set: 28994, number of used features: 1934
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.044249 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 72695
[LightGBM] [Info] Number of data points in the train set: 19329, number of used features: 1914
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.119644 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 73130
[LightGBM] [Info] Number of data points in the train set: 19329, number of used features: 1915
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.049608 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 72472
[LightGBM] [Info] Number of data points in the train set: 19330, number of used features: 1915
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




🏃 View run Trial_13_LightGBM_class_weight_TFIDF_Trigrams at: https://dagshub.com/satyajeetrai007/Youtube-Comment-Sentiment-Analysis.mlflow/#/experiments/8/runs/a1f945c11b5a4bb19a3398681051c0fd
🧪 View experiment at: https://dagshub.com/satyajeetrai007/Youtube-Comment-Sentiment-Analysis.mlflow/#/experiments/8


[I 2025-08-28 00:42:12,077] Trial 13 finished with value: 0.7072152233657549 and parameters: {'learning_rate': 0.001816383225259774, 'n_estimators': 499, 'max_depth': 20}. Best is trial 12 with value: 0.8266193203555305.


[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.220402 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 102919
[LightGBM] [Info] Number of data points in the train set: 28994, number of used features: 1934
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.149673 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 72695
[LightGBM] [Info] Number of data points in the train set: 19329, number of used features: 1914
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.153539 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 73130
[LightGBM] [Info] Number of data points in the train set: 19329, number of used features: 1915
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.209670 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 72472
[LightGBM] [Info] Number of data points in the train set: 19330, number of used features: 1915
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




🏃 View run Trial_14_LightGBM_class_weight_TFIDF_Trigrams at: https://dagshub.com/satyajeetrai007/Youtube-Comment-Sentiment-Analysis.mlflow/#/experiments/8/runs/496404252ec84fcca57a42cc22e6a50d
🧪 View experiment at: https://dagshub.com/satyajeetrai007/Youtube-Comment-Sentiment-Analysis.mlflow/#/experiments/8


[I 2025-08-28 00:45:35,878] Trial 14 finished with value: 0.8280333858086973 and parameters: {'learning_rate': 0.040988928680440365, 'n_estimators': 496, 'max_depth': 17}. Best is trial 14 with value: 0.8280333858086973.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.233145 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 102919
[LightGBM] [Info] Number of data points in the train set: 28994, number of used features: 1934
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.198381 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 72695
[LightGBM] [Info] Number of data points in the train set: 19329, number of used features: 1914
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.197680 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 73130
[LightGBM] [Info] Number of data points in the train set: 19329, number of used features: 1915
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.162287 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 72472
[LightGBM] [Info] Number of data points in the train set: 19330, number of used features: 1915
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




🏃 View run Trial_15_LightGBM_class_weight_TFIDF_Trigrams at: https://dagshub.com/satyajeetrai007/Youtube-Comment-Sentiment-Analysis.mlflow/#/experiments/8/runs/df230287ac334fcf8cc2516e90dfde12
🧪 View experiment at: https://dagshub.com/satyajeetrai007/Youtube-Comment-Sentiment-Analysis.mlflow/#/experiments/8


[I 2025-08-28 00:48:55,628] Trial 15 finished with value: 0.8182381938996105 and parameters: {'learning_rate': 0.02869381724460232, 'n_estimators': 496, 'max_depth': 15}. Best is trial 14 with value: 0.8280333858086973.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.232222 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 102919
[LightGBM] [Info] Number of data points in the train set: 28994, number of used features: 1934
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.169761 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 72695
[LightGBM] [Info] Number of data points in the train set: 19329, number of used features: 1914
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.193933 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 73130
[LightGBM] [Info] Number of data points in the train set: 19329, number of used features: 1915
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.184066 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 72472
[LightGBM] [Info] Number of data points in the train set: 19330, number of used features: 1915
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




🏃 View run Trial_16_LightGBM_class_weight_TFIDF_Trigrams at: https://dagshub.com/satyajeetrai007/Youtube-Comment-Sentiment-Analysis.mlflow/#/experiments/8/runs/7aa4f347bf0d4fc7b516881616f1a71f
🧪 View experiment at: https://dagshub.com/satyajeetrai007/Youtube-Comment-Sentiment-Analysis.mlflow/#/experiments/8


[I 2025-08-28 00:52:00,788] Trial 16 finished with value: 0.8281023667873771 and parameters: {'learning_rate': 0.04279475156611265, 'n_estimators': 431, 'max_depth': 18}. Best is trial 16 with value: 0.8281023667873771.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.152433 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 102919
[LightGBM] [Info] Number of data points in the train set: 28994, number of used features: 1934
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.039009 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 72695
[LightGBM] [Info] Number of data points in the train set: 19329, number of used features: 1914
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.045202 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 73130
[LightGBM] [Info] Number of data points in the train set: 19329, number of used features: 1915
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.044381 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 72472
[LightGBM] [Info] Number of data points in the train set: 19330, number of used features: 1915
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




🏃 View run Trial_17_LightGBM_class_weight_TFIDF_Trigrams at: https://dagshub.com/satyajeetrai007/Youtube-Comment-Sentiment-Analysis.mlflow/#/experiments/8/runs/81e3455b3a8b42318dd54087aa4cbbb4
🧪 View experiment at: https://dagshub.com/satyajeetrai007/Youtube-Comment-Sentiment-Analysis.mlflow/#/experiments/8


[I 2025-08-28 00:54:03,521] Trial 17 finished with value: 0.8189969953714331 and parameters: {'learning_rate': 0.03964517131386423, 'n_estimators': 397, 'max_depth': 14}. Best is trial 16 with value: 0.8281023667873771.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.058033 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 102919
[LightGBM] [Info] Number of data points in the train set: 28994, number of used features: 1934
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.043959 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 72695
[LightGBM] [Info] Number of data points in the train set: 19329, number of used features: 1914
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.051216 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 73130
[LightGBM] [Info] Number of data points in the train set: 19329, number of used features: 1915
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.049607 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 72472
[LightGBM] [Info] Number of data points in the train set: 19330, number of used features: 1915
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




🏃 View run Trial_18_LightGBM_class_weight_TFIDF_Trigrams at: https://dagshub.com/satyajeetrai007/Youtube-Comment-Sentiment-Analysis.mlflow/#/experiments/8/runs/33e9bea2d8774e07b1214c1042234ab4
🧪 View experiment at: https://dagshub.com/satyajeetrai007/Youtube-Comment-Sentiment-Analysis.mlflow/#/experiments/8


[I 2025-08-28 00:56:20,807] Trial 18 finished with value: 0.8068910209741574 and parameters: {'learning_rate': 0.01992170764803433, 'n_estimators': 424, 'max_depth': 18}. Best is trial 16 with value: 0.8281023667873771.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.085124 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 102919
[LightGBM] [Info] Number of data points in the train set: 28994, number of used features: 1934
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.043441 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 72695
[LightGBM] [Info] Number of data points in the train set: 19329, number of used features: 1914
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.051305 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 73130
[LightGBM] [Info] Number of data points in the train set: 19329, number of used features: 1915
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.045774 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 72472
[LightGBM] [Info] Number of data points in the train set: 19330, number of used features: 1915
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




🏃 View run Trial_19_LightGBM_class_weight_TFIDF_Trigrams at: https://dagshub.com/satyajeetrai007/Youtube-Comment-Sentiment-Analysis.mlflow/#/experiments/8/runs/35e1230e002240349d6f628c6c1c5d79
🧪 View experiment at: https://dagshub.com/satyajeetrai007/Youtube-Comment-Sentiment-Analysis.mlflow/#/experiments/8


[I 2025-08-28 00:58:28,678] Trial 19 finished with value: 0.8231702892654478 and parameters: {'learning_rate': 0.039573713294722646, 'n_estimators': 356, 'max_depth': 18}. Best is trial 16 with value: 0.8281023667873771.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.136522 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 102919
[LightGBM] [Info] Number of data points in the train set: 28994, number of used features: 1934
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.051610 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 72695
[LightGBM] [Info] Number of data points in the train set: 19329, number of used features: 1914
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.091737 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 73130
[LightGBM] [Info] Number of data points in the train set: 19329, number of used features: 1915
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.076336 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 72472
[LightGBM] [Info] Number of data points in the train set: 19330, number of used features: 1915
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




🏃 View run Trial_20_LightGBM_class_weight_TFIDF_Trigrams at: https://dagshub.com/satyajeetrai007/Youtube-Comment-Sentiment-Analysis.mlflow/#/experiments/8/runs/86e364c1d4de4b34baf86c7cb20173ad
🧪 View experiment at: https://dagshub.com/satyajeetrai007/Youtube-Comment-Sentiment-Analysis.mlflow/#/experiments/8


[I 2025-08-28 01:01:05,475] Trial 20 finished with value: 0.7844036144905093 and parameters: {'learning_rate': 0.014507044189325663, 'n_estimators': 447, 'max_depth': 14}. Best is trial 16 with value: 0.8281023667873771.


[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.245379 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 102919
[LightGBM] [Info] Number of data points in the train set: 28994, number of used features: 1934
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.185754 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 72695
[LightGBM] [Info] Number of data points in the train set: 19329, number of used features: 1914
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.195506 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 73130
[LightGBM] [Info] Number of data points in the train set: 19329, number of used features: 1915
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.191357 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 72472
[LightGBM] [Info] Number of data points in the train set: 19330, number of used features: 1915
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




🏃 View run Trial_21_LightGBM_class_weight_TFIDF_Trigrams at: https://dagshub.com/satyajeetrai007/Youtube-Comment-Sentiment-Analysis.mlflow/#/experiments/8/runs/b6e6fa863eb54f73a91b9f92fbe5b2e5
🧪 View experiment at: https://dagshub.com/satyajeetrai007/Youtube-Comment-Sentiment-Analysis.mlflow/#/experiments/8


[I 2025-08-28 01:04:30,786] Trial 21 finished with value: 0.8276885273094585 and parameters: {'learning_rate': 0.053531106849084825, 'n_estimators': 462, 'max_depth': 20}. Best is trial 16 with value: 0.8281023667873771.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.060639 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 102919
[LightGBM] [Info] Number of data points in the train set: 28994, number of used features: 1934
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.048131 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 72695
[LightGBM] [Info] Number of data points in the train set: 19329, number of used features: 1914
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.048053 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 73130
[LightGBM] [Info] Number of data points in the train set: 19329, number of used features: 1915
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.291714 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 72472
[LightGBM] [Info] Number of data points in the train set: 19330, number of used features: 1915
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




🏃 View run Trial_22_LightGBM_class_weight_TFIDF_Trigrams at: https://dagshub.com/satyajeetrai007/Youtube-Comment-Sentiment-Analysis.mlflow/#/experiments/8/runs/1b8995c7028b4d66b5158b1014f40430
🧪 View experiment at: https://dagshub.com/satyajeetrai007/Youtube-Comment-Sentiment-Analysis.mlflow/#/experiments/8


[I 2025-08-28 01:07:03,585] Trial 22 finished with value: 0.8271021800687262 and parameters: {'learning_rate': 0.05104854292978403, 'n_estimators': 375, 'max_depth': 17}. Best is trial 16 with value: 0.8281023667873771.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.260168 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 102919
[LightGBM] [Info] Number of data points in the train set: 28994, number of used features: 1934
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.189079 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 72695
[LightGBM] [Info] Number of data points in the train set: 19329, number of used features: 1914
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.126463 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 73130
[LightGBM] [Info] Number of data points in the train set: 19329, number of used features: 1915
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.177323 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 72472
[LightGBM] [Info] Number of data points in the train set: 19330, number of used features: 1915
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




🏃 View run Trial_23_LightGBM_class_weight_TFIDF_Trigrams at: https://dagshub.com/satyajeetrai007/Youtube-Comment-Sentiment-Analysis.mlflow/#/experiments/8/runs/35d84deb0ae748cbb23045bc97b8ed28
🧪 View experiment at: https://dagshub.com/satyajeetrai007/Youtube-Comment-Sentiment-Analysis.mlflow/#/experiments/8


[I 2025-08-28 01:10:22,648] Trial 23 finished with value: 0.8248947994573168 and parameters: {'learning_rate': 0.03319038481021922, 'n_estimators': 442, 'max_depth': 19}. Best is trial 16 with value: 0.8281023667873771.


[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.342303 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 102919
[LightGBM] [Info] Number of data points in the train set: 28994, number of used features: 1934
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.050349 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 72695
[LightGBM] [Info] Number of data points in the train set: 19329, number of used features: 1914
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.074182 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 73130
[LightGBM] [Info] Number of data points in the train set: 19329, number of used features: 1915
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.062027 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 72472
[LightGBM] [Info] Number of data points in the train set: 19330, number of used features: 1915
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




🏃 View run Trial_24_LightGBM_class_weight_TFIDF_Trigrams at: https://dagshub.com/satyajeetrai007/Youtube-Comment-Sentiment-Analysis.mlflow/#/experiments/8/runs/314fe36076de462a9f9df77d4d7aaefd
🧪 View experiment at: https://dagshub.com/satyajeetrai007/Youtube-Comment-Sentiment-Analysis.mlflow/#/experiments/8


[I 2025-08-28 01:12:57,780] Trial 24 finished with value: 0.8280334179277314 and parameters: {'learning_rate': 0.056236052858868714, 'n_estimators': 469, 'max_depth': 16}. Best is trial 16 with value: 0.8281023667873771.


[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.262518 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 102919
[LightGBM] [Info] Number of data points in the train set: 28994, number of used features: 1934
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.051248 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 72695
[LightGBM] [Info] Number of data points in the train set: 19329, number of used features: 1914
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.184563 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 73130
[LightGBM] [Info] Number of data points in the train set: 19329, number of used features: 1915
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.185682 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 72472
[LightGBM] [Info] Number of data points in the train set: 19330, number of used features: 1915
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




🏃 View run Trial_25_LightGBM_class_weight_TFIDF_Trigrams at: https://dagshub.com/satyajeetrai007/Youtube-Comment-Sentiment-Analysis.mlflow/#/experiments/8/runs/d8f31f271a754ce5a4e88f495e719a5a
🧪 View experiment at: https://dagshub.com/satyajeetrai007/Youtube-Comment-Sentiment-Analysis.mlflow/#/experiments/8


[I 2025-08-28 01:15:27,018] Trial 25 finished with value: 0.8169965220082475 and parameters: {'learning_rate': 0.044842231033274386, 'n_estimators': 327, 'max_depth': 14}. Best is trial 16 with value: 0.8281023667873771.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.329762 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 102919
[LightGBM] [Info] Number of data points in the train set: 28994, number of used features: 1934
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.059179 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 72695
[LightGBM] [Info] Number of data points in the train set: 19329, number of used features: 1914
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.043245 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 73130
[LightGBM] [Info] Number of data points in the train set: 19329, number of used features: 1915
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.048933 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 72472
[LightGBM] [Info] Number of data points in the train set: 19330, number of used features: 1915
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




🏃 View run Trial_26_LightGBM_class_weight_TFIDF_Trigrams at: https://dagshub.com/satyajeetrai007/Youtube-Comment-Sentiment-Analysis.mlflow/#/experiments/8/runs/cbfecc7732e146d9bdf58c4029ec14db
🧪 View experiment at: https://dagshub.com/satyajeetrai007/Youtube-Comment-Sentiment-Analysis.mlflow/#/experiments/8


[I 2025-08-28 01:18:02,900] Trial 26 finished with value: 0.8272056640274813 and parameters: {'learning_rate': 0.06165188178731902, 'n_estimators': 481, 'max_depth': 16}. Best is trial 16 with value: 0.8281023667873771.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.098475 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 102919
[LightGBM] [Info] Number of data points in the train set: 28994, number of used features: 1934
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.052146 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 72695
[LightGBM] [Info] Number of data points in the train set: 19329, number of used features: 1914
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.093800 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 73130
[LightGBM] [Info] Number of data points in the train set: 19329, number of used features: 1915
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.171442 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 72472
[LightGBM] [Info] Number of data points in the train set: 19330, number of used features: 1915
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




🏃 View run Trial_27_LightGBM_class_weight_TFIDF_Trigrams at: https://dagshub.com/satyajeetrai007/Youtube-Comment-Sentiment-Analysis.mlflow/#/experiments/8/runs/a2530d327dff4f49827b62551d2e6c2e
🧪 View experiment at: https://dagshub.com/satyajeetrai007/Youtube-Comment-Sentiment-Analysis.mlflow/#/experiments/8


[I 2025-08-28 01:20:30,913] Trial 27 finished with value: 0.7964405757900712 and parameters: {'learning_rate': 0.02266640795337822, 'n_estimators': 394, 'max_depth': 13}. Best is trial 16 with value: 0.8281023667873771.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.066253 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 102919
[LightGBM] [Info] Number of data points in the train set: 28994, number of used features: 1934
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.223016 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 72695
[LightGBM] [Info] Number of data points in the train set: 19329, number of used features: 1914
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.172724 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 73130
[LightGBM] [Info] Number of data points in the train set: 19329, number of used features: 1915
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.065728 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 72472
[LightGBM] [Info] Number of data points in the train set: 19330, number of used features: 1915
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




🏃 View run Trial_28_LightGBM_class_weight_TFIDF_Trigrams at: https://dagshub.com/satyajeetrai007/Youtube-Comment-Sentiment-Analysis.mlflow/#/experiments/8/runs/64e90e8cd18e4cc7a73c6d2092d679c4
🧪 View experiment at: https://dagshub.com/satyajeetrai007/Youtube-Comment-Sentiment-Analysis.mlflow/#/experiments/8


[I 2025-08-28 01:23:28,820] Trial 28 finished with value: 0.8273435831594623 and parameters: {'learning_rate': 0.04444952129441469, 'n_estimators': 429, 'max_depth': 17}. Best is trial 16 with value: 0.8281023667873771.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.174984 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 102919
[LightGBM] [Info] Number of data points in the train set: 28994, number of used features: 1934
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.065717 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 72695
[LightGBM] [Info] Number of data points in the train set: 19329, number of used features: 1914
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.041188 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 73130
[LightGBM] [Info] Number of data points in the train set: 19329, number of used features: 1915
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.052944 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 72472
[LightGBM] [Info] Number of data points in the train set: 19330, number of used features: 1915
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




🏃 View run Trial_29_LightGBM_class_weight_TFIDF_Trigrams at: https://dagshub.com/satyajeetrai007/Youtube-Comment-Sentiment-Analysis.mlflow/#/experiments/8/runs/251fbe807b5a44d39cf43f2991371d9a
🧪 View experiment at: https://dagshub.com/satyajeetrai007/Youtube-Comment-Sentiment-Analysis.mlflow/#/experiments/8


[I 2025-08-28 01:25:43,469] Trial 29 finished with value: 0.8268262739979146 and parameters: {'learning_rate': 0.07458319788832904, 'n_estimators': 476, 'max_depth': 11}. Best is trial 16 with value: 0.8281023667873771.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.229257 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 102919
[LightGBM] [Info] Number of data points in the train set: 28994, number of used features: 1934
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.260648 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 72695
[LightGBM] [Info] Number of data points in the train set: 19329, number of used features: 1914
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.191821 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 73130
[LightGBM] [Info] Number of data points in the train set: 19329, number of used features: 1915
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.054699 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 72472
[LightGBM] [Info] Number of data points in the train set: 19330, number of used features: 1915
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




🏃 View run Trial_30_LightGBM_class_weight_TFIDF_Trigrams at: https://dagshub.com/satyajeetrai007/Youtube-Comment-Sentiment-Analysis.mlflow/#/experiments/8/runs/ade347115fbb491ab9222d8b6e56f119
🧪 View experiment at: https://dagshub.com/satyajeetrai007/Youtube-Comment-Sentiment-Analysis.mlflow/#/experiments/8


[I 2025-08-28 01:28:06,257] Trial 30 finished with value: 0.8187210714567138 and parameters: {'learning_rate': 0.05634760874035961, 'n_estimators': 367, 'max_depth': 11}. Best is trial 16 with value: 0.8281023667873771.


[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.279829 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 102919
[LightGBM] [Info] Number of data points in the train set: 28994, number of used features: 1934
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.201007 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 72695
[LightGBM] [Info] Number of data points in the train set: 19329, number of used features: 1914
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.200525 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 73130
[LightGBM] [Info] Number of data points in the train set: 19329, number of used features: 1915
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.194265 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 72472
[LightGBM] [Info] Number of data points in the train set: 19330, number of used features: 1915
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




🏃 View run Trial_31_LightGBM_class_weight_TFIDF_Trigrams at: https://dagshub.com/satyajeetrai007/Youtube-Comment-Sentiment-Analysis.mlflow/#/experiments/8/runs/48a8a7c83897424db52c5fbde5887f24
🧪 View experiment at: https://dagshub.com/satyajeetrai007/Youtube-Comment-Sentiment-Analysis.mlflow/#/experiments/8


[I 2025-08-28 01:31:25,393] Trial 31 finished with value: 0.8283782978396594 and parameters: {'learning_rate': 0.053823120473495044, 'n_estimators': 459, 'max_depth': 19}. Best is trial 31 with value: 0.8283782978396594.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.314007 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 102919
[LightGBM] [Info] Number of data points in the train set: 28994, number of used features: 1934
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.052116 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 72695
[LightGBM] [Info] Number of data points in the train set: 19329, number of used features: 1914
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.057356 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 73130
[LightGBM] [Info] Number of data points in the train set: 19329, number of used features: 1915
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.048444 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 72472
[LightGBM] [Info] Number of data points in the train set: 19330, number of used features: 1915
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




🏃 View run Trial_32_LightGBM_class_weight_TFIDF_Trigrams at: https://dagshub.com/satyajeetrai007/Youtube-Comment-Sentiment-Analysis.mlflow/#/experiments/8/runs/a396b3ac154942d4998375b66ab02afa
🧪 View experiment at: https://dagshub.com/satyajeetrai007/Youtube-Comment-Sentiment-Analysis.mlflow/#/experiments/8


[I 2025-08-28 01:34:00,416] Trial 32 finished with value: 0.8256190979490641 and parameters: {'learning_rate': 0.03909286185116231, 'n_estimators': 448, 'max_depth': 17}. Best is trial 31 with value: 0.8283782978396594.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.095842 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 102919
[LightGBM] [Info] Number of data points in the train set: 28994, number of used features: 1934
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.044231 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 72695
[LightGBM] [Info] Number of data points in the train set: 19329, number of used features: 1914
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.067844 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 73130
[LightGBM] [Info] Number of data points in the train set: 19329, number of used features: 1915
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.047991 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 72472
[LightGBM] [Info] Number of data points in the train set: 19330, number of used features: 1915
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




🏃 View run Trial_33_LightGBM_class_weight_TFIDF_Trigrams at: https://dagshub.com/satyajeetrai007/Youtube-Comment-Sentiment-Analysis.mlflow/#/experiments/8/runs/24830eaf62624dca9e79839e7f29c7e1
🧪 View experiment at: https://dagshub.com/satyajeetrai007/Youtube-Comment-Sentiment-Analysis.mlflow/#/experiments/8


[I 2025-08-28 01:36:39,755] Trial 33 finished with value: 0.8289646486491734 and parameters: {'learning_rate': 0.046521491543330344, 'n_estimators': 499, 'max_depth': 19}. Best is trial 33 with value: 0.8289646486491734.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.111020 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 102919
[LightGBM] [Info] Number of data points in the train set: 28994, number of used features: 1934
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.056735 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 72695
[LightGBM] [Info] Number of data points in the train set: 19329, number of used features: 1914
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.090965 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 73130
[LightGBM] [Info] Number of data points in the train set: 19329, number of used features: 1915
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.055676 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 72472
[LightGBM] [Info] Number of data points in the train set: 19330, number of used features: 1915
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




🏃 View run Trial_34_LightGBM_class_weight_TFIDF_Trigrams at: https://dagshub.com/satyajeetrai007/Youtube-Comment-Sentiment-Analysis.mlflow/#/experiments/8/runs/8aa4aff48417422d9865fd9330e42674
🧪 View experiment at: https://dagshub.com/satyajeetrai007/Youtube-Comment-Sentiment-Analysis.mlflow/#/experiments/8


[I 2025-08-28 01:38:33,752] Trial 34 finished with value: 0.8209974187716768 and parameters: {'learning_rate': 0.04814887490853537, 'n_estimators': 256, 'max_depth': 19}. Best is trial 33 with value: 0.8289646486491734.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.061782 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 102919
[LightGBM] [Info] Number of data points in the train set: 28994, number of used features: 1934
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.061077 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 72695
[LightGBM] [Info] Number of data points in the train set: 19329, number of used features: 1914
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.041940 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 73130
[LightGBM] [Info] Number of data points in the train set: 19329, number of used features: 1915
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.043909 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 72472
[LightGBM] [Info] Number of data points in the train set: 19330, number of used features: 1915
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




🏃 View run Trial_35_LightGBM_class_weight_TFIDF_Trigrams at: https://dagshub.com/satyajeetrai007/Youtube-Comment-Sentiment-Analysis.mlflow/#/experiments/8/runs/b03191d63015492db08be41d3bf047a5
🧪 View experiment at: https://dagshub.com/satyajeetrai007/Youtube-Comment-Sentiment-Analysis.mlflow/#/experiments/8


[I 2025-08-28 01:40:45,902] Trial 35 finished with value: 0.8275160766471497 and parameters: {'learning_rate': 0.06184630291136581, 'n_estimators': 412, 'max_depth': 19}. Best is trial 33 with value: 0.8289646486491734.


[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.058242 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 102919
[LightGBM] [Info] Number of data points in the train set: 28994, number of used features: 1934
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.039808 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 72695
[LightGBM] [Info] Number of data points in the train set: 19329, number of used features: 1914
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.041058 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 73130
[LightGBM] [Info] Number of data points in the train set: 19329, number of used features: 1915
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.067287 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 72472
[LightGBM] [Info] Number of data points in the train set: 19330, number of used features: 1915
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




🏃 View run Trial_36_LightGBM_class_weight_TFIDF_Trigrams at: https://dagshub.com/satyajeetrai007/Youtube-Comment-Sentiment-Analysis.mlflow/#/experiments/8/runs/dfb6b76751694b56a46f925fd25da72e
🧪 View experiment at: https://dagshub.com/satyajeetrai007/Youtube-Comment-Sentiment-Analysis.mlflow/#/experiments/8


[I 2025-08-28 01:42:57,449] Trial 36 finished with value: 0.8278265142482889 and parameters: {'learning_rate': 0.05793342975451545, 'n_estimators': 452, 'max_depth': 15}. Best is trial 33 with value: 0.8289646486491734.


[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.059861 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 102919
[LightGBM] [Info] Number of data points in the train set: 28994, number of used features: 1934
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.040689 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 72695
[LightGBM] [Info] Number of data points in the train set: 19329, number of used features: 1914
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.048739 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 73130
[LightGBM] [Info] Number of data points in the train set: 19329, number of used features: 1915
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.044993 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 72472
[LightGBM] [Info] Number of data points in the train set: 19330, number of used features: 1915
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




🏃 View run Trial_37_LightGBM_class_weight_TFIDF_Trigrams at: https://dagshub.com/satyajeetrai007/Youtube-Comment-Sentiment-Analysis.mlflow/#/experiments/8/runs/d14083a147744014836748e0734f9c59
🧪 View experiment at: https://dagshub.com/satyajeetrai007/Youtube-Comment-Sentiment-Analysis.mlflow/#/experiments/8


[I 2025-08-28 01:45:04,931] Trial 37 finished with value: 0.8226529408473029 and parameters: {'learning_rate': 0.03568745421105521, 'n_estimators': 390, 'max_depth': 18}. Best is trial 33 with value: 0.8289646486491734.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.060019 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 102919
[LightGBM] [Info] Number of data points in the train set: 28994, number of used features: 1934
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.064531 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 72695
[LightGBM] [Info] Number of data points in the train set: 19329, number of used features: 1914
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.044284 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 73130
[LightGBM] [Info] Number of data points in the train set: 19329, number of used features: 1915
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.066778 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 72472
[LightGBM] [Info] Number of data points in the train set: 19330, number of used features: 1915
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




🏃 View run Trial_38_LightGBM_class_weight_TFIDF_Trigrams at: https://dagshub.com/satyajeetrai007/Youtube-Comment-Sentiment-Analysis.mlflow/#/experiments/8/runs/83ce207bd4af414dbeb9f2942952a568
🧪 View experiment at: https://dagshub.com/satyajeetrai007/Youtube-Comment-Sentiment-Analysis.mlflow/#/experiments/8


[I 2025-08-28 01:47:27,157] Trial 38 finished with value: 0.8282403251759552 and parameters: {'learning_rate': 0.046764415997628594, 'n_estimators': 470, 'max_depth': 19}. Best is trial 33 with value: 0.8289646486491734.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.060311 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 102919
[LightGBM] [Info] Number of data points in the train set: 28994, number of used features: 1934
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.064532 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 72695
[LightGBM] [Info] Number of data points in the train set: 19329, number of used features: 1914
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.045119 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 73130
[LightGBM] [Info] Number of data points in the train set: 19329, number of used features: 1915
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.124227 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 72472
[LightGBM] [Info] Number of data points in the train set: 19330, number of used features: 1915
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




🏃 View run Trial_39_LightGBM_class_weight_TFIDF_Trigrams at: https://dagshub.com/satyajeetrai007/Youtube-Comment-Sentiment-Analysis.mlflow/#/experiments/8/runs/750a6f3681dd478eb7f305a561b9527e
🧪 View experiment at: https://dagshub.com/satyajeetrai007/Youtube-Comment-Sentiment-Analysis.mlflow/#/experiments/8


[I 2025-08-28 01:49:13,612] Trial 39 finished with value: 0.7981306079833358 and parameters: {'learning_rate': 0.026326033495689422, 'n_estimators': 250, 'max_depth': 19}. Best is trial 33 with value: 0.8289646486491734.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.073483 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 102919
[LightGBM] [Info] Number of data points in the train set: 28994, number of used features: 1934
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.040268 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 72695
[LightGBM] [Info] Number of data points in the train set: 19329, number of used features: 1914
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.043222 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 73130
[LightGBM] [Info] Number of data points in the train set: 19329, number of used features: 1915
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.064200 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 72472
[LightGBM] [Info] Number of data points in the train set: 19330, number of used features: 1915
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




🏃 View run Trial_40_LightGBM_class_weight_TFIDF_Trigrams at: https://dagshub.com/satyajeetrai007/Youtube-Comment-Sentiment-Analysis.mlflow/#/experiments/8/runs/14526d68d89b445c86af0a17804203cd
🧪 View experiment at: https://dagshub.com/satyajeetrai007/Youtube-Comment-Sentiment-Analysis.mlflow/#/experiments/8


[I 2025-08-28 01:51:07,665] Trial 40 finished with value: 0.8233082512228074 and parameters: {'learning_rate': 0.04691364780966606, 'n_estimators': 297, 'max_depth': 18}. Best is trial 33 with value: 0.8289646486491734.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.068795 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 102919
[LightGBM] [Info] Number of data points in the train set: 28994, number of used features: 1934
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.040358 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 72695
[LightGBM] [Info] Number of data points in the train set: 19329, number of used features: 1914
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.053732 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 73130
[LightGBM] [Info] Number of data points in the train set: 19329, number of used features: 1915
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.047337 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 72472
[LightGBM] [Info] Number of data points in the train set: 19330, number of used features: 1915
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




🏃 View run Trial_41_LightGBM_class_weight_TFIDF_Trigrams at: https://dagshub.com/satyajeetrai007/Youtube-Comment-Sentiment-Analysis.mlflow/#/experiments/8/runs/76b205ad8d784860889931bfd4a0b6a3
🧪 View experiment at: https://dagshub.com/satyajeetrai007/Youtube-Comment-Sentiment-Analysis.mlflow/#/experiments/8


[I 2025-08-28 01:53:31,989] Trial 41 finished with value: 0.8276195177805262 and parameters: {'learning_rate': 0.05281604602497015, 'n_estimators': 472, 'max_depth': 19}. Best is trial 33 with value: 0.8289646486491734.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.066426 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 102919
[LightGBM] [Info] Number of data points in the train set: 28994, number of used features: 1934
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.060981 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 72695
[LightGBM] [Info] Number of data points in the train set: 19329, number of used features: 1914
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.048182 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 73130
[LightGBM] [Info] Number of data points in the train set: 19329, number of used features: 1915
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.052195 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 72472
[LightGBM] [Info] Number of data points in the train set: 19330, number of used features: 1915
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




🏃 View run Trial_42_LightGBM_class_weight_TFIDF_Trigrams at: https://dagshub.com/satyajeetrai007/Youtube-Comment-Sentiment-Analysis.mlflow/#/experiments/8/runs/b1ed8cb7729142f8aacb2c2810fb6015
🧪 View experiment at: https://dagshub.com/satyajeetrai007/Youtube-Comment-Sentiment-Analysis.mlflow/#/experiments/8


[I 2025-08-28 01:55:41,638] Trial 42 finished with value: 0.8283093489800137 and parameters: {'learning_rate': 0.05775414248512482, 'n_estimators': 429, 'max_depth': 16}. Best is trial 33 with value: 0.8289646486491734.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.062281 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 102919
[LightGBM] [Info] Number of data points in the train set: 28994, number of used features: 1934
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.060996 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 72695
[LightGBM] [Info] Number of data points in the train set: 19329, number of used features: 1914
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.053908 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 73130
[LightGBM] [Info] Number of data points in the train set: 19329, number of used features: 1915
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.065166 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 72472
[LightGBM] [Info] Number of data points in the train set: 19330, number of used features: 1915
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




🏃 View run Trial_43_LightGBM_class_weight_TFIDF_Trigrams at: https://dagshub.com/satyajeetrai007/Youtube-Comment-Sentiment-Analysis.mlflow/#/experiments/8/runs/387476cf84b24ba897d50f80c6570c39
🧪 View experiment at: https://dagshub.com/satyajeetrai007/Youtube-Comment-Sentiment-Analysis.mlflow/#/experiments/8


[I 2025-08-28 01:57:55,818] Trial 43 finished with value: 0.8269642216801482 and parameters: {'learning_rate': 0.06537128799029411, 'n_estimators': 432, 'max_depth': 20}. Best is trial 33 with value: 0.8289646486491734.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.059579 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 102919
[LightGBM] [Info] Number of data points in the train set: 28994, number of used features: 1934
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.064219 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 72695
[LightGBM] [Info] Number of data points in the train set: 19329, number of used features: 1914
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.044157 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 73130
[LightGBM] [Info] Number of data points in the train set: 19329, number of used features: 1915
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.046611 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 72472
[LightGBM] [Info] Number of data points in the train set: 19330, number of used features: 1915
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




🏃 View run Trial_44_LightGBM_class_weight_TFIDF_Trigrams at: https://dagshub.com/satyajeetrai007/Youtube-Comment-Sentiment-Analysis.mlflow/#/experiments/8/runs/747869d88b9345c999ee60ca71083170
🧪 View experiment at: https://dagshub.com/satyajeetrai007/Youtube-Comment-Sentiment-Analysis.mlflow/#/experiments/8


[I 2025-08-28 02:00:04,098] Trial 44 finished with value: 0.8265503714958848 and parameters: {'learning_rate': 0.07489999050128168, 'n_estimators': 414, 'max_depth': 18}. Best is trial 33 with value: 0.8289646486491734.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.068480 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 102919
[LightGBM] [Info] Number of data points in the train set: 28994, number of used features: 1934
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.040718 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 72695
[LightGBM] [Info] Number of data points in the train set: 19329, number of used features: 1914
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.072932 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 73130
[LightGBM] [Info] Number of data points in the train set: 19329, number of used features: 1915
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.043770 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 72472
[LightGBM] [Info] Number of data points in the train set: 19330, number of used features: 1915
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




🏃 View run Trial_45_LightGBM_class_weight_TFIDF_Trigrams at: https://dagshub.com/satyajeetrai007/Youtube-Comment-Sentiment-Analysis.mlflow/#/experiments/8/runs/972e89c6f40444eca4c57fbbfa22e724
🧪 View experiment at: https://dagshub.com/satyajeetrai007/Youtube-Comment-Sentiment-Analysis.mlflow/#/experiments/8


[I 2025-08-28 02:01:38,789] Trial 45 finished with value: 0.7837827785448278 and parameters: {'learning_rate': 0.04460092700979816, 'n_estimators': 333, 'max_depth': 6}. Best is trial 33 with value: 0.8289646486491734.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.086537 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 102919
[LightGBM] [Info] Number of data points in the train set: 28994, number of used features: 1934
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.062000 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 72695
[LightGBM] [Info] Number of data points in the train set: 19329, number of used features: 1914
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.052476 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 73130
[LightGBM] [Info] Number of data points in the train set: 19329, number of used features: 1915
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.055175 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 72472
[LightGBM] [Info] Number of data points in the train set: 19330, number of used features: 1915
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




🏃 View run Trial_46_LightGBM_class_weight_TFIDF_Trigrams at: https://dagshub.com/satyajeetrai007/Youtube-Comment-Sentiment-Analysis.mlflow/#/experiments/8/runs/2b64e49a1678485c8a6bd34a10690873
🧪 View experiment at: https://dagshub.com/satyajeetrai007/Youtube-Comment-Sentiment-Analysis.mlflow/#/experiments/8


[I 2025-08-28 02:03:07,229] Trial 46 finished with value: 0.8105814301735056 and parameters: {'learning_rate': 0.0918986668922981, 'n_estimators': 111, 'max_depth': 16}. Best is trial 33 with value: 0.8289646486491734.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.060001 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 102919
[LightGBM] [Info] Number of data points in the train set: 28994, number of used features: 1934
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.042976 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 72695
[LightGBM] [Info] Number of data points in the train set: 19329, number of used features: 1914
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.046633 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 73130
[LightGBM] [Info] Number of data points in the train set: 19329, number of used features: 1915
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.044411 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 72472
[LightGBM] [Info] Number of data points in the train set: 19330, number of used features: 1915
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




🏃 View run Trial_47_LightGBM_class_weight_TFIDF_Trigrams at: https://dagshub.com/satyajeetrai007/Youtube-Comment-Sentiment-Analysis.mlflow/#/experiments/8/runs/19e790f9d62349adbd6699a785c515db
🧪 View experiment at: https://dagshub.com/satyajeetrai007/Youtube-Comment-Sentiment-Analysis.mlflow/#/experiments/8


[I 2025-08-28 02:05:31,616] Trial 47 finished with value: 0.8284817746608516 and parameters: {'learning_rate': 0.049922628675269115, 'n_estimators': 485, 'max_depth': 17}. Best is trial 33 with value: 0.8289646486491734.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.059854 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 102919
[LightGBM] [Info] Number of data points in the train set: 28994, number of used features: 1934
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.038067 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 72695
[LightGBM] [Info] Number of data points in the train set: 19329, number of used features: 1914
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.041598 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 73130
[LightGBM] [Info] Number of data points in the train set: 19329, number of used features: 1915
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.043097 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 72472
[LightGBM] [Info] Number of data points in the train set: 19330, number of used features: 1915
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




🏃 View run Trial_48_LightGBM_class_weight_TFIDF_Trigrams at: https://dagshub.com/satyajeetrai007/Youtube-Comment-Sentiment-Analysis.mlflow/#/experiments/8/runs/2ff7cba797ab4c0ca5a6e681e3dd0310
🧪 View experiment at: https://dagshub.com/satyajeetrai007/Youtube-Comment-Sentiment-Analysis.mlflow/#/experiments/8


[I 2025-08-28 02:07:48,841] Trial 48 finished with value: 0.8278954702454979 and parameters: {'learning_rate': 0.04964233144567342, 'n_estimators': 500, 'max_depth': 15}. Best is trial 33 with value: 0.8289646486491734.


[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.057608 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 102919
[LightGBM] [Info] Number of data points in the train set: 28994, number of used features: 1934
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.044641 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 72695
[LightGBM] [Info] Number of data points in the train set: 19329, number of used features: 1914
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.065795 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 73130
[LightGBM] [Info] Number of data points in the train set: 19329, number of used features: 1915
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.067368 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 72472
[LightGBM] [Info] Number of data points in the train set: 19330, number of used features: 1915
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




🏃 View run Trial_49_LightGBM_class_weight_TFIDF_Trigrams at: https://dagshub.com/satyajeetrai007/Youtube-Comment-Sentiment-Analysis.mlflow/#/experiments/8/runs/c0f47c4b239e42698653b10c63b7d08d
🧪 View experiment at: https://dagshub.com/satyajeetrai007/Youtube-Comment-Sentiment-Analysis.mlflow/#/experiments/8


[I 2025-08-28 02:10:07,126] Trial 49 finished with value: 0.8271022157565416 and parameters: {'learning_rate': 0.06037607566966323, 'n_estimators': 480, 'max_depth': 17}. Best is trial 33 with value: 0.8289646486491734.


In [39]:
# Extract the best hyperparameters
best_params = study.best_params
best_params

{'learning_rate': 0.046521491543330344, 'n_estimators': 499, 'max_depth': 19}

In [40]:
best_model = lgb.LGBMClassifier(

    objective='multiclass',
    num_class=3,
    metric="multi_logloss",
    is_unbalance= True,
    class_weight= "balanced",
    reg_alpha= 0.1,  # L1 regularization
    reg_lambda= 0.1,  # L2 regularization
    learning_rate= 0.0679484162034985,
    max_depth= 17,
    n_estimators=333
)

In [41]:
# Fit the model on the resampled training data
best_model.fit(X_train_tfidf_cleaned, y_train_cleaned)

[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.134328 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 102919
[LightGBM] [Info] Number of data points in the train set: 28994, number of used features: 1934
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612


0,1,2
,boosting_type,'gbdt'
,num_leaves,31
,max_depth,17
,learning_rate,0.0679484162034985
,n_estimators,333
,subsample_for_bin,200000
,objective,'multiclass'
,class_weight,'balanced'
,min_split_gain,0.0
,min_child_weight,0.001


In [42]:
# Predict on the train set
y_train_pred = best_model.predict(X_train_tfidf_cleaned)



In [43]:
# Calculate accuracy on the test set
accuracy_train = accuracy_score(y_train_cleaned, y_train_pred)
accuracy_train

0.8915982617093192

In [44]:
# Generate classification report
report_train = classification_report(y_train_cleaned, y_train_pred)
print(report_train)

              precision    recall  f1-score   support

          -1       0.87      0.84      0.85      6543
           0       0.83      0.98      0.90      9984
           1       0.97      0.85      0.91     12467

    accuracy                           0.89     28994
   macro avg       0.89      0.89      0.89     28994
weighted avg       0.90      0.89      0.89     28994



In [45]:
# Predict on the test set
y_pred = best_model.predict(X_test_tfidf_cleaned)



In [46]:
# Calculate accuracy on the test set
accuracy = accuracy_score(y_test_cleaned, y_pred)
accuracy

0.8379086770589047

In [26]:
# Generate classification report
report = classification_report(y_test_cleaned, y_pred)
print(report)

              precision    recall  f1-score   support

          -1       0.76      0.74      0.75      1657
           0       0.81      0.96      0.88      2393
           1       0.91      0.80      0.85      3199

    accuracy                           0.84      7249
   macro avg       0.83      0.83      0.83      7249
weighted avg       0.84      0.84      0.84      7249



In [49]:
import re
import numpy as np

# Assuming you have pre-trained tfidf_vectorizer and lgbm_model loaded
# tfidf_vectorizer: Your trained TF-IDF vectorizer
# lgbm_model: Your trained LightGBM model

# Function to clean and preprocess a YouTube comment (same as used during training)
def preprocess_comment(comment):
    # Lowercasing
    comment = comment.lower()

    # Remove special characters, URLs, punctuation, and extra spaces
    comment = re.sub(r"http\S+|www\S+|https\S+", '', comment, flags=re.MULTILINE)  # Remove URLs
    comment = re.sub(r'\W', ' ', comment)  # Remove special characters
    comment = re.sub(r'\s+', ' ', comment).strip()  # Remove extra spaces and newlines

    return comment

# Prediction function
def predict_sentiment(comment, tfidf_vectorizer, lgbm_model):
    # Step 1: Preprocess the YouTube comment
    cleaned_comment = preprocess_comment(comment)

    # Step 2: Transform the comment using the trained TF-IDF vectorizer
    comment_tfidf = tfidf_vectorizer.transform([cleaned_comment])

    # Step 3: Use the trained LightGBM model to predict the sentiment
    prediction = lgbm_model.predict(comment_tfidf)
    prediction_proba = lgbm_model.predict_proba(comment_tfidf)

    # Step 4: Get the predicted sentiment (label) and probability
    sentiment_class = np.argmax(prediction_proba)
    sentiment_proba = np.max(prediction_proba)

    # Step 5: Return the sentiment label and confidence
    return {
        'sentiment_class': int(prediction[0]),  # -1, 0, or 1 depending on your labels
        'confidence': sentiment_proba
    }

# Example usage:
comment1 = "I absolutely hate this video!"
comment2 = "The explanations were confusing and the video quality was poor."
comment3 = "I didn’t learn anything useful. Really disappointed."
comment4 = "Wow, the explanation was so clear and helpful. Definitely subscribing!"
comment5 = "This is the worst video I’ve seen on this topic, very misleading"
comment6 = "Not much to say about this, just a standard video."
comment7 = "The video is okay, but I expected more depth in the content."
comment8 = "Superb content! Mazaa aa gaya dekh ke. Best video on this topic!"
comment9 = "Poor video quality aur explanation bhi weak tha."
comment10 = "Yeh video theek tha, but I was expecting more depth."
result = predict_sentiment(comment1, tfidf_cleaned, best_model)
print(f"Predicted Sentiment: {result['sentiment_class']}, Confidence: {result['confidence']}")

Predicted Sentiment: -1, Confidence: 0.9415004590733588


