In [1]:
# Install the libraries
# !pip install transformers datasets peft torch accelerate evaluate
!pip install -q transformers datasets peft torch accelerate evaluate # '-q' flag to quietly install the packages without showing the output logs

[?25l     [90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━[0m [32m0.0/75.1 kB[0m [31m?[0m eta [36m-:--:--[0m[2K     [90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━[0m [32m75.1/75.1 kB[0m [31m6.3 MB/s[0m eta [36m0:00:00[0m
[?25h[?25l   [90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━[0m [32m0.0/511.6 kB[0m [31m?[0m eta [36m-:--:--[0m[2K   [90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━[0m [32m511.6/511.6 kB[0m [31m30.3 MB/s[0m eta [36m0:00:00[0m
[?25h[?25l   [90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━[0m [32m0.0/556.4 kB[0m [31m?[0m eta [36m-:--:--[0m[2K   [90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━[0m [32m556.4/556.4 kB[0m [31m45.1 MB/s[0m eta [36m0:00:00[0m
[?25h[?25l   [90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━[0m [32m0.0/84.1 kB[0m [31m?[0m eta [36m-:--:--[0m[2K   [90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━[0m [32m84.1/84.1 kB[0m [31m9.5 MB/s[0m eta [36m0:00:00[0m
[2K   [90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━

In [2]:
import torch
import random
import numpy as np
import pandas as pd
import gc

# Import Hugging Face libraries
import evaluate
from datasets import load_dataset, Dataset, DatasetDict, IterableDataset, IterableDatasetDict
from transformers import AutoTokenizer, AutoModelForSequenceClassification, TrainingArguments, Trainer, DataCollatorWithPadding, EvalPrediction
from peft import LoraConfig, TaskType, get_peft_model



In [3]:
# Import the Python types
from typing import List, Dict, Any, Tuple, cast, Optional

from dataclasses import dataclass, asdict

In [4]:
import shutil
import os

if os.path.exists("/content/results"):
  shutil.rmtree("/content/results")

Constants

In [5]:
SEED = 42
TRAIN_SAMPLE_SIZE = 3000
TOTAL_TRIALS = 20
NUM_LABELS = 6
MAX_LENGTH = 128
MODEL = "distilbert-base-uncased"

Hyperparameters

In [6]:
# Search Space (Discrete Options)
WARMUP_OPTIONS = [0.0, 0.06, 0.1]
RANK_OPTIONS = [2, 4, 8, 16, 24, 32, 48]
ALPHA_OPTIONS = [8, 16, 32, 64, 96]
DROPOUT_OPTIONS = [0, 0.05, 0.1, 0.2]
TARGET_MODULE_OPTIONS = [
    ["q_lin", "v_lin"],                           # Index 0
    ["q_lin", "v_lin", "ffn.lin1", "ffn.lin2"]    # Index 1
]

In [7]:
def set_global_seed(seed: int):
  """
  Set the global seed for reproducibility.
  """
  random.seed(seed)
  np.random.seed(seed)
  torch.manual_seed(seed)

  # Check if CUDA GPU is available
  if torch.cuda.is_available():
    torch.cuda.manual_seed(seed)


In [8]:
set_global_seed(SEED)

In [9]:
class Individual:
  def __init__(self, genes: np.ndarray = None):
    if genes is None:
      self.genes = np.array([
        np.random.uniform(5e-6, 5e-4), # learning rate
        np.random.uniform(0.0, 0.1), # warmup ratio
        np.random.uniform(2, 24), # rank
        np.random.uniform(8, 96), # alpha
        np.random.uniform(0.0, 0.2), # dropout
        np.random.random() #v to choose between the target modules
      ])
    else:
      self.genes = genes.copy()

    self.fitness = None

  def decode(self):
    self.learning_rate = self.genes[0]
    self.warmup_ratio  = min(WARMUP_OPTIONS, key=lambda x: abs(x - self.genes[1]))
    self.rank = min(RANK_OPTIONS, key=lambda x: abs(x - self.genes[2]))
    self.alpha = min(ALPHA_OPTIONS, key=lambda x : abs(x - self.genes[3]))
    self.dropout = min(DROPOUT_OPTIONS, key=lambda x : abs(x - self.genes[4]))
    if self.genes[5] < 0.5:
      self.target_modules = ["q_lin", "v_lin"]
    else:
        self.target_modules = ["q_lin", "v_lin", "ffn.lin1", "ffn.lin2"]

In [10]:
# for the parents
def selection(population, num_parents):
  parents = []
  for i in range(num_parents):
    idx1, idx2 = random.sample(range(len(population)), 2)
    if population[idx1].fitness > population[idx2].fitness:
      parents.append(population[idx1])
    else:
      parents.append(population[idx2])
  return parents

# for the children
def crossover(parents, offspring_size):
  offspring = []
  for _ in range(offspring_size):
    parent1, parent2 = random.sample(parents, 2)
    crossover_point = random.randint(1, len(parent1.genes)-1)
    child_genes = np.concatenate([parent1.genes[:crossover_point], parent2.genes[crossover_point:]])
    offspring.append(Individual(child_genes))
  return offspring

# to create new children from current children (with different characteristics)
def mutation(individual: Individual, mutation_rate: float = 0.1, mutation_strength: float = 0.1):
    bounds = [(5e-6, 5e-4), (0.0, 0.1), (2, 24), (8, 96), (0.0, 0.2), (0.0, 1.0)]

    for i in range(len(individual.genes)):
        if random.random() < mutation_rate:
            low, high = bounds[i]
            range_size = high - low
            noise = np.random.normal(0, mutation_strength * range_size)
            individual.genes[i] = np.clip(individual.genes[i] + noise, low, high)


def blx_alpha_crossover(parent1: Individual, parent2: Individual, alpha: float=0.5) -> Individual:
  child_genes = np.zeros(len(parent1.genes))

  for i in range(len(parent1.genes)):
    g1, g2 = parent1.genes[i], parent2.genes[i]
    cmin, cmax = min(g1, g2), max(g1, g2)
    interval = cmax - cmin

    child_genes[i] = np.random.uniform(cmin - alpha * interval, cmax + alpha * interval)

    bounds = [(5e-6, 5e-4), (0.0, 0.1), (2, 24), (8, 96), (0.0, 0.2), (0.0, 1.0)]
    for i, (low, high) in enumerate(bounds):
        child_genes[i] = np.clip(child_genes[i], low, high)

    return Individual(child_genes)



# def fitness_function(individual):
#   individual.decode()
#   learning_rate = individual.learning_rate
#   warmup_ratio = individual.warmup_ratio
#   rank = individual.warmup_ratio
#   alpha = individual.alpha
#   dropout = individual.dropout
#   target_modules = individual.target_modules

#   print





In [11]:
class DataManager:
  def __init__(self, model_name: str = MODEL):
    self.tokenizer = AutoTokenizer.from_pretrained(model_name)
    self.dataset: Optional[Dict[str, Any]] = None

  def prepare_data(self) -> Dict[str, Any]:
    """
    Loads the dataset and processes it.
    """

    # Check if the dataset is correctly loaded into the instance memory
    if self.dataset is not None:
        return self.dataset

    print("Loading and processing data...")

    # Load full dataset
    full_dataset = cast(DatasetDict, load_dataset("dair-ai/emotion"))

    # Use seed to ensure every run uses the SAME subset of data
    train_subset = full_dataset["train"].shuffle(seed=SEED).select(range(TRAIN_SAMPLE_SIZE))

    # Private helper method for text embeddings
    def _tokenize(examples):
      return self.tokenizer(
        examples["text"],
        truncation=True,
        padding="max_length",
        max_length=MAX_LENGTH
      )

    tokenized_train_dataset = train_subset.map(_tokenize, batched=True)
    tokenized_validation_dataset = full_dataset["validation"].map(_tokenize, batched=True)

    self.dataset = {
        "train": tokenized_train_dataset,
        "validation": tokenized_validation_dataset,
        "tokenizer": self.tokenizer,
        "num_labels": NUM_LABELS
    }

    print("Data preparation complete.")

    return self.dataset

In [12]:
data_manager = DataManager()
data_bundle = data_manager.prepare_data()

The secret `HF_TOKEN` does not exist in your Colab secrets.
To authenticate with the Hugging Face Hub, create a token in your settings tab (https://huggingface.co/settings/tokens), set it as secret in your Google Colab and restart your session.
You will be able to reuse this secret in all of your notebooks.
Please note that authentication is recommended but still optional to access public models or datasets.


tokenizer_config.json:   0%|          | 0.00/48.0 [00:00<?, ?B/s]

config.json:   0%|          | 0.00/483 [00:00<?, ?B/s]

vocab.txt:   0%|          | 0.00/232k [00:00<?, ?B/s]

tokenizer.json:   0%|          | 0.00/466k [00:00<?, ?B/s]

Loading and processing data...


README.md: 0.00B [00:00, ?B/s]

split/train-00000-of-00001.parquet:   0%|          | 0.00/1.03M [00:00<?, ?B/s]

split/validation-00000-of-00001.parquet:   0%|          | 0.00/127k [00:00<?, ?B/s]

split/test-00000-of-00001.parquet:   0%|          | 0.00/129k [00:00<?, ?B/s]

Generating train split:   0%|          | 0/16000 [00:00<?, ? examples/s]

Generating validation split:   0%|          | 0/2000 [00:00<?, ? examples/s]

Generating test split:   0%|          | 0/2000 [00:00<?, ? examples/s]

Map:   0%|          | 0/3000 [00:00<?, ? examples/s]

Map:   0%|          | 0/2000 [00:00<?, ? examples/s]

Data preparation complete.


# **RCGA-BLX-ALPHA Engine**

In [13]:
class RCGAExperiment:
    def __init__(self, data_bundle: Dict[str, Any]):
        self.data = data_bundle
        self.results: List[Dict[str, Any]] = []
        self.metric = evaluate.load("accuracy")
        self.trial_counter = 0

        # Bounds for the 6 genes
        self.min_bounds = np.array([5e-6, 0.0, 2, 8, 0.0, 0.0])
        self.max_bounds = np.array([5e-4, 0.1, 24, 96, 0.2, 1.0])

    def _compute_metrics(self, eval_pred: EvalPrediction) -> Dict[str, float]:
        predictions, labels = eval_pred
        predictions = np.argmax(predictions, axis=1)
        result = self.metric.compute(predictions=predictions, references=labels)
        return cast(Dict[str, float], result)

    def _cleanup_memory(self):
        torch.cuda.empty_cache()
        gc.collect()

    def train_model(self, trial_id: int, params: Individual) -> float:
        print(f"Params: LR={params.learning_rate:.2e}, Rank={params.rank}, Alpha={params.alpha}")

        model = AutoModelForSequenceClassification.from_pretrained(
            MODEL, num_labels=self.data["num_labels"]
        )

        peft_config = LoraConfig(
            task_type=TaskType.SEQ_CLS,
            r=params.rank,
            lora_alpha=params.alpha,
            lora_dropout=params.dropout,
            target_modules=params.target_modules
        )
        model = get_peft_model(model, peft_config)

        current_seed = SEED + trial_id

        args = TrainingArguments(
            output_dir=f"./results/rcga_trial_{trial_id}",
            learning_rate=params.learning_rate,
            per_device_train_batch_size=16,
            per_device_eval_batch_size=16,
            num_train_epochs=3,
            warmup_ratio=params.warmup_ratio,
            weight_decay=0.01,
            eval_strategy="epoch",
            save_strategy="no",
            logging_strategy="epoch",
            seed=current_seed,
            report_to="none",
            load_best_model_at_end=False,
            optim="adamw_torch"
        )

        data_collator = DataCollatorWithPadding(tokenizer=self.data["tokenizer"])

        trainer = Trainer(
            model=model,
            args=args,
            train_dataset=self.data["train"],
            eval_dataset=self.data["validation"],
            data_collator=data_collator,
            compute_metrics=self._compute_metrics
        )

        trainer.train()
        eval_results = trainer.evaluate()

        del model
        del trainer
        self._cleanup_memory()

        return eval_results["eval_accuracy"]

    def fitness_function(self, individual: Individual) -> float:
        self.trial_counter += 1

        individual.decode()  # Decode the genes to set learning_rate, rank, etc.

        try:
            accuracy = self.train_model(self.trial_counter, individual)  # ✅ Pass the individual directly
            print(f"Accuracy: {accuracy:.4%}")
            return accuracy
        except Exception as e:
          print(f"Error in Trial {self.trial_counter}: {e}")
          self._cleanup_memory()
          return 0.0

    def run_rcga(self, population_size: int = 20, generations: int = 10):
        print(f"Starting RCGA: {population_size} individuals, {generations} generations.")

        # 1. Initialization
        population = [Individual() for _ in range(population_size)]

        best_individual = None
        best_fitness = -float('inf')

        for gen in range(generations):
            print(f"\n{'='*50}")
            print(f"GENERATION {gen + 1}/{generations}")
            print(f"{'='*50}")

            # Evaluation
            for i, individual in enumerate(population):
                print(f"\n[Gen {gen+1}, Individual {i+1}/{population_size}]")
                individual.fitness = self.fitness_function(individual)

                # tracking best solution
                if individual.fitness > best_fitness:
                    best_fitness = individual.fitness
                    best_individual = Individual(individual.genes.copy())
                    print(f"NEW BEST FITNESS: {best_fitness:.4%}")

                # Log result
                individual.decode()
                record = {
                    "generation": gen + 1,
                    "trial_id": self.trial_counter,
                    "accuracy": individual.fitness,
                    "learning_rate": individual.learning_rate,
                    "warmup_ratio": individual.warmup_ratio,
                    "rank": individual.rank,
                    "alpha": individual.alpha,
                    "dropout": individual.dropout,
                    "target_modules": str(individual.target_modules)
                }
                self.results.append(record)

            # Stopping if last generation
            if gen == generations - 1:
                break

            # Selection
            num_parents = population_size // 2
            parents = selection(population, num_parents)

            # Crossover + Mutation
            offspring = []
            offspring.append(Individual(best_individual.genes.copy()))  # Elitism

            while len(offspring) < population_size:
                parent1, parent2 = random.sample(parents, 2)
                child = blx_alpha_crossover(parent1, parent2, alpha=0.5)
                mutation(child)
                offspring.append(child)

            # Replacing the population
            population = offspring

        print(f"\n{'='*50}")
        print("RCGA OPTIMIZATION COMPLETE")
        print(f"{'='*50}")
        print(f"Best Fitness: {best_fitness:.4%}")

        return best_individual, best_fitness

    def save_results(self, filename: str = "rcga_results.csv"):
        """Saves results to CSV and prints summary"""
        if not self.results:
            print("No results to save.")
            return

        df = pd.DataFrame(self.results)
        df.to_csv(filename, index=False)
        print(f"\nResults saved to {filename}")

        best_run = df.loc[df['accuracy'].idxmax()]
        print("\n" + "="*40)
        print("TOP RESULT:")
        print("="*40)
        print(f"Accuracy: {best_run['accuracy']:.4%}")
        print(f"Generation: {int(best_run['generation'])}")
        print(f"Rank: {int(best_run['rank'])}, Alpha: {int(best_run['alpha'])}")
        print(f"LR: {best_run['learning_rate']:.2e}")
        print(f"Warmup: {best_run['warmup_ratio']}")
        print(f"Dropout: {best_run['dropout']}")

In [14]:
experiment = RCGAExperiment(data_bundle)

# Use run_rcga() instead of run_experiment()
best_individual, best_fitness = experiment.run_rcga(population_size=20, generations=5)

experiment.save_results()

Downloading builder script: 0.00B [00:00, ?B/s]

Starting RCGA: 20 individuals, 5 generations.

GENERATION 1/5

[Gen 1, Individual 1/20]
Params: LR=1.90e-04, Rank=16, Alpha=64


model.safetensors:   0%|          | 0.00/268M [00:00<?, ?B/s]

Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Accuracy
1,1.2116,0.711431,0.733
2,0.5934,0.533686,0.8035
3,0.4571,0.483387,0.8305




Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Accuracy: 83.0500%
NEW BEST FITNESS: 83.0500%

[Gen 1, Individual 2/20]
Params: LR=3.38e-05, Rank=16, Alpha=64




Epoch,Training Loss,Validation Loss,Accuracy
1,1.4677,1.146061,0.566
2,1.0341,0.942269,0.6785
3,0.879,0.876567,0.69




Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Accuracy: 69.0000%

[Gen 1, Individual 3/20]
Params: LR=4.17e-04, Rank=8, Alpha=32




Epoch,Training Loss,Validation Loss,Accuracy
1,0.9258,0.464454,0.8325
2,0.3451,0.368918,0.8745
3,0.2101,0.336485,0.897




Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Accuracy: 89.7000%
NEW BEST FITNESS: 89.7000%

[Gen 1, Individual 4/20]
Params: LR=2.19e-04, Rank=16, Alpha=16




Epoch,Training Loss,Validation Loss,Accuracy
1,1.1895,0.786077,0.69
2,0.6773,0.61573,0.7745
3,0.5401,0.57091,0.7975




Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Accuracy: 79.7500%

[Gen 1, Individual 5/20]
Params: LR=2.31e-04, Rank=8, Alpha=64




Epoch,Training Loss,Validation Loss,Accuracy
1,1.1268,0.700072,0.7425
2,0.5774,0.492942,0.8245
3,0.4264,0.461921,0.834




Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Accuracy: 83.4000%

[Gen 1, Individual 6/20]
Params: LR=3.06e-04, Rank=4, Alpha=96




Epoch,Training Loss,Validation Loss,Accuracy
1,0.9619,0.484381,0.843
2,0.3937,0.372468,0.8815
3,0.2344,0.315587,0.899




Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Accuracy: 89.9000%
NEW BEST FITNESS: 89.9000%

[Gen 1, Individual 7/20]
Params: LR=1.56e-04, Rank=16, Alpha=32




Epoch,Training Loss,Validation Loss,Accuracy
1,1.1901,0.849295,0.683
2,0.6907,0.625923,0.7735
3,0.5539,0.582808,0.7925




Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Accuracy: 79.2500%

[Gen 1, Individual 8/20]
Params: LR=2.20e-05, Rank=8, Alpha=64




Epoch,Training Loss,Validation Loss,Accuracy
1,1.5563,1.317539,0.5385
2,1.1865,1.115696,0.5765
3,1.0674,1.064917,0.613




Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Accuracy: 61.3000%

[Gen 1, Individual 9/20]
Params: LR=2.76e-04, Rank=24, Alpha=64




Epoch,Training Loss,Validation Loss,Accuracy
1,0.925,0.532889,0.823
2,0.3803,0.329128,0.89
3,0.2272,0.323735,0.8955




Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Accuracy: 89.5500%

[Gen 1, Individual 10/20]
Params: LR=3.01e-04, Rank=4, Alpha=32




Epoch,Training Loss,Validation Loss,Accuracy
1,1.1471,0.680157,0.7515
2,0.5631,0.487794,0.821
3,0.4101,0.457681,0.8375




Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Accuracy: 83.7500%

[Gen 1, Individual 11/20]
Params: LR=1.97e-04, Rank=24, Alpha=32




Epoch,Training Loss,Validation Loss,Accuracy
1,1.0408,0.602267,0.767
2,0.4596,0.415342,0.861
3,0.2971,0.374145,0.8795




Accuracy: 87.9500%

[Gen 1, Individual 12/20]
Params: LR=7.48e-05, Rank=4, Alpha=96


Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Accuracy
1,1.3698,1.010449,0.643
2,0.8868,0.797104,0.702
3,0.7482,0.747102,0.7135




Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Accuracy: 71.3500%

[Gen 1, Individual 13/20]
Params: LR=7.73e-06, Rank=16, Alpha=64




Epoch,Training Loss,Validation Loss,Accuracy
1,1.7304,1.630822,0.4545
2,1.5784,1.552908,0.4035
3,1.5384,1.537804,0.439




Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Accuracy: 43.9000%

[Gen 1, Individual 14/20]
Params: LR=1.82e-04, Rank=24, Alpha=64




Epoch,Training Loss,Validation Loss,Accuracy
1,1.1194,0.747861,0.725
2,0.6105,0.551001,0.8015
3,0.4745,0.50517,0.823




Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Accuracy: 82.3000%

[Gen 1, Individual 15/20]
Params: LR=1.59e-04, Rank=16, Alpha=64




Epoch,Training Loss,Validation Loss,Accuracy
1,1.2252,0.807413,0.711
2,0.6617,0.590898,0.79
3,0.5332,0.54815,0.8015




Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Accuracy: 80.1500%

[Gen 1, Individual 16/20]
Params: LR=6.42e-05, Rank=16, Alpha=64




Epoch,Training Loss,Validation Loss,Accuracy
1,1.3957,1.053444,0.628
2,0.9349,0.844831,0.6915
3,0.7942,0.799156,0.7045




Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Accuracy: 70.4500%

[Gen 1, Individual 17/20]
Params: LR=2.64e-04, Rank=2, Alpha=16




Epoch,Training Loss,Validation Loss,Accuracy
1,1.116,0.647069,0.755
2,0.5072,0.442084,0.847
3,0.3402,0.416158,0.8605




Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Accuracy: 86.0500%

[Gen 1, Individual 18/20]
Params: LR=1.61e-04, Rank=24, Alpha=32




Epoch,Training Loss,Validation Loss,Accuracy
1,1.1722,0.670462,0.7435
2,0.5475,0.450021,0.8495
3,0.3581,0.410649,0.8655




Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Accuracy: 86.5500%

[Gen 1, Individual 19/20]
Params: LR=1.18e-04, Rank=8, Alpha=16




Epoch,Training Loss,Validation Loss,Accuracy
1,1.2587,0.888584,0.6755
2,0.7419,0.661574,0.753
3,0.5826,0.590834,0.786




Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Accuracy: 78.6000%

[Gen 1, Individual 20/20]
Params: LR=3.19e-04, Rank=16, Alpha=32




Epoch,Training Loss,Validation Loss,Accuracy
1,1.0303,0.54111,0.8095
2,0.4067,0.366347,0.8865
3,0.2308,0.348784,0.893




Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Accuracy: 89.3000%

GENERATION 2/5

[Gen 2, Individual 1/20]
Params: LR=3.06e-04, Rank=4, Alpha=96




Epoch,Training Loss,Validation Loss,Accuracy
1,0.9386,0.500434,0.833
2,0.3769,0.391534,0.8805
3,0.2381,0.35815,0.8875




Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Accuracy: 88.7500%

[Gen 2, Individual 2/20]
Params: LR=2.99e-04, Rank=2, Alpha=8




Epoch,Training Loss,Validation Loss,Accuracy
1,1.1801,0.8312,0.7105
2,0.681,0.611245,0.774
3,0.538,0.567556,0.7975




Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Accuracy: 79.7500%

[Gen 2, Individual 3/20]
Params: LR=3.06e-04, Rank=2, Alpha=8




Epoch,Training Loss,Validation Loss,Accuracy
1,1.1655,0.775627,0.709
2,0.6612,0.614963,0.7825
3,0.5367,0.56162,0.8005




Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Accuracy: 80.0500%

[Gen 2, Individual 4/20]
Params: LR=2.96e-04, Rank=2, Alpha=8




Epoch,Training Loss,Validation Loss,Accuracy
1,1.175,0.772562,0.7065
2,0.6497,0.592665,0.7895
3,0.5225,0.552393,0.8035




Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Accuracy: 80.3500%

[Gen 2, Individual 5/20]
Params: LR=2.96e-04, Rank=2, Alpha=8




Epoch,Training Loss,Validation Loss,Accuracy
1,1.1746,0.76614,0.712
2,0.6575,0.631608,0.7645
3,0.5358,0.573,0.7965




Accuracy: 79.6500%

[Gen 2, Individual 6/20]
Params: LR=3.01e-04, Rank=2, Alpha=8


Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Accuracy
1,1.1857,0.854938,0.6905
2,0.6772,0.644648,0.7655
3,0.5518,0.572701,0.792




Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Accuracy: 79.2000%

[Gen 2, Individual 7/20]
Params: LR=4.25e-04, Rank=2, Alpha=8




Epoch,Training Loss,Validation Loss,Accuracy
1,1.1091,0.756965,0.714
2,0.5939,0.539705,0.8085
3,0.4802,0.493826,0.8295




Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Accuracy: 82.9500%

[Gen 2, Individual 8/20]
Params: LR=3.05e-04, Rank=2, Alpha=8




Epoch,Training Loss,Validation Loss,Accuracy
1,1.1686,0.78691,0.6895
2,0.6523,0.594836,0.7885
3,0.5274,0.547095,0.804




Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Accuracy: 80.4000%

[Gen 2, Individual 9/20]
Params: LR=3.06e-04, Rank=2, Alpha=8




Epoch,Training Loss,Validation Loss,Accuracy
1,1.1563,0.788699,0.709
2,0.675,0.600679,0.7905
3,0.535,0.558769,0.7985




Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Accuracy: 79.8500%

[Gen 2, Individual 10/20]
Params: LR=1.79e-04, Rank=2, Alpha=8




Epoch,Training Loss,Validation Loss,Accuracy
1,1.2899,0.96573,0.655
2,0.8118,0.735618,0.725
3,0.6648,0.678691,0.7555




Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Accuracy: 75.5500%

[Gen 2, Individual 11/20]
Params: LR=2.94e-04, Rank=2, Alpha=8




Epoch,Training Loss,Validation Loss,Accuracy
1,1.2009,0.815273,0.6925
2,0.6651,0.637806,0.7725
3,0.5355,0.569858,0.796




Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Accuracy: 79.6000%

[Gen 2, Individual 12/20]
Params: LR=3.08e-04, Rank=2, Alpha=8




Epoch,Training Loss,Validation Loss,Accuracy
1,1.1428,0.783704,0.7135
2,0.6383,0.589026,0.784
3,0.5082,0.547031,0.7995




Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Accuracy: 79.9500%

[Gen 2, Individual 13/20]
Params: LR=2.92e-04, Rank=2, Alpha=8




Epoch,Training Loss,Validation Loss,Accuracy
1,1.1514,0.773149,0.7165
2,0.6678,0.602716,0.772
3,0.5259,0.563134,0.797




Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Accuracy: 79.7000%

[Gen 2, Individual 14/20]
Params: LR=3.06e-04, Rank=2, Alpha=8




Epoch,Training Loss,Validation Loss,Accuracy
1,1.179,0.802987,0.6985
2,0.6709,0.597746,0.7865
3,0.5403,0.561874,0.796




Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Accuracy: 79.6000%

[Gen 2, Individual 15/20]
Params: LR=3.06e-04, Rank=2, Alpha=8




Epoch,Training Loss,Validation Loss,Accuracy
1,1.1655,0.772576,0.731
2,0.6497,0.587441,0.7785
3,0.5276,0.54882,0.8015




Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Accuracy: 80.1500%

[Gen 2, Individual 16/20]
Params: LR=3.07e-04, Rank=2, Alpha=8




Epoch,Training Loss,Validation Loss,Accuracy
1,1.1519,0.779546,0.7025
2,0.6648,0.595353,0.7835
3,0.5236,0.556288,0.8




Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Accuracy: 80.0000%

[Gen 2, Individual 17/20]
Params: LR=2.51e-04, Rank=2, Alpha=8




Epoch,Training Loss,Validation Loss,Accuracy
1,1.2116,0.835134,0.689
2,0.7014,0.635394,0.766
3,0.575,0.597147,0.782




Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Accuracy: 78.2000%

[Gen 2, Individual 18/20]
Params: LR=3.06e-04, Rank=2, Alpha=8




Epoch,Training Loss,Validation Loss,Accuracy
1,1.1762,0.806583,0.6945
2,0.6711,0.620371,0.7795
3,0.5427,0.570766,0.796




Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Accuracy: 79.6000%

[Gen 2, Individual 19/20]
Params: LR=1.82e-04, Rank=2, Alpha=16




Epoch,Training Loss,Validation Loss,Accuracy
1,1.2015,0.869639,0.6885
2,0.7248,0.653129,0.755
3,0.5984,0.614208,0.7655




Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Accuracy: 76.5500%

[Gen 2, Individual 20/20]
Params: LR=3.06e-04, Rank=2, Alpha=8




Epoch,Training Loss,Validation Loss,Accuracy
1,1.1385,0.769892,0.7215
2,0.6562,0.603399,0.784
3,0.5301,0.560488,0.798




Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Accuracy: 79.8000%

GENERATION 3/5

[Gen 3, Individual 1/20]
Params: LR=3.06e-04, Rank=4, Alpha=96




Epoch,Training Loss,Validation Loss,Accuracy
1,0.9268,0.482645,0.836
2,0.404,0.331934,0.888
3,0.2251,0.310129,0.9055




Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Accuracy: 90.5500%
NEW BEST FITNESS: 90.5500%

[Gen 3, Individual 2/20]
Params: LR=3.06e-04, Rank=2, Alpha=8




Epoch,Training Loss,Validation Loss,Accuracy
1,1.1712,0.800709,0.6995
2,0.6657,0.600167,0.7755
3,0.5462,0.576264,0.7885




Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Accuracy: 78.8500%

[Gen 3, Individual 3/20]
Params: LR=3.08e-04, Rank=2, Alpha=8




Epoch,Training Loss,Validation Loss,Accuracy
1,1.1717,0.797032,0.693
2,0.6563,0.594115,0.7785
3,0.5324,0.54651,0.8045




Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Accuracy: 80.4500%

[Gen 3, Individual 4/20]
Params: LR=3.03e-04, Rank=2, Alpha=8




Epoch,Training Loss,Validation Loss,Accuracy
1,1.1591,0.791209,0.7095
2,0.6694,0.620699,0.7795
3,0.5351,0.554783,0.7985




Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Accuracy: 79.8500%

[Gen 3, Individual 5/20]
Params: LR=3.31e-04, Rank=2, Alpha=8




Epoch,Training Loss,Validation Loss,Accuracy
1,1.1554,0.74723,0.713
2,0.6398,0.589353,0.7855
3,0.5029,0.537696,0.811




Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Accuracy: 81.1000%

[Gen 3, Individual 6/20]
Params: LR=4.85e-04, Rank=2, Alpha=8




Epoch,Training Loss,Validation Loss,Accuracy
1,1.074,0.675483,0.754
2,0.5679,0.509085,0.821
3,0.4576,0.47562,0.8365




Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Accuracy: 83.6500%

[Gen 3, Individual 7/20]
Params: LR=4.45e-04, Rank=2, Alpha=8




Epoch,Training Loss,Validation Loss,Accuracy
1,1.073,0.656091,0.761
2,0.5782,0.521767,0.8145
3,0.4516,0.482424,0.8295




Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Accuracy: 82.9500%

[Gen 3, Individual 8/20]
Params: LR=3.78e-04, Rank=2, Alpha=8




Epoch,Training Loss,Validation Loss,Accuracy
1,1.124,0.679694,0.752
2,0.5958,0.549202,0.8055
3,0.4759,0.514354,0.821




Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Accuracy: 82.1000%

[Gen 3, Individual 9/20]
Params: LR=3.07e-04, Rank=2, Alpha=8




Epoch,Training Loss,Validation Loss,Accuracy
1,1.176,0.778663,0.7025
2,0.6453,0.602965,0.778
3,0.5458,0.563742,0.7985




Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Accuracy: 79.8500%

[Gen 3, Individual 10/20]
Params: LR=3.07e-04, Rank=2, Alpha=8




Epoch,Training Loss,Validation Loss,Accuracy
1,1.1766,0.783933,0.7035
2,0.6612,0.586945,0.7875
3,0.5385,0.548359,0.7995




Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Accuracy: 79.9500%

[Gen 3, Individual 11/20]
Params: LR=3.06e-04, Rank=2, Alpha=8




Epoch,Training Loss,Validation Loss,Accuracy
1,1.1441,0.760853,0.712
2,0.6501,0.613897,0.7825
3,0.5271,0.556792,0.796




Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Accuracy: 79.6000%

[Gen 3, Individual 12/20]
Params: LR=2.31e-04, Rank=2, Alpha=8




Epoch,Training Loss,Validation Loss,Accuracy
1,1.2188,0.894748,0.6685
2,0.7227,0.649284,0.7645
3,0.6027,0.604559,0.7835




Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Accuracy: 78.3500%

[Gen 3, Individual 13/20]
Params: LR=2.67e-04, Rank=2, Alpha=8




Epoch,Training Loss,Validation Loss,Accuracy
1,1.1763,0.808068,0.7075
2,0.6765,0.626357,0.7705
3,0.5579,0.580368,0.7875




Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Accuracy: 78.7500%

[Gen 3, Individual 14/20]
Params: LR=3.09e-04, Rank=2, Alpha=8




Epoch,Training Loss,Validation Loss,Accuracy
1,1.1389,0.784149,0.715
2,0.6436,0.609625,0.7715
3,0.5109,0.550815,0.8075




Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Accuracy: 80.7500%

[Gen 3, Individual 15/20]
Params: LR=3.07e-04, Rank=2, Alpha=8




Epoch,Training Loss,Validation Loss,Accuracy
1,1.1551,0.772819,0.7105
2,0.649,0.611874,0.775
3,0.5308,0.566,0.8




Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Accuracy: 80.0000%

[Gen 3, Individual 16/20]
Params: LR=3.34e-04, Rank=2, Alpha=8




Epoch,Training Loss,Validation Loss,Accuracy
1,1.1532,0.768832,0.6975
2,0.6539,0.62323,0.776
3,0.5051,0.550617,0.8055




Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Accuracy: 80.5500%

[Gen 3, Individual 17/20]
Params: LR=2.33e-04, Rank=2, Alpha=8




Epoch,Training Loss,Validation Loss,Accuracy
1,1.1933,0.861451,0.6895
2,0.7065,0.646043,0.754
3,0.5892,0.605179,0.7835




Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Accuracy: 78.3500%

[Gen 3, Individual 18/20]
Params: LR=3.07e-04, Rank=2, Alpha=8




Epoch,Training Loss,Validation Loss,Accuracy
1,1.1734,0.802921,0.699
2,0.6711,0.609224,0.7815
3,0.545,0.576866,0.7965




Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Accuracy: 79.6500%

[Gen 3, Individual 19/20]
Params: LR=2.56e-04, Rank=2, Alpha=8




Epoch,Training Loss,Validation Loss,Accuracy
1,1.1981,0.811805,0.697
2,0.7026,0.636908,0.762
3,0.5673,0.591606,0.783




Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Accuracy: 78.3000%

[Gen 3, Individual 20/20]
Params: LR=3.06e-04, Rank=2, Alpha=8




Epoch,Training Loss,Validation Loss,Accuracy
1,1.1438,0.740522,0.729
2,0.6378,0.593182,0.7865
3,0.5126,0.54819,0.81




Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Accuracy: 81.0000%

GENERATION 4/5

[Gen 4, Individual 1/20]
Params: LR=3.06e-04, Rank=4, Alpha=96




Epoch,Training Loss,Validation Loss,Accuracy
1,0.9696,0.543505,0.818
2,0.3932,0.360344,0.8845
3,0.2301,0.326826,0.903




Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Accuracy: 90.3000%

[Gen 4, Individual 2/20]
Params: LR=4.26e-04, Rank=2, Alpha=8




Epoch,Training Loss,Validation Loss,Accuracy
1,1.0925,0.688245,0.749
2,0.601,0.531996,0.811
3,0.4576,0.496238,0.8245




Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Accuracy: 82.4500%

[Gen 4, Individual 3/20]
Params: LR=4.80e-04, Rank=2, Alpha=8




Epoch,Training Loss,Validation Loss,Accuracy
1,1.055,0.650426,0.763
2,0.5652,0.536649,0.8085
3,0.4408,0.477617,0.8325




Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Accuracy: 83.2500%

[Gen 4, Individual 4/20]
Params: LR=3.06e-04, Rank=2, Alpha=8




Epoch,Training Loss,Validation Loss,Accuracy
1,1.1487,0.796234,0.7065
2,0.6628,0.600185,0.7755
3,0.5337,0.567451,0.7925




Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Accuracy: 79.2500%

[Gen 4, Individual 5/20]
Params: LR=3.28e-04, Rank=2, Alpha=8




Epoch,Training Loss,Validation Loss,Accuracy
1,1.1387,0.756228,0.7105
2,0.6332,0.59134,0.7815
3,0.5088,0.539336,0.805




Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Accuracy: 80.5000%

[Gen 4, Individual 6/20]
Params: LR=3.06e-04, Rank=2, Alpha=8




Epoch,Training Loss,Validation Loss,Accuracy
1,1.1569,0.767209,0.7075
2,0.6588,0.583448,0.793
3,0.5228,0.542398,0.8055




Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Accuracy: 80.5500%

[Gen 4, Individual 7/20]
Params: LR=3.06e-04, Rank=2, Alpha=8




Epoch,Training Loss,Validation Loss,Accuracy
1,1.1976,0.802848,0.7045
2,0.6866,0.599702,0.789
3,0.5507,0.565222,0.7955




Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Accuracy: 79.5500%

[Gen 4, Individual 8/20]
Params: LR=4.08e-04, Rank=2, Alpha=8




Epoch,Training Loss,Validation Loss,Accuracy
1,1.0873,0.681398,0.7525
2,0.5835,0.545081,0.808
3,0.4619,0.510246,0.824




Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Accuracy: 82.4000%

[Gen 4, Individual 9/20]
Params: LR=5.00e-04, Rank=2, Alpha=8




Epoch,Training Loss,Validation Loss,Accuracy
1,1.0295,0.625769,0.779
2,0.5596,0.512795,0.8165
3,0.4438,0.473309,0.8335




Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Accuracy: 83.3500%

[Gen 4, Individual 10/20]
Params: LR=2.83e-04, Rank=2, Alpha=8




Epoch,Training Loss,Validation Loss,Accuracy
1,1.1747,0.794383,0.6995
2,0.6651,0.6048,0.788
3,0.5505,0.571433,0.798




Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Accuracy: 79.8000%

[Gen 4, Individual 11/20]
Params: LR=3.36e-04, Rank=2, Alpha=8




Epoch,Training Loss,Validation Loss,Accuracy
1,1.1565,0.75889,0.714
2,0.6495,0.60768,0.7785
3,0.5229,0.557923,0.791




Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Accuracy: 79.1000%

[Gen 4, Individual 12/20]
Params: LR=3.06e-04, Rank=2, Alpha=8




Epoch,Training Loss,Validation Loss,Accuracy
1,1.1876,0.802924,0.7075
2,0.6794,0.592201,0.7895
3,0.5413,0.562737,0.8005




Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Accuracy: 80.0500%

[Gen 4, Individual 13/20]
Params: LR=3.07e-04, Rank=2, Alpha=8




Epoch,Training Loss,Validation Loss,Accuracy
1,1.172,0.77918,0.715
2,0.6592,0.597445,0.7855
3,0.5334,0.571557,0.798




Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Accuracy: 79.8000%

[Gen 4, Individual 14/20]
Params: LR=4.35e-04, Rank=2, Alpha=8




Epoch,Training Loss,Validation Loss,Accuracy
1,1.0884,0.690012,0.7445
2,0.585,0.541286,0.803
3,0.4722,0.496643,0.825




Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Accuracy: 82.5000%

[Gen 4, Individual 15/20]
Params: LR=4.85e-04, Rank=2, Alpha=8




Epoch,Training Loss,Validation Loss,Accuracy
1,1.1168,0.753171,0.7215
2,0.5887,0.524454,0.8065
3,0.4397,0.485496,0.8335




Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Accuracy: 83.3500%

[Gen 4, Individual 16/20]
Params: LR=3.07e-04, Rank=2, Alpha=8




Epoch,Training Loss,Validation Loss,Accuracy
1,1.1445,0.755115,0.7155
2,0.6456,0.567598,0.7925
3,0.5123,0.532457,0.807




Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Accuracy: 80.7000%

[Gen 4, Individual 17/20]
Params: LR=2.87e-04, Rank=2, Alpha=8




Epoch,Training Loss,Validation Loss,Accuracy
1,1.1847,0.857325,0.6845
2,0.6848,0.616051,0.7735
3,0.5582,0.581029,0.793




Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Accuracy: 79.3000%

[Gen 4, Individual 18/20]
Params: LR=3.53e-04, Rank=2, Alpha=8




Epoch,Training Loss,Validation Loss,Accuracy
1,1.1238,0.737688,0.721
2,0.6207,0.562961,0.8
3,0.5054,0.521109,0.8245




Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Accuracy: 82.4500%

[Gen 4, Individual 19/20]
Params: LR=3.61e-04, Rank=2, Alpha=8




Epoch,Training Loss,Validation Loss,Accuracy
1,1.1212,0.738993,0.7185
2,0.6113,0.577661,0.7845
3,0.4906,0.510706,0.818




Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Accuracy: 81.8000%

[Gen 4, Individual 20/20]
Params: LR=4.02e-04, Rank=2, Alpha=8




Epoch,Training Loss,Validation Loss,Accuracy
1,1.1087,0.784752,0.722
2,0.5922,0.557099,0.7955
3,0.4668,0.51184,0.8255




Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Accuracy: 82.5500%

GENERATION 5/5

[Gen 5, Individual 1/20]
Params: LR=3.06e-04, Rank=4, Alpha=96




Epoch,Training Loss,Validation Loss,Accuracy
1,0.9519,0.468646,0.843
2,0.3898,0.380323,0.8785
3,0.2297,0.313642,0.903




Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Accuracy: 90.3000%

[Gen 5, Individual 2/20]
Params: LR=3.44e-04, Rank=2, Alpha=8




Epoch,Training Loss,Validation Loss,Accuracy
1,1.1293,0.732668,0.7335
2,0.6246,0.583032,0.7895
3,0.5115,0.529388,0.8065




Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Accuracy: 80.6500%

[Gen 5, Individual 3/20]
Params: LR=3.56e-04, Rank=4, Alpha=8




Epoch,Training Loss,Validation Loss,Accuracy
1,1.1253,0.737563,0.731
2,0.6249,0.572703,0.795
3,0.496,0.525907,0.811




Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Accuracy: 81.1000%

[Gen 5, Individual 4/20]
Params: LR=3.45e-04, Rank=2, Alpha=8




Epoch,Training Loss,Validation Loss,Accuracy
1,1.1353,0.772402,0.723
2,0.6232,0.551151,0.8095
3,0.4874,0.517577,0.823




Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Accuracy: 82.3000%

[Gen 5, Individual 5/20]
Params: LR=3.52e-04, Rank=4, Alpha=8




Epoch,Training Loss,Validation Loss,Accuracy
1,1.1524,0.746374,0.7295
2,0.6274,0.581526,0.7935
3,0.5044,0.517643,0.8175




Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Accuracy: 81.7500%

[Gen 5, Individual 6/20]
Params: LR=2.69e-04, Rank=2, Alpha=8




Epoch,Training Loss,Validation Loss,Accuracy
1,1.2019,0.842854,0.689
2,0.6996,0.644343,0.7715
3,0.5603,0.592207,0.7845




Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Accuracy: 78.4500%

[Gen 5, Individual 7/20]
Params: LR=3.80e-04, Rank=2, Alpha=8




Epoch,Training Loss,Validation Loss,Accuracy
1,1.1208,0.719145,0.745
2,0.5959,0.54533,0.808
3,0.4881,0.509239,0.8185




Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Accuracy: 81.8500%

[Gen 5, Individual 8/20]
Params: LR=4.80e-04, Rank=2, Alpha=8




Epoch,Training Loss,Validation Loss,Accuracy
1,1.0563,0.64578,0.767
2,0.5697,0.507189,0.8185
3,0.4244,0.4715,0.8345




Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Accuracy: 83.4500%

[Gen 5, Individual 9/20]
Params: LR=2.88e-04, Rank=2, Alpha=8




Epoch,Training Loss,Validation Loss,Accuracy
1,1.1932,0.807531,0.6905
2,0.669,0.618682,0.7745
3,0.5489,0.573046,0.797




Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Accuracy: 79.7000%

[Gen 5, Individual 10/20]
Params: LR=2.29e-04, Rank=2, Alpha=8




Epoch,Training Loss,Validation Loss,Accuracy
1,1.2432,0.877725,0.68
2,0.7273,0.663528,0.7585
3,0.5779,0.621496,0.771




Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Accuracy: 77.1000%

[Gen 5, Individual 11/20]
Params: LR=3.31e-04, Rank=2, Alpha=8




Epoch,Training Loss,Validation Loss,Accuracy
1,1.1215,0.76074,0.7105
2,0.6271,0.594982,0.7835
3,0.517,0.541838,0.8045




Accuracy: 80.4500%

[Gen 5, Individual 12/20]
Params: LR=3.87e-04, Rank=2, Alpha=8


Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Accuracy
1,1.1197,0.743904,0.7215
2,0.6114,0.57502,0.7985
3,0.4828,0.52249,0.8135




Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Accuracy: 81.3500%

[Gen 5, Individual 13/20]
Params: LR=5.00e-04, Rank=2, Alpha=8




Epoch,Training Loss,Validation Loss,Accuracy
1,1.038,0.6399,0.7645
2,0.5597,0.512065,0.8205
3,0.4274,0.466067,0.8485




Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Accuracy: 84.8500%

[Gen 5, Individual 14/20]
Params: LR=3.24e-04, Rank=2, Alpha=8




Epoch,Training Loss,Validation Loss,Accuracy
1,1.1761,0.783361,0.72
2,0.6447,0.57843,0.7905
3,0.5153,0.54669,0.8015




Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Accuracy: 80.1500%

[Gen 5, Individual 15/20]
Params: LR=3.78e-04, Rank=2, Alpha=8




Epoch,Training Loss,Validation Loss,Accuracy
1,1.0823,0.696625,0.7375
2,0.6081,0.573393,0.793
3,0.4733,0.514073,0.8175




Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Accuracy: 81.7500%

[Gen 5, Individual 16/20]
Params: LR=2.86e-04, Rank=2, Alpha=8




Epoch,Training Loss,Validation Loss,Accuracy
1,1.19,0.8267,0.6985
2,0.6693,0.614845,0.777
3,0.5446,0.568887,0.796




Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Accuracy: 79.6000%

[Gen 5, Individual 17/20]
Params: LR=5.00e-04, Rank=2, Alpha=8




Epoch,Training Loss,Validation Loss,Accuracy
1,1.0426,0.663387,0.7515
2,0.5487,0.516343,0.816
3,0.4247,0.471637,0.839




Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Accuracy: 83.9000%

[Gen 5, Individual 18/20]
Params: LR=5.00e-04, Rank=2, Alpha=8




Epoch,Training Loss,Validation Loss,Accuracy
1,1.0532,0.665463,0.7545
2,0.578,0.534069,0.8095
3,0.4282,0.46941,0.8355




Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Accuracy: 83.5500%

[Gen 5, Individual 19/20]
Params: LR=3.12e-04, Rank=2, Alpha=8




Epoch,Training Loss,Validation Loss,Accuracy
1,1.1455,0.771973,0.7
2,0.6357,0.598838,0.78
3,0.5283,0.551852,0.7975




Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Accuracy: 79.7500%

[Gen 5, Individual 20/20]
Params: LR=5.00e-04, Rank=2, Alpha=8




Epoch,Training Loss,Validation Loss,Accuracy
1,1.0434,0.672286,0.754
2,0.5651,0.522602,0.809
3,0.446,0.493934,0.823




Accuracy: 82.3000%

RCGA OPTIMIZATION COMPLETE
Best Fitness: 90.5500%

Results saved to rcga_results.csv

TOP RESULT:
Accuracy: 90.5500%
Generation: 3
Rank: 4, Alpha: 96
LR: 3.06e-04
Warmup: 0.0
Dropout: 0.2
