In [1]:
import torch
from datasets import load_dataset
dataset = load_dataset('tweet_eval','irony')

from transformers import AutoTokenizer, AlbertForSequenceClassification

tokenizer = AutoTokenizer.from_pretrained("textattack/albert-base-v2-imdb",use_fast=False)



In [2]:
dataset


DatasetDict({
    train: Dataset({
        features: ['text', 'label'],
        num_rows: 2862
    })
    test: Dataset({
        features: ['text', 'label'],
        num_rows: 784
    })
    validation: Dataset({
        features: ['text', 'label'],
        num_rows: 955
    })
})

In [3]:
tokenizer

AlbertTokenizer(name_or_path='textattack/albert-base-v2-imdb', vocab_size=30000, model_max_length=512, is_fast=False, padding_side='right', truncation_side='right', special_tokens={'bos_token': '[CLS]', 'eos_token': '[SEP]', 'unk_token': '<unk>', 'sep_token': '[SEP]', 'pad_token': '<pad>', 'cls_token': '[CLS]', 'mask_token': '[MASK]'}, clean_up_tokenization_spaces=True),  added_tokens_decoder={
	0: AddedToken("<pad>", rstrip=False, lstrip=False, single_word=False, normalized=False, special=True),
	1: AddedToken("<unk>", rstrip=False, lstrip=False, single_word=False, normalized=False, special=True),
	2: AddedToken("[CLS]", rstrip=False, lstrip=False, single_word=False, normalized=False, special=True),
	3: AddedToken("[SEP]", rstrip=False, lstrip=False, single_word=False, normalized=False, special=True),
	4: AddedToken("[MASK]", rstrip=False, lstrip=True, single_word=False, normalized=False, special=True),
}

In [4]:
def tokenize_function(example):
    return tokenizer(example["text"], padding="max_length", truncation=True)
tokenized_datasets = dataset.map(tokenize_function, batched=True)

In [5]:
tokenized_datasets["train"]

Dataset({
    features: ['text', 'label', 'input_ids', 'token_type_ids', 'attention_mask'],
    num_rows: 2862
})

In [6]:
tokenized_datasets

DatasetDict({
    train: Dataset({
        features: ['text', 'label', 'input_ids', 'token_type_ids', 'attention_mask'],
        num_rows: 2862
    })
    test: Dataset({
        features: ['text', 'label', 'input_ids', 'token_type_ids', 'attention_mask'],
        num_rows: 784
    })
    validation: Dataset({
        features: ['text', 'label', 'input_ids', 'token_type_ids', 'attention_mask'],
        num_rows: 955
    })
})

In [7]:
from transformers import  Trainer, TrainingArguments
import numpy as np
from sklearn.metrics import accuracy_score
model = AlbertForSequenceClassification.from_pretrained("textattack/albert-base-v2-imdb", num_labels=2)
training_args = TrainingArguments(
output_dir="./results",
# Directory for saving outputs
learning_rate=5e-5,
# Learning rate for optimization
per_device_train_batch_size=16,
# Batch size for training
per_device_eval_batch_size=16,
# Batch size for evaluation
num_train_epochs=3,
# Number of training epochs
weight_decay=0.01,
# Weight decay for regularization
evaluation_strategy="epoch",
save_strategy = "no"
# Evaluation is done at the end of each epoch
)
train_dataset = tokenized_datasets["train"]
eval_dataset = tokenized_datasets["test"]
val_dataset = tokenized_datasets["validation"]
trainer = Trainer(
model=model,
args=training_args,
train_dataset=train_dataset,
eval_dataset=eval_dataset,
compute_metrics=lambda p: {"accuracy": accuracy_score(p.label_ids,
np.argmax(p.predictions,
axis=1))}
)

2024-03-09 10:24:01.902706: E external/local_xla/xla/stream_executor/cuda/cuda_dnn.cc:9261] Unable to register cuDNN factory: Attempting to register factory for plugin cuDNN when one has already been registered
2024-03-09 10:24:01.902752: E external/local_xla/xla/stream_executor/cuda/cuda_fft.cc:607] Unable to register cuFFT factory: Attempting to register factory for plugin cuFFT when one has already been registered
2024-03-09 10:24:01.904352: E external/local_xla/xla/stream_executor/cuda/cuda_blas.cc:1515] Unable to register cuBLAS factory: Attempting to register factory for plugin cuBLAS when one has already been registered


In [8]:
model

AlbertForSequenceClassification(
  (albert): AlbertModel(
    (embeddings): AlbertEmbeddings(
      (word_embeddings): Embedding(30000, 128, padding_idx=0)
      (position_embeddings): Embedding(512, 128)
      (token_type_embeddings): Embedding(2, 128)
      (LayerNorm): LayerNorm((128,), eps=1e-12, elementwise_affine=True)
      (dropout): Dropout(p=0, inplace=False)
    )
    (encoder): AlbertTransformer(
      (embedding_hidden_mapping_in): Linear(in_features=128, out_features=768, bias=True)
      (albert_layer_groups): ModuleList(
        (0): AlbertLayerGroup(
          (albert_layers): ModuleList(
            (0): AlbertLayer(
              (full_layer_layer_norm): LayerNorm((768,), eps=1e-12, elementwise_affine=True)
              (attention): AlbertAttention(
                (query): Linear(in_features=768, out_features=768, bias=True)
                (key): Linear(in_features=768, out_features=768, bias=True)
                (value): Linear(in_features=768, out_features=768,

In [9]:
import os
os.environ["WANDB_DISABLED"] = "true"

In [10]:
eval_results = trainer.evaluate(eval_dataset)
print(eval_results)

{'eval_loss': 1.3416439294815063, 'eval_accuracy': 0.45535714285714285, 'eval_runtime': 29.9122, 'eval_samples_per_second': 26.21, 'eval_steps_per_second': 1.638}


In [11]:
trainer.train()

Epoch,Training Loss,Validation Loss


KeyboardInterrupt: 

In [10]:
from ray import tune
def ray_hp_space(trial):
    return {
        "learning_rate": tune.loguniform(1e-6, 1e-4),
        "per_device_train_batch_size": tune.choice([1,4 ,8 ]),
        "num_train_epochs": tune.choice([1,3,5]),

        "weight_decay": tune.loguniform(1e-4, 0.1)
    }

In [11]:
small_train_dataset = tokenized_datasets["train"].shard(index=1, num_shards=10) 
small_eval_dataset = tokenized_datasets["test"].shard(index=1, num_shards=10) 


In [12]:
num_labels = 2
from transformers import DistilBertForSequenceClassification, Trainer, TrainingArguments
import numpy as np
from sklearn.metrics import accuracy_score
def model_init():
    return  DistilBertForSequenceClassification.from_pretrained('distilbert-base-uncased',num_labels=num_labels)

In [13]:




num_labels = num_labels
trainer = Trainer(

    model_init= model_init,

    args=training_args,

    train_dataset=small_train_dataset,

    eval_dataset=small_eval_dataset,

    compute_metrics=lambda p: {"accuracy": accuracy_score(p.label_ids,
np.argmax(p.predictions,
axis=1))}

    

  
)

Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


In [14]:
best_trial = trainer.hyperparameter_search(

    direction="maximize",

    backend="ray",

    hp_space=ray_hp_space,

    n_trials=15

)

  self.pid = _fork_exec(
2024-03-07 21:25:09,277	INFO worker.py:1724 -- Started a local Ray instance.
2024-03-07 21:25:10,881	INFO tune.py:220 -- Initializing Ray automatically. For cluster usage or custom Ray initialization, call `ray.init(...)` before `tune.run(...)`.
2024-03-07 21:25:10,884	INFO tune.py:583 -- [output] This uses the legacy output and progress reporter, as Jupyter notebooks are not supported by the new engine, yet. For more information, please see https://github.com/ray-project/ray/issues/36949


== Status ==
Current time: 2024-03-07 21:25:11 (running for 00:00:00.20)
Using FIFO scheduling algorithm.
Logical resource usage: 0/12 CPUs, 0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (15 PENDING)
+------------------------+----------+-------+-----------------+--------------------+------------------------+----------------+
| Trial name             | status   | loc   |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |
|                        |          |       |                 |                    |                ch_size |                |
|------------------------+----------+-------+-----------------+--------------------+------------------------+----------------|
| _objective_d78da_00000 | PENDING  |       |     5.61152e-06 |                  5 |                      1 |    0.015703    |
| _objective_d78da_00001 | PENDING  |       |     1.57513e-05 |                  3

[36m(_objective pid=7911)[0m 2024-03-07 21:25:16.803698: E external/local_xla/xla/stream_executor/cuda/cuda_dnn.cc:9261] Unable to register cuDNN factory: Attempting to register factory for plugin cuDNN when one has already been registered
[36m(_objective pid=7911)[0m 2024-03-07 21:25:16.803751: E external/local_xla/xla/stream_executor/cuda/cuda_fft.cc:607] Unable to register cuFFT factory: Attempting to register factory for plugin cuFFT when one has already been registered
[36m(_objective pid=7911)[0m 2024-03-07 21:25:16.805066: E external/local_xla/xla/stream_executor/cuda/cuda_blas.cc:1515] Unable to register cuBLAS factory: Attempting to register factory for plugin cuBLAS when one has already been registered
[36m(_objective pid=7911)[0m Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']

== Status ==
Current time: 2024-03-07 21:25:21 (running for 00:00:10.28)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (14 PENDING, 1 RUNNING)
+------------------------+----------+-----------------+-----------------+--------------------+------------------------+----------------+
| Trial name             | status   | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |
|                        |          |                 |                 |                    |                ch_size |                |
|------------------------+----------+-----------------+-----------------+--------------------+------------------------+----------------|
| _objective_d78da_00000 | RUNNING  | 172.19.0.1:7911 |     5.61152e-06 |                  5 |                      1 |    0.015703    |
| _objective_d78d

  1%|          | 11/1435 [00:01<02:01, 11.71it/s]
  1%|          | 13/1435 [00:01<01:56, 12.24it/s]
  1%|          | 15/1435 [00:01<01:53, 12.51it/s]
  1%|          | 17/1435 [00:01<01:51, 12.72it/s]
  1%|▏         | 19/1435 [00:01<01:49, 12.89it/s]
  1%|▏         | 21/1435 [00:01<01:49, 12.95it/s]
  2%|▏         | 23/1435 [00:02<01:49, 12.84it/s]
  2%|▏         | 25/1435 [00:02<01:50, 12.78it/s]
  2%|▏         | 27/1435 [00:02<01:49, 12.87it/s]
  2%|▏         | 29/1435 [00:02<01:47, 13.03it/s]
  2%|▏         | 31/1435 [00:02<01:47, 13.10it/s]
  2%|▏         | 33/1435 [00:02<01:46, 13.16it/s]
  2%|▏         | 35/1435 [00:02<01:46, 13.19it/s]
  3%|▎         | 37/1435 [00:03<01:45, 13.21it/s]
  3%|▎         | 39/1435 [00:03<01:45, 13.21it/s]
  3%|▎         | 41/1435 [00:03<01:45, 13.22it/s]
  3%|▎         | 43/1435 [00:03<01:45, 13.23it/s]
  3%|▎         | 45/1435 [00:03<01:45, 13.23it/s]
  3%|▎         | 47/1435 [00:03<01:44, 13.23it/s]
  3%|▎         | 49/1435 [00:04<01:44, 13.24it/s]


== Status ==
Current time: 2024-03-07 21:25:26 (running for 00:00:15.31)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (14 PENDING, 1 RUNNING)
+------------------------+----------+-----------------+-----------------+--------------------+------------------------+----------------+
| Trial name             | status   | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |
|                        |          |                 |                 |                    |                ch_size |                |
|------------------------+----------+-----------------+-----------------+--------------------+------------------------+----------------|
| _objective_d78da_00000 | RUNNING  | 172.19.0.1:7911 |     5.61152e-06 |                  5 |                      1 |    0.015703    |
| _objective_d78d

  6%|▌         | 79/1435 [00:06<01:43, 13.16it/s]
  6%|▌         | 81/1435 [00:06<01:43, 13.14it/s]
  6%|▌         | 83/1435 [00:06<01:43, 13.06it/s]
  6%|▌         | 85/1435 [00:06<01:42, 13.15it/s]
  6%|▌         | 87/1435 [00:06<01:42, 13.17it/s]
  6%|▌         | 89/1435 [00:07<01:42, 13.15it/s]
  6%|▋         | 91/1435 [00:07<01:41, 13.19it/s]
  6%|▋         | 93/1435 [00:07<01:41, 13.20it/s]
  7%|▋         | 95/1435 [00:07<01:41, 13.17it/s]
  7%|▋         | 97/1435 [00:07<01:42, 13.04it/s]
  7%|▋         | 99/1435 [00:07<01:44, 12.78it/s]
  7%|▋         | 101/1435 [00:07<01:45, 12.69it/s]
  7%|▋         | 103/1435 [00:08<01:44, 12.73it/s]
  7%|▋         | 105/1435 [00:08<01:43, 12.85it/s]
  7%|▋         | 107/1435 [00:08<01:42, 12.90it/s]
  8%|▊         | 109/1435 [00:08<01:42, 12.97it/s]
  8%|▊         | 111/1435 [00:08<01:41, 13.07it/s]
  8%|▊         | 113/1435 [00:08<01:41, 13.07it/s]
  8%|▊         | 115/1435 [00:09<01:40, 13.07it/s]
  8%|▊         | 117/1435 [00:09<01:40, 13

== Status ==
Current time: 2024-03-07 21:25:31 (running for 00:00:20.35)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (14 PENDING, 1 RUNNING)
+------------------------+----------+-----------------+-----------------+--------------------+------------------------+----------------+
| Trial name             | status   | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |
|                        |          |                 |                 |                    |                ch_size |                |
|------------------------+----------+-----------------+-----------------+--------------------+------------------------+----------------|
| _objective_d78da_00000 | RUNNING  | 172.19.0.1:7911 |     5.61152e-06 |                  5 |                      1 |    0.015703    |
| _objective_d78d

 10%|█         | 145/1435 [00:11<01:34, 13.58it/s]
 10%|█         | 147/1435 [00:11<01:34, 13.64it/s]
 10%|█         | 149/1435 [00:11<01:34, 13.61it/s]
 11%|█         | 151/1435 [00:11<01:34, 13.63it/s]
 11%|█         | 153/1435 [00:11<01:34, 13.56it/s]
 11%|█         | 155/1435 [00:12<01:34, 13.58it/s]
 11%|█         | 157/1435 [00:12<01:33, 13.66it/s]
 11%|█         | 159/1435 [00:12<01:33, 13.58it/s]
 11%|█         | 161/1435 [00:12<01:33, 13.60it/s]
 11%|█▏        | 163/1435 [00:12<01:33, 13.58it/s]
 11%|█▏        | 165/1435 [00:12<01:32, 13.66it/s]
 12%|█▏        | 167/1435 [00:12<01:32, 13.73it/s]
 12%|█▏        | 169/1435 [00:13<01:32, 13.70it/s]
 12%|█▏        | 171/1435 [00:13<01:32, 13.66it/s]
 12%|█▏        | 173/1435 [00:13<01:32, 13.71it/s]
 12%|█▏        | 175/1435 [00:13<01:32, 13.64it/s]
 12%|█▏        | 177/1435 [00:13<01:31, 13.71it/s]
 12%|█▏        | 179/1435 [00:13<01:31, 13.73it/s]
 13%|█▎        | 181/1435 [00:13<01:31, 13.64it/s]
 13%|█▎        | 183/1435 [00:1

== Status ==
Current time: 2024-03-07 21:25:36 (running for 00:00:25.39)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (14 PENDING, 1 RUNNING)
+------------------------+----------+-----------------+-----------------+--------------------+------------------------+----------------+
| Trial name             | status   | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |
|                        |          |                 |                 |                    |                ch_size |                |
|------------------------+----------+-----------------+-----------------+--------------------+------------------------+----------------|
| _objective_d78da_00000 | RUNNING  | 172.19.0.1:7911 |     5.61152e-06 |                  5 |                      1 |    0.015703    |
| _objective_d78d

 15%|█▍        | 213/1435 [00:16<01:29, 13.62it/s]
 15%|█▍        | 215/1435 [00:16<01:29, 13.70it/s]
 15%|█▌        | 217/1435 [00:16<01:29, 13.68it/s]
 15%|█▌        | 219/1435 [00:16<01:28, 13.73it/s]
 15%|█▌        | 221/1435 [00:16<01:28, 13.65it/s]
 16%|█▌        | 223/1435 [00:17<01:29, 13.60it/s]
 16%|█▌        | 225/1435 [00:17<01:28, 13.64it/s]
 16%|█▌        | 227/1435 [00:17<01:27, 13.73it/s]
 16%|█▌        | 229/1435 [00:17<01:27, 13.77it/s]
 16%|█▌        | 231/1435 [00:17<01:27, 13.82it/s]
 16%|█▌        | 233/1435 [00:17<01:27, 13.67it/s]
 16%|█▋        | 235/1435 [00:17<01:28, 13.56it/s]
 17%|█▋        | 237/1435 [00:18<01:28, 13.59it/s]
 17%|█▋        | 239/1435 [00:18<01:27, 13.68it/s]
 17%|█▋        | 241/1435 [00:18<01:26, 13.74it/s]
 17%|█▋        | 243/1435 [00:18<01:26, 13.71it/s]
 17%|█▋        | 245/1435 [00:18<01:26, 13.73it/s]
 17%|█▋        | 247/1435 [00:18<01:27, 13.65it/s]
 17%|█▋        | 249/1435 [00:18<01:26, 13.68it/s]
 17%|█▋        | 251/1435 [00:1

== Status ==
Current time: 2024-03-07 21:25:41 (running for 00:00:30.43)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (14 PENDING, 1 RUNNING)
+------------------------+----------+-----------------+-----------------+--------------------+------------------------+----------------+
| Trial name             | status   | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |
|                        |          |                 |                 |                    |                ch_size |                |
|------------------------+----------+-----------------+-----------------+--------------------+------------------------+----------------|
| _objective_d78da_00000 | RUNNING  | 172.19.0.1:7911 |     5.61152e-06 |                  5 |                      1 |    0.015703    |
| _objective_d78d

 20%|█▉        | 283/1435 [00:21<01:24, 13.63it/s]
 20%|█▉        | 285/1435 [00:21<01:24, 13.67it/s]
 20%|██        | 287/1435 [00:21<01:23, 13.69it/s]
[36m(_objective pid=7911)[0m 
  0%|          | 0/5 [00:00<?, ?it/s][A
[36m(_objective pid=7911)[0m 
 40%|████      | 2/5 [00:00<00:00,  7.53it/s][A
[36m(_objective pid=7911)[0m 
 60%|██████    | 3/5 [00:00<00:00,  5.24it/s][A
[36m(_objective pid=7911)[0m 
 80%|████████  | 4/5 [00:00<00:00,  4.37it/s][A


Trial name,epoch,eval_accuracy,eval_loss,eval_runtime,eval_samples_per_second,eval_steps_per_second,objective
_objective_d78da_00000,5,0.594937,0.851065,1.3529,58.392,3.696,0.594937
_objective_d78da_00001,3,0.658228,0.638323,1.3484,58.587,3.708,0.658228
_objective_d78da_00002,5,0.582278,0.68181,1.3609,58.051,3.674,0.582278
_objective_d78da_00003,3,0.658228,0.665614,1.3564,58.241,3.686,0.658228
_objective_d78da_00004,3,0.417722,0.729034,1.2957,60.973,3.859,0.417722
_objective_d78da_00005,5,0.64557,0.978692,1.3023,60.664,3.839,0.64557
_objective_d78da_00006,3,0.556962,0.691389,1.304,60.585,3.834,0.556962
_objective_d78da_00007,1,0.594937,0.686077,1.2951,60.998,3.861,0.594937
_objective_d78da_00008,1,0.594937,0.676401,1.307,60.444,3.826,0.594937
_objective_d78da_00009,3,0.582278,0.6885,1.2959,60.962,3.858,0.582278


[36m(_objective pid=7911)[0m 
                                                  
 20%|██        | 287/1435 [00:23<01:23, 13.69it/s]
100%|██████████| 5/5 [00:01<00:00,  4.23it/s][A
                                             [A
 20%|██        | 289/1435 [00:23<05:19,  3.58it/s]


[36m(_objective pid=7911)[0m {'eval_loss': 0.6991307735443115, 'eval_accuracy': 0.45569620253164556, 'eval_runtime': 1.3655, 'eval_samples_per_second': 57.855, 'eval_steps_per_second': 3.662, 'epoch': 1.0}


 20%|██        | 291/1435 [00:23<04:09,  4.58it/s]
 20%|██        | 293/1435 [00:23<03:20,  5.69it/s]
 21%|██        | 295/1435 [00:23<02:46,  6.84it/s]
 21%|██        | 297/1435 [00:23<02:22,  7.96it/s]
 21%|██        | 299/1435 [00:24<02:05,  9.03it/s]
 21%|██        | 301/1435 [00:24<01:54,  9.91it/s]
 21%|██        | 303/1435 [00:24<01:45, 10.70it/s]
 21%|██▏       | 305/1435 [00:24<01:39, 11.33it/s]
 21%|██▏       | 307/1435 [00:24<01:34, 11.93it/s]
 22%|██▏       | 309/1435 [00:24<01:31, 12.29it/s]
 22%|██▏       | 311/1435 [00:24<01:29, 12.55it/s]
 22%|██▏       | 313/1435 [00:25<01:27, 12.81it/s]
 22%|██▏       | 315/1435 [00:25<01:26, 12.93it/s]
 22%|██▏       | 317/1435 [00:25<01:26, 12.91it/s]
 22%|██▏       | 319/1435 [00:25<01:26, 12.87it/s]
 22%|██▏       | 321/1435 [00:25<01:26, 12.85it/s]
 23%|██▎       | 323/1435 [00:25<01:26, 12.88it/s]
 23%|██▎       | 325/1435 [00:26<01:25, 12.91it/s]
 23%|██▎       | 327/1435 [00:26<01:26, 12.88it/s]


== Status ==
Current time: 2024-03-07 21:25:46 (running for 00:00:35.49)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (14 PENDING, 1 RUNNING)
+------------------------+----------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status   | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |          |                 |                 |                    |                ch_size |                |             |
|------------------------+----------+-----------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00000 | RUNNING  | 172.19.0.1:7911 |     5.61152e-06 |                  5 |    

 23%|██▎       | 329/1435 [00:26<01:25, 12.88it/s]
 23%|██▎       | 331/1435 [00:26<01:24, 13.02it/s]
 23%|██▎       | 333/1435 [00:26<01:23, 13.22it/s]
 23%|██▎       | 335/1435 [00:26<01:23, 13.15it/s]
 23%|██▎       | 337/1435 [00:26<01:23, 13.12it/s]
 24%|██▎       | 339/1435 [00:27<01:23, 13.07it/s]
 24%|██▍       | 341/1435 [00:27<01:23, 13.09it/s]
 24%|██▍       | 343/1435 [00:27<01:23, 13.13it/s]
 24%|██▍       | 345/1435 [00:27<01:23, 13.07it/s]
 24%|██▍       | 347/1435 [00:27<01:23, 13.05it/s]
 24%|██▍       | 349/1435 [00:27<01:22, 13.20it/s]
 24%|██▍       | 351/1435 [00:27<01:21, 13.31it/s]
 25%|██▍       | 353/1435 [00:28<01:22, 13.14it/s]
 25%|██▍       | 355/1435 [00:28<01:22, 13.07it/s]
 25%|██▍       | 357/1435 [00:28<01:22, 13.08it/s]
 25%|██▌       | 359/1435 [00:28<01:22, 13.11it/s]
 25%|██▌       | 361/1435 [00:28<01:21, 13.13it/s]
 25%|██▌       | 363/1435 [00:28<01:20, 13.29it/s]
 25%|██▌       | 365/1435 [00:29<01:20, 13.28it/s]
 26%|██▌       | 367/1435 [00:2

== Status ==
Current time: 2024-03-07 21:25:51 (running for 00:00:40.53)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (14 PENDING, 1 RUNNING)
+------------------------+----------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status   | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |          |                 |                 |                    |                ch_size |                |             |
|------------------------+----------+-----------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00000 | RUNNING  | 172.19.0.1:7911 |     5.61152e-06 |                  5 |    

 28%|██▊       | 399/1435 [00:31<01:15, 13.79it/s]
 28%|██▊       | 401/1435 [00:31<01:15, 13.62it/s]
 28%|██▊       | 403/1435 [00:31<01:15, 13.70it/s]
 28%|██▊       | 405/1435 [00:31<01:15, 13.68it/s]
 28%|██▊       | 407/1435 [00:32<01:15, 13.62it/s]
 29%|██▊       | 409/1435 [00:32<01:15, 13.68it/s]
 29%|██▊       | 411/1435 [00:32<01:14, 13.75it/s]
 29%|██▉       | 413/1435 [00:32<01:13, 13.81it/s]
 29%|██▉       | 415/1435 [00:32<01:13, 13.79it/s]
 29%|██▉       | 417/1435 [00:32<01:14, 13.73it/s]
 29%|██▉       | 419/1435 [00:32<01:14, 13.63it/s]
 29%|██▉       | 421/1435 [00:33<01:15, 13.44it/s]
 29%|██▉       | 423/1435 [00:33<01:16, 13.28it/s]
 30%|██▉       | 425/1435 [00:33<01:16, 13.25it/s]
 30%|██▉       | 427/1435 [00:33<01:16, 13.13it/s]
 30%|██▉       | 429/1435 [00:33<01:16, 13.09it/s]
 30%|███       | 431/1435 [00:33<01:16, 13.11it/s]
 30%|███       | 433/1435 [00:34<01:16, 13.13it/s]
 30%|███       | 435/1435 [00:34<01:16, 13.09it/s]
 30%|███       | 437/1435 [00:3

== Status ==
Current time: 2024-03-07 21:25:56 (running for 00:00:45.57)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (14 PENDING, 1 RUNNING)
+------------------------+----------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status   | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |          |                 |                 |                    |                ch_size |                |             |
|------------------------+----------+-----------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00000 | RUNNING  | 172.19.0.1:7911 |     5.61152e-06 |                  5 |    

 33%|███▎      | 467/1435 [00:36<01:13, 13.14it/s]
 33%|███▎      | 469/1435 [00:36<01:13, 13.16it/s]
 33%|███▎      | 471/1435 [00:36<01:13, 13.16it/s]
 33%|███▎      | 473/1435 [00:37<01:12, 13.19it/s]
 33%|███▎      | 475/1435 [00:37<01:13, 13.15it/s]
 33%|███▎      | 477/1435 [00:37<01:12, 13.18it/s]
 33%|███▎      | 479/1435 [00:37<01:12, 13.20it/s]
 34%|███▎      | 481/1435 [00:37<01:12, 13.20it/s]
 34%|███▎      | 483/1435 [00:37<01:11, 13.24it/s]
 34%|███▍      | 485/1435 [00:38<01:11, 13.22it/s]
 34%|███▍      | 487/1435 [00:38<01:11, 13.22it/s]
 34%|███▍      | 489/1435 [00:38<01:11, 13.22it/s]
 34%|███▍      | 491/1435 [00:38<01:11, 13.21it/s]
 34%|███▍      | 493/1435 [00:38<01:11, 13.21it/s]
 34%|███▍      | 495/1435 [00:38<01:11, 13.20it/s]
 35%|███▍      | 497/1435 [00:38<01:10, 13.22it/s]
 35%|███▍      | 499/1435 [00:39<01:10, 13.19it/s]
 35%|███▍      | 500/1435 [00:39<01:10, 13.19it/s]


[36m(_objective pid=7911)[0m {'loss': 0.7286, 'grad_norm': 23.829519271850586, 'learning_rate': 3.6562842148695235e-06, 'epoch': 1.74}


 35%|███▍      | 501/1435 [00:40<05:00,  3.11it/s]
 35%|███▌      | 503/1435 [00:41<03:50,  4.04it/s]
 35%|███▌      | 505/1435 [00:41<03:02,  5.10it/s]
 35%|███▌      | 507/1435 [00:41<02:28,  6.26it/s]


== Status ==
Current time: 2024-03-07 21:26:01 (running for 00:00:50.61)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (14 PENDING, 1 RUNNING)
+------------------------+----------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status   | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |          |                 |                 |                    |                ch_size |                |             |
|------------------------+----------+-----------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00000 | RUNNING  | 172.19.0.1:7911 |     5.61152e-06 |                  5 |    

 35%|███▌      | 509/1435 [00:41<02:04,  7.43it/s]
 36%|███▌      | 511/1435 [00:41<01:47,  8.57it/s]
 36%|███▌      | 513/1435 [00:41<01:36,  9.54it/s]
 36%|███▌      | 515/1435 [00:41<01:28, 10.43it/s]
 36%|███▌      | 517/1435 [00:42<01:22, 11.15it/s]
 36%|███▌      | 519/1435 [00:42<01:18, 11.68it/s]
 36%|███▋      | 521/1435 [00:42<01:15, 12.13it/s]
 36%|███▋      | 523/1435 [00:42<01:13, 12.48it/s]
 37%|███▋      | 525/1435 [00:42<01:11, 12.70it/s]
 37%|███▋      | 527/1435 [00:42<01:10, 12.81it/s]
 37%|███▋      | 529/1435 [00:42<01:10, 12.93it/s]
 37%|███▋      | 531/1435 [00:43<01:09, 12.99it/s]
 37%|███▋      | 533/1435 [00:43<01:09, 13.01it/s]
 37%|███▋      | 535/1435 [00:43<01:08, 13.11it/s]
 37%|███▋      | 537/1435 [00:43<01:08, 13.18it/s]
 38%|███▊      | 539/1435 [00:43<01:08, 13.13it/s]
 38%|███▊      | 541/1435 [00:43<01:07, 13.17it/s]
 38%|███▊      | 543/1435 [00:44<01:07, 13.14it/s]
 38%|███▊      | 545/1435 [00:44<01:07, 13.12it/s]
 38%|███▊      | 547/1435 [00:4

== Status ==
Current time: 2024-03-07 21:26:06 (running for 00:00:55.65)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (14 PENDING, 1 RUNNING)
+------------------------+----------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status   | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |          |                 |                 |                    |                ch_size |                |             |
|------------------------+----------+-----------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00000 | RUNNING  | 172.19.0.1:7911 |     5.61152e-06 |                  5 |    

[36m(_objective pid=7911)[0m 
  0%|          | 0/5 [00:00<?, ?it/s][A
[36m(_objective pid=7911)[0m 
 40%|████      | 2/5 [00:00<00:00,  7.26it/s][A
[36m(_objective pid=7911)[0m 
 60%|██████    | 3/5 [00:00<00:00,  5.13it/s][A
[36m(_objective pid=7911)[0m 
 80%|████████  | 4/5 [00:00<00:00,  4.44it/s][A
[36m(_objective pid=7911)[0m 
                                                  
 40%|████      | 574/1435 [00:47<01:05, 13.16it/s]
100%|██████████| 5/5 [00:01<00:00,  4.26it/s][A
                                             [A
 40%|████      | 575/1435 [00:47<04:00,  3.57it/s]


[36m(_objective pid=7911)[0m {'eval_loss': 0.6752414703369141, 'eval_accuracy': 0.569620253164557, 'eval_runtime': 1.3655, 'eval_samples_per_second': 57.853, 'eval_steps_per_second': 3.662, 'epoch': 2.0}


 40%|████      | 577/1435 [00:47<03:08,  4.56it/s]
 40%|████      | 579/1435 [00:48<02:30,  5.67it/s]
 40%|████      | 581/1435 [00:48<02:04,  6.84it/s]
 41%|████      | 583/1435 [00:48<01:46,  8.01it/s]
 41%|████      | 585/1435 [00:48<01:33,  9.07it/s]
 41%|████      | 587/1435 [00:48<01:24, 10.02it/s]
 41%|████      | 589/1435 [00:48<01:18, 10.77it/s]
 41%|████      | 591/1435 [00:49<01:14, 11.40it/s]
 41%|████▏     | 593/1435 [00:49<01:10, 11.90it/s]
 41%|████▏     | 595/1435 [00:49<01:08, 12.29it/s]
 42%|████▏     | 597/1435 [00:49<01:06, 12.56it/s]
 42%|████▏     | 599/1435 [00:49<01:05, 12.77it/s]
 42%|████▏     | 601/1435 [00:49<01:04, 12.89it/s]
 42%|████▏     | 603/1435 [00:49<01:03, 13.00it/s]
 42%|████▏     | 605/1435 [00:50<01:03, 13.09it/s]
 42%|████▏     | 607/1435 [00:50<01:03, 13.11it/s]
 42%|████▏     | 609/1435 [00:50<01:02, 13.14it/s]
 43%|████▎     | 611/1435 [00:50<01:02, 13.16it/s]
 43%|████▎     | 613/1435 [00:50<01:02, 13.21it/s]
 43%|████▎     | 615/1435 [00:5

== Status ==
Current time: 2024-03-07 21:26:12 (running for 00:01:01.15)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (14 PENDING, 1 RUNNING)
+------------------------+----------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status   | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |          |                 |                 |                    |                ch_size |                |             |
|------------------------+----------+-----------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00000 | RUNNING  | 172.19.0.1:7911 |     5.61152e-06 |                  5 |    

 44%|████▍     | 629/1435 [00:51<01:00, 13.22it/s]
 44%|████▍     | 631/1435 [00:52<01:00, 13.21it/s]
 44%|████▍     | 633/1435 [00:52<01:00, 13.24it/s]
 44%|████▍     | 635/1435 [00:52<01:00, 13.22it/s]
 44%|████▍     | 637/1435 [00:52<01:00, 13.23it/s]
 45%|████▍     | 639/1435 [00:52<01:00, 13.23it/s]
 45%|████▍     | 641/1435 [00:52<01:00, 13.21it/s]
 45%|████▍     | 643/1435 [00:52<00:59, 13.23it/s]
 45%|████▍     | 645/1435 [00:53<00:59, 13.20it/s]
 45%|████▌     | 647/1435 [00:53<00:59, 13.19it/s]
 45%|████▌     | 649/1435 [00:53<00:59, 13.21it/s]
 45%|████▌     | 651/1435 [00:53<00:59, 13.23it/s]
 46%|████▌     | 653/1435 [00:53<00:58, 13.27it/s]
 46%|████▌     | 655/1435 [00:53<00:58, 13.23it/s]
 46%|████▌     | 657/1435 [00:54<00:58, 13.21it/s]
 46%|████▌     | 659/1435 [00:54<00:58, 13.19it/s]
 46%|████▌     | 661/1435 [00:54<00:58, 13.15it/s]
 46%|████▌     | 663/1435 [00:54<00:58, 13.16it/s]
 46%|████▋     | 665/1435 [00:54<00:58, 13.18it/s]
 46%|████▋     | 667/1435 [00:5

== Status ==
Current time: 2024-03-07 21:26:17 (running for 00:01:06.19)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (14 PENDING, 1 RUNNING)
+------------------------+----------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status   | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |          |                 |                 |                    |                ch_size |                |             |
|------------------------+----------+-----------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00000 | RUNNING  | 172.19.0.1:7911 |     5.61152e-06 |                  5 |    

 49%|████▊     | 697/1435 [00:57<00:56, 13.15it/s]
 49%|████▊     | 699/1435 [00:57<00:55, 13.16it/s]
 49%|████▉     | 701/1435 [00:57<00:55, 13.17it/s]
 49%|████▉     | 703/1435 [00:57<00:55, 13.17it/s]
 49%|████▉     | 705/1435 [00:57<00:55, 13.15it/s]
 49%|████▉     | 707/1435 [00:57<00:55, 13.12it/s]
 49%|████▉     | 709/1435 [00:57<00:55, 13.12it/s]
 50%|████▉     | 711/1435 [00:58<00:55, 13.16it/s]
 50%|████▉     | 713/1435 [00:58<00:54, 13.15it/s]
 50%|████▉     | 715/1435 [00:58<00:54, 13.16it/s]
 50%|████▉     | 717/1435 [00:58<00:54, 13.17it/s]
 50%|█████     | 719/1435 [00:58<00:54, 13.19it/s]
 50%|█████     | 721/1435 [00:58<00:54, 13.17it/s]
 50%|█████     | 723/1435 [00:59<00:54, 13.17it/s]
 51%|█████     | 725/1435 [00:59<00:53, 13.21it/s]
 51%|█████     | 727/1435 [00:59<00:53, 13.26it/s]
 51%|█████     | 729/1435 [00:59<00:53, 13.28it/s]
 51%|█████     | 731/1435 [00:59<00:53, 13.28it/s]
 51%|█████     | 733/1435 [00:59<00:52, 13.28it/s]
 51%|█████     | 735/1435 [00:5

== Status ==
Current time: 2024-03-07 21:26:22 (running for 00:01:11.24)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (14 PENDING, 1 RUNNING)
+------------------------+----------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status   | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |          |                 |                 |                    |                ch_size |                |             |
|------------------------+----------+-----------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00000 | RUNNING  | 172.19.0.1:7911 |     5.61152e-06 |                  5 |    

 53%|█████▎    | 765/1435 [01:02<00:50, 13.23it/s]
 53%|█████▎    | 767/1435 [01:02<00:50, 13.23it/s]
 54%|█████▎    | 769/1435 [01:02<00:50, 13.19it/s]
 54%|█████▎    | 771/1435 [01:02<00:50, 13.22it/s]
 54%|█████▍    | 773/1435 [01:02<00:50, 13.23it/s]
 54%|█████▍    | 775/1435 [01:02<00:49, 13.20it/s]
 54%|█████▍    | 777/1435 [01:03<00:49, 13.24it/s]
 54%|█████▍    | 779/1435 [01:03<00:49, 13.25it/s]
 54%|█████▍    | 781/1435 [01:03<00:49, 13.26it/s]
 55%|█████▍    | 783/1435 [01:03<00:49, 13.24it/s]
 55%|█████▍    | 785/1435 [01:03<00:48, 13.29it/s]
 55%|█████▍    | 787/1435 [01:03<00:48, 13.30it/s]
 55%|█████▍    | 789/1435 [01:04<00:48, 13.28it/s]
 55%|█████▌    | 791/1435 [01:04<00:48, 13.29it/s]
 55%|█████▌    | 793/1435 [01:04<00:48, 13.30it/s]
 55%|█████▌    | 795/1435 [01:04<00:47, 13.33it/s]
 56%|█████▌    | 797/1435 [01:04<00:47, 13.33it/s]
 56%|█████▌    | 799/1435 [01:04<00:47, 13.32it/s]
 56%|█████▌    | 801/1435 [01:04<00:47, 13.34it/s]
 56%|█████▌    | 803/1435 [01:0

== Status ==
Current time: 2024-03-07 21:26:27 (running for 00:01:16.27)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (14 PENDING, 1 RUNNING)
+------------------------+----------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status   | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |          |                 |                 |                    |                ch_size |                |             |
|------------------------+----------+-----------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00000 | RUNNING  | 172.19.0.1:7911 |     5.61152e-06 |                  5 |    

 58%|█████▊    | 833/1435 [01:07<00:45, 13.30it/s]
 58%|█████▊    | 835/1435 [01:07<00:45, 13.31it/s]
 58%|█████▊    | 837/1435 [01:07<00:45, 13.24it/s]
 58%|█████▊    | 839/1435 [01:07<00:45, 13.24it/s]
 59%|█████▊    | 841/1435 [01:07<00:44, 13.26it/s]
 59%|█████▊    | 843/1435 [01:08<00:44, 13.24it/s]
 59%|█████▉    | 845/1435 [01:08<00:44, 13.16it/s]
 59%|█████▉    | 847/1435 [01:08<00:44, 13.20it/s]
 59%|█████▉    | 849/1435 [01:08<00:44, 13.21it/s]
 59%|█████▉    | 851/1435 [01:08<00:44, 13.26it/s]
 59%|█████▉    | 853/1435 [01:08<00:43, 13.26it/s]
 60%|█████▉    | 855/1435 [01:08<00:43, 13.23it/s]
 60%|█████▉    | 857/1435 [01:09<00:43, 13.26it/s]
 60%|█████▉    | 859/1435 [01:09<00:43, 13.16it/s]
 60%|██████    | 861/1435 [01:09<00:43, 13.22it/s]
[36m(_objective pid=7911)[0m 
  0%|          | 0/5 [00:00<?, ?it/s][A
[36m(_objective pid=7911)[0m 
 40%|████      | 2/5 [00:00<00:00,  7.27it/s][A
[36m(_objective pid=7911)[0m 
 60%|██████    | 3/5 [00:00<00:00,  5.14it/s][A


[36m(_objective pid=7911)[0m {'eval_loss': 0.6709446907043457, 'eval_accuracy': 0.5822784810126582, 'eval_runtime': 1.3585, 'eval_samples_per_second': 58.154, 'eval_steps_per_second': 3.681, 'epoch': 3.0}


 60%|██████    | 865/1435 [01:11<02:04,  4.57it/s]
 60%|██████    | 867/1435 [01:11<01:39,  5.68it/s]
 61%|██████    | 869/1435 [01:11<01:22,  6.86it/s]
 61%|██████    | 871/1435 [01:11<01:10,  8.00it/s]
 61%|██████    | 873/1435 [01:11<01:01,  9.09it/s]
 61%|██████    | 875/1435 [01:11<00:55, 10.04it/s]
 61%|██████    | 877/1435 [01:12<00:51, 10.83it/s]
 61%|██████▏   | 879/1435 [01:12<00:48, 11.42it/s]


== Status ==
Current time: 2024-03-07 21:26:32 (running for 00:01:21.37)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (14 PENDING, 1 RUNNING)
+------------------------+----------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status   | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |          |                 |                 |                    |                ch_size |                |             |
|------------------------+----------+-----------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00000 | RUNNING  | 172.19.0.1:7911 |     5.61152e-06 |                  5 |    

 61%|██████▏   | 881/1435 [01:12<00:46, 11.92it/s]
 62%|██████▏   | 883/1435 [01:12<00:44, 12.30it/s]
 62%|██████▏   | 885/1435 [01:12<00:43, 12.59it/s]
 62%|██████▏   | 887/1435 [01:12<00:42, 12.76it/s]
 62%|██████▏   | 889/1435 [01:12<00:42, 12.93it/s]
 62%|██████▏   | 891/1435 [01:13<00:41, 13.02it/s]
 62%|██████▏   | 893/1435 [01:13<00:41, 13.10it/s]
 62%|██████▏   | 895/1435 [01:13<00:41, 13.16it/s]
 63%|██████▎   | 897/1435 [01:13<00:40, 13.21it/s]
 63%|██████▎   | 899/1435 [01:13<00:40, 13.24it/s]
 63%|██████▎   | 901/1435 [01:13<00:40, 13.23it/s]
 63%|██████▎   | 903/1435 [01:13<00:40, 13.24it/s]
 63%|██████▎   | 905/1435 [01:14<00:40, 13.21it/s]
 63%|██████▎   | 907/1435 [01:14<00:39, 13.22it/s]
 63%|██████▎   | 909/1435 [01:14<00:39, 13.26it/s]
 63%|██████▎   | 911/1435 [01:14<00:39, 13.25it/s]
 64%|██████▎   | 913/1435 [01:14<00:39, 13.25it/s]
 64%|██████▍   | 915/1435 [01:14<00:39, 13.28it/s]
 64%|██████▍   | 917/1435 [01:15<00:39, 13.22it/s]
 64%|██████▍   | 919/1435 [01:1

== Status ==
Current time: 2024-03-07 21:26:37 (running for 00:01:26.42)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (14 PENDING, 1 RUNNING)
+------------------------+----------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status   | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |          |                 |                 |                    |                ch_size |                |             |
|------------------------+----------+-----------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00000 | RUNNING  | 172.19.0.1:7911 |     5.61152e-06 |                  5 |    

 66%|██████▌   | 947/1435 [01:17<00:36, 13.22it/s]
 66%|██████▌   | 949/1435 [01:17<00:36, 13.22it/s]
 66%|██████▋   | 951/1435 [01:17<00:36, 13.23it/s]
 66%|██████▋   | 953/1435 [01:17<00:36, 13.26it/s]
 67%|██████▋   | 955/1435 [01:17<00:36, 13.28it/s]
 67%|██████▋   | 957/1435 [01:18<00:35, 13.28it/s]
 67%|██████▋   | 959/1435 [01:18<00:35, 13.25it/s]
 67%|██████▋   | 961/1435 [01:18<00:35, 13.29it/s]
 67%|██████▋   | 963/1435 [01:18<00:35, 13.26it/s]
 67%|██████▋   | 965/1435 [01:18<00:35, 13.26it/s]
 67%|██████▋   | 967/1435 [01:18<00:35, 13.30it/s]
 68%|██████▊   | 969/1435 [01:18<00:35, 13.29it/s]
 68%|██████▊   | 971/1435 [01:19<00:34, 13.28it/s]
 68%|██████▊   | 973/1435 [01:19<00:34, 13.23it/s]
 68%|██████▊   | 975/1435 [01:19<00:34, 13.24it/s]
 68%|██████▊   | 977/1435 [01:19<00:34, 13.23it/s]
 68%|██████▊   | 979/1435 [01:19<00:34, 13.21it/s]
 68%|██████▊   | 981/1435 [01:19<00:34, 13.28it/s]
 69%|██████▊   | 983/1435 [01:20<00:34, 13.27it/s]
 69%|██████▊   | 985/1435 [01:2

[36m(_objective pid=7911)[0m {'loss': 0.6371, 'grad_norm': 31.128156661987305, 'learning_rate': 1.7010520144045377e-06, 'epoch': 3.48}
== Status ==
Current time: 2024-03-07 21:26:42 (running for 00:01:31.47)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (14 PENDING, 1 RUNNING)
+------------------------+----------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status   | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |          |                 |                 |                    |                ch_size |                |             |
|------------------------+----------+-----------------+-----------------+--------------------+------------------

 70%|██████▉   | 1001/1435 [01:22<02:16,  3.17it/s]
 70%|██████▉   | 1003/1435 [01:23<01:45,  4.11it/s]
 70%|███████   | 1005/1435 [01:23<01:23,  5.18it/s]
 70%|███████   | 1007/1435 [01:23<01:07,  6.34it/s]
 70%|███████   | 1009/1435 [01:23<00:56,  7.52it/s]
 70%|███████   | 1011/1435 [01:23<00:48,  8.65it/s]
 71%|███████   | 1013/1435 [01:23<00:43,  9.68it/s]
 71%|███████   | 1015/1435 [01:24<00:39, 10.55it/s]
 71%|███████   | 1017/1435 [01:24<00:37, 11.22it/s]
 71%|███████   | 1019/1435 [01:24<00:35, 11.77it/s]
 71%|███████   | 1021/1435 [01:24<00:33, 12.22it/s]
 71%|███████▏  | 1023/1435 [01:24<00:32, 12.50it/s]
 71%|███████▏  | 1025/1435 [01:24<00:32, 12.62it/s]
 72%|███████▏  | 1027/1435 [01:24<00:31, 12.87it/s]
 72%|███████▏  | 1029/1435 [01:25<00:31, 13.02it/s]
 72%|███████▏  | 1031/1435 [01:25<00:31, 13.02it/s]
 72%|███████▏  | 1033/1435 [01:25<00:30, 13.09it/s]
 72%|███████▏  | 1035/1435 [01:25<00:30, 13.17it/s]
 72%|███████▏  | 1037/1435 [01:25<00:30, 13.26it/s]
 72%|███████

== Status ==
Current time: 2024-03-07 21:26:47 (running for 00:01:36.51)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (14 PENDING, 1 RUNNING)
+------------------------+----------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status   | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |          |                 |                 |                    |                ch_size |                |             |
|------------------------+----------+-----------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00000 | RUNNING  | 172.19.0.1:7911 |     5.61152e-06 |                  5 |    

 74%|███████▍  | 1059/1435 [01:27<00:28, 13.31it/s]
 74%|███████▍  | 1061/1435 [01:27<00:27, 13.36it/s]
 74%|███████▍  | 1063/1435 [01:27<00:27, 13.31it/s]
 74%|███████▍  | 1065/1435 [01:27<00:27, 13.33it/s]
 74%|███████▍  | 1067/1435 [01:27<00:27, 13.33it/s]
 74%|███████▍  | 1069/1435 [01:28<00:27, 13.34it/s]
 75%|███████▍  | 1071/1435 [01:28<00:27, 13.28it/s]
 75%|███████▍  | 1073/1435 [01:28<00:27, 13.31it/s]
 75%|███████▍  | 1075/1435 [01:28<00:27, 13.33it/s]
 75%|███████▌  | 1077/1435 [01:28<00:26, 13.33it/s]
 75%|███████▌  | 1079/1435 [01:28<00:26, 13.35it/s]
 75%|███████▌  | 1081/1435 [01:28<00:26, 13.26it/s]
 75%|███████▌  | 1083/1435 [01:29<00:26, 13.28it/s]
 76%|███████▌  | 1085/1435 [01:29<00:26, 13.24it/s]
 76%|███████▌  | 1087/1435 [01:29<00:26, 13.29it/s]
 76%|███████▌  | 1089/1435 [01:29<00:26, 13.27it/s]
 76%|███████▌  | 1091/1435 [01:29<00:25, 13.29it/s]
 76%|███████▌  | 1093/1435 [01:29<00:25, 13.28it/s]
 76%|███████▋  | 1095/1435 [01:30<00:25, 13.28it/s]
 76%|███████

== Status ==
Current time: 2024-03-07 21:26:52 (running for 00:01:41.55)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (14 PENDING, 1 RUNNING)
+------------------------+----------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status   | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |          |                 |                 |                    |                ch_size |                |             |
|------------------------+----------+-----------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00000 | RUNNING  | 172.19.0.1:7911 |     5.61152e-06 |                  5 |    

 79%|███████▊  | 1129/1435 [01:32<00:23, 13.29it/s]
 79%|███████▉  | 1131/1435 [01:32<00:22, 13.33it/s]
 79%|███████▉  | 1133/1435 [01:32<00:22, 13.31it/s]
 79%|███████▉  | 1135/1435 [01:33<00:22, 13.30it/s]
 79%|███████▉  | 1137/1435 [01:33<00:22, 13.33it/s]
 79%|███████▉  | 1139/1435 [01:33<00:22, 13.29it/s]
 80%|███████▉  | 1141/1435 [01:33<00:22, 13.33it/s]
 80%|███████▉  | 1143/1435 [01:33<00:21, 13.32it/s]
 80%|███████▉  | 1145/1435 [01:33<00:22, 13.13it/s]
 80%|███████▉  | 1147/1435 [01:33<00:21, 13.14it/s]
[36m(_objective pid=7911)[0m 
  0%|          | 0/5 [00:00<?, ?it/s][A
[36m(_objective pid=7911)[0m 
 40%|████      | 2/5 [00:00<00:00,  7.32it/s][A
[36m(_objective pid=7911)[0m 
 60%|██████    | 3/5 [00:00<00:00,  5.14it/s][A
[36m(_objective pid=7911)[0m 
 80%|████████  | 4/5 [00:00<00:00,  4.45it/s][A
[36m(_objective pid=7911)[0m 
                                                   
 80%|████████  | 1148/1435 [01:35<00:21, 13.14it/s]
100%|██████████| 5/5 [00:01<

[36m(_objective pid=7911)[0m {'eval_loss': 0.783547043800354, 'eval_accuracy': 0.6075949367088608, 'eval_runtime': 1.366, 'eval_samples_per_second': 57.833, 'eval_steps_per_second': 3.66, 'epoch': 4.0}


 80%|████████  | 1151/1435 [01:35<01:02,  4.54it/s]
 80%|████████  | 1153/1435 [01:35<00:49,  5.66it/s]
 80%|████████  | 1155/1435 [01:35<00:41,  6.82it/s]
 81%|████████  | 1157/1435 [01:36<00:34,  7.95it/s]
 81%|████████  | 1159/1435 [01:36<00:30,  9.02it/s]
 81%|████████  | 1161/1435 [01:36<00:27,  9.97it/s]
 81%|████████  | 1163/1435 [01:36<00:25, 10.79it/s]
 81%|████████  | 1165/1435 [01:36<00:23, 11.46it/s]
 81%|████████▏ | 1167/1435 [01:36<00:22, 11.91it/s]
 81%|████████▏ | 1169/1435 [01:37<00:21, 12.31it/s]
 82%|████████▏ | 1171/1435 [01:37<00:20, 12.57it/s]
 82%|████████▏ | 1173/1435 [01:37<00:20, 12.77it/s]


== Status ==
Current time: 2024-03-07 21:26:57 (running for 00:01:46.59)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (14 PENDING, 1 RUNNING)
+------------------------+----------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status   | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |          |                 |                 |                    |                ch_size |                |             |
|------------------------+----------+-----------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00000 | RUNNING  | 172.19.0.1:7911 |     5.61152e-06 |                  5 |    

 82%|████████▏ | 1175/1435 [01:37<00:20, 12.92it/s]
 82%|████████▏ | 1177/1435 [01:37<00:19, 13.02it/s]
 82%|████████▏ | 1179/1435 [01:37<00:19, 13.16it/s]
 82%|████████▏ | 1181/1435 [01:37<00:19, 13.22it/s]
 82%|████████▏ | 1183/1435 [01:38<00:19, 13.21it/s]
 83%|████████▎ | 1185/1435 [01:38<00:18, 13.26it/s]
 83%|████████▎ | 1187/1435 [01:38<00:18, 13.26it/s]
 83%|████████▎ | 1189/1435 [01:38<00:18, 13.31it/s]
 83%|████████▎ | 1191/1435 [01:38<00:18, 13.31it/s]
 83%|████████▎ | 1193/1435 [01:38<00:18, 13.35it/s]
 83%|████████▎ | 1195/1435 [01:38<00:17, 13.35it/s]
 83%|████████▎ | 1197/1435 [01:39<00:17, 13.39it/s]
 84%|████████▎ | 1199/1435 [01:39<00:17, 13.31it/s]
 84%|████████▎ | 1201/1435 [01:39<00:17, 13.29it/s]
 84%|████████▍ | 1203/1435 [01:39<00:17, 13.34it/s]
 84%|████████▍ | 1205/1435 [01:39<00:17, 13.36it/s]
 84%|████████▍ | 1207/1435 [01:39<00:17, 13.34it/s]
 84%|████████▍ | 1209/1435 [01:40<00:16, 13.30it/s]
 84%|████████▍ | 1211/1435 [01:40<00:16, 13.33it/s]
 85%|███████

== Status ==
Current time: 2024-03-07 21:27:02 (running for 00:01:51.63)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (14 PENDING, 1 RUNNING)
+------------------------+----------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status   | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |          |                 |                 |                    |                ch_size |                |             |
|------------------------+----------+-----------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00000 | RUNNING  | 172.19.0.1:7911 |     5.61152e-06 |                  5 |    

 87%|████████▋ | 1245/1435 [01:42<00:14, 13.30it/s]
 87%|████████▋ | 1247/1435 [01:42<00:14, 13.31it/s]
 87%|████████▋ | 1249/1435 [01:43<00:13, 13.32it/s]
 87%|████████▋ | 1251/1435 [01:43<00:13, 13.34it/s]
 87%|████████▋ | 1253/1435 [01:43<00:13, 13.35it/s]
 87%|████████▋ | 1255/1435 [01:43<00:13, 13.31it/s]
 88%|████████▊ | 1257/1435 [01:43<00:13, 13.34it/s]
 88%|████████▊ | 1259/1435 [01:43<00:13, 13.36it/s]
 88%|████████▊ | 1261/1435 [01:43<00:13, 13.32it/s]
 88%|████████▊ | 1263/1435 [01:44<00:12, 13.31it/s]
 88%|████████▊ | 1265/1435 [01:44<00:12, 13.32it/s]
 88%|████████▊ | 1267/1435 [01:44<00:12, 13.33it/s]
 88%|████████▊ | 1269/1435 [01:44<00:12, 13.29it/s]
 89%|████████▊ | 1271/1435 [01:44<00:12, 13.30it/s]
 89%|████████▊ | 1273/1435 [01:44<00:12, 13.34it/s]
 89%|████████▉ | 1275/1435 [01:44<00:12, 13.30it/s]
 89%|████████▉ | 1277/1435 [01:45<00:11, 13.33it/s]
 89%|████████▉ | 1279/1435 [01:45<00:11, 13.31it/s]
 89%|████████▉ | 1281/1435 [01:45<00:11, 13.29it/s]
 89%|███████

== Status ==
Current time: 2024-03-07 21:27:07 (running for 00:01:56.67)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (14 PENDING, 1 RUNNING)
+------------------------+----------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status   | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |          |                 |                 |                    |                ch_size |                |             |
|------------------------+----------+-----------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00000 | RUNNING  | 172.19.0.1:7911 |     5.61152e-06 |                  5 |    

 91%|█████████▏| 1311/1435 [01:47<00:09, 13.34it/s]
 91%|█████████▏| 1313/1435 [01:47<00:09, 13.36it/s]
 92%|█████████▏| 1315/1435 [01:47<00:08, 13.35it/s]
 92%|█████████▏| 1317/1435 [01:48<00:08, 13.37it/s]
 92%|█████████▏| 1319/1435 [01:48<00:08, 13.33it/s]
 92%|█████████▏| 1321/1435 [01:48<00:08, 13.31it/s]
 92%|█████████▏| 1323/1435 [01:48<00:08, 13.32it/s]
 92%|█████████▏| 1325/1435 [01:48<00:08, 13.35it/s]
 92%|█████████▏| 1327/1435 [01:48<00:08, 13.33it/s]
 93%|█████████▎| 1329/1435 [01:49<00:07, 13.32it/s]
 93%|█████████▎| 1331/1435 [01:49<00:07, 13.31it/s]
 93%|█████████▎| 1333/1435 [01:49<00:07, 13.29it/s]
 93%|█████████▎| 1335/1435 [01:49<00:07, 13.28it/s]
 93%|█████████▎| 1337/1435 [01:49<00:07, 13.24it/s]
 93%|█████████▎| 1339/1435 [01:49<00:07, 13.28it/s]
 93%|█████████▎| 1341/1435 [01:49<00:07, 13.29it/s]
 94%|█████████▎| 1343/1435 [01:50<00:06, 13.26it/s]
 94%|█████████▎| 1345/1435 [01:50<00:06, 13.30it/s]
 94%|█████████▍| 1347/1435 [01:50<00:06, 13.32it/s]
 94%|███████

== Status ==
Current time: 2024-03-07 21:27:12 (running for 00:02:01.71)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (14 PENDING, 1 RUNNING)
+------------------------+----------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status   | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |          |                 |                 |                    |                ch_size |                |             |
|------------------------+----------+-----------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00000 | RUNNING  | 172.19.0.1:7911 |     5.61152e-06 |                  5 |    

 96%|█████████▌| 1377/1435 [01:52<00:04, 13.30it/s]
 96%|█████████▌| 1379/1435 [01:52<00:04, 13.33it/s]
 96%|█████████▌| 1381/1435 [01:52<00:04, 13.33it/s]
 96%|█████████▋| 1383/1435 [01:53<00:03, 13.28it/s]
 97%|█████████▋| 1385/1435 [01:53<00:03, 13.30it/s]
 97%|█████████▋| 1387/1435 [01:53<00:03, 13.35it/s]
 97%|█████████▋| 1389/1435 [01:53<00:03, 13.33it/s]
 97%|█████████▋| 1391/1435 [01:53<00:03, 13.36it/s]
 97%|█████████▋| 1393/1435 [01:53<00:03, 13.36it/s]
 97%|█████████▋| 1395/1435 [01:53<00:02, 13.35it/s]
 97%|█████████▋| 1397/1435 [01:54<00:02, 13.36it/s]
 97%|█████████▋| 1399/1435 [01:54<00:02, 13.30it/s]
 98%|█████████▊| 1401/1435 [01:54<00:02, 13.32it/s]
 98%|█████████▊| 1403/1435 [01:54<00:02, 13.33it/s]
 98%|█████████▊| 1405/1435 [01:54<00:02, 13.39it/s]
 98%|█████████▊| 1407/1435 [01:54<00:02, 13.41it/s]
 98%|█████████▊| 1409/1435 [01:55<00:01, 13.42it/s]
 98%|█████████▊| 1411/1435 [01:55<00:01, 13.42it/s]
 98%|█████████▊| 1413/1435 [01:55<00:01, 13.43it/s]
 99%|███████

== Status ==
Current time: 2024-03-07 21:27:17 (running for 00:02:06.75)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (14 PENDING, 1 RUNNING)
+------------------------+----------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status   | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |          |                 |                 |                    |                ch_size |                |             |
|------------------------+----------+-----------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00000 | RUNNING  | 172.19.0.1:7911 |     5.61152e-06 |                  5 |    

[36m(_objective pid=7911)[0m 
 60%|██████    | 3/5 [00:00<00:00,  5.12it/s][A
[36m(_objective pid=7911)[0m 
 80%|████████  | 4/5 [00:00<00:00,  4.46it/s][A
[36m(_objective pid=7911)[0m 
                                                   
100%|██████████| 1435/1435 [01:58<00:00, 13.38it/s]
100%|██████████| 5/5 [00:01<00:00,  4.30it/s][A
100%|██████████| 1435/1435 [01:58<00:00, 12.13it/s]


[36m(_objective pid=7911)[0m {'eval_loss': 0.8510650396347046, 'eval_accuracy': 0.5949367088607594, 'eval_runtime': 1.3529, 'eval_samples_per_second': 58.392, 'eval_steps_per_second': 3.696, 'epoch': 5.0}
[36m(_objective pid=7911)[0m {'train_runtime': 118.3276, 'train_samples_per_second': 12.127, 'train_steps_per_second': 12.127, 'train_loss': 0.6640387664688588, 'epoch': 5.0}
== Status ==
Current time: 2024-03-07 21:27:22 (running for 00:02:11.83)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (14 PENDING, 1 TERMINATED)
+------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|        

[36m(_objective pid=8293)[0m 2024-03-07 21:27:24.653061: E external/local_xla/xla/stream_executor/cuda/cuda_dnn.cc:9261] Unable to register cuDNN factory: Attempting to register factory for plugin cuDNN when one has already been registered
[36m(_objective pid=8293)[0m 2024-03-07 21:27:24.653113: E external/local_xla/xla/stream_executor/cuda/cuda_fft.cc:607] Unable to register cuFFT factory: Attempting to register factory for plugin cuFFT when one has already been registered
[36m(_objective pid=8293)[0m 2024-03-07 21:27:24.654370: E external/local_xla/xla/stream_executor/cuda/cuda_blas.cc:1515] Unable to register cuBLAS factory: Attempting to register factory for plugin cuBLAS when one has already been registered
[36m(_objective pid=8293)[0m Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']

== Status ==
Current time: 2024-03-07 21:27:27 (running for 00:02:16.92)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (13 PENDING, 1 RUNNING, 1 TERMINATED)
+------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                 |                 |                    |                ch_size |                |             |
|------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00001 | RUNNING    | 172.19.0.1:8293 |     1.57513e-05 | 

  0%|          | 0/108 [00:00<?, ?it/s]
  1%|          | 1/108 [00:00<01:05,  1.62it/s]
  2%|▏         | 2/108 [00:00<00:50,  2.11it/s]
  3%|▎         | 3/108 [00:01<00:45,  2.31it/s]
  4%|▎         | 4/108 [00:01<00:42,  2.43it/s]
  5%|▍         | 5/108 [00:02<00:40,  2.52it/s]
  6%|▌         | 6/108 [00:02<00:39,  2.56it/s]
  6%|▋         | 7/108 [00:02<00:38,  2.60it/s]
  7%|▋         | 8/108 [00:03<00:37,  2.63it/s]
  8%|▊         | 9/108 [00:03<00:37,  2.64it/s]
  9%|▉         | 10/108 [00:03<00:36,  2.65it/s]
 10%|█         | 11/108 [00:04<00:36,  2.66it/s]
 11%|█         | 12/108 [00:04<00:36,  2.66it/s]


== Status ==
Current time: 2024-03-07 21:27:32 (running for 00:02:21.95)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (13 PENDING, 1 RUNNING, 1 TERMINATED)
+------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                 |                 |                    |                ch_size |                |             |
|------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00001 | RUNNING    | 172.19.0.1:8293 |     1.57513e-05 | 

 12%|█▏        | 13/108 [00:05<00:35,  2.66it/s]
 13%|█▎        | 14/108 [00:05<00:35,  2.66it/s]
 14%|█▍        | 15/108 [00:05<00:34,  2.67it/s]
 15%|█▍        | 16/108 [00:06<00:34,  2.67it/s]
 16%|█▌        | 17/108 [00:06<00:34,  2.67it/s]
 17%|█▋        | 18/108 [00:06<00:33,  2.67it/s]
 18%|█▊        | 19/108 [00:07<00:33,  2.64it/s]
 19%|█▊        | 20/108 [00:07<00:33,  2.64it/s]
 19%|█▉        | 21/108 [00:08<00:32,  2.64it/s]
 20%|██        | 22/108 [00:08<00:32,  2.65it/s]
 21%|██▏       | 23/108 [00:08<00:32,  2.65it/s]
 22%|██▏       | 24/108 [00:09<00:31,  2.65it/s]
 23%|██▎       | 25/108 [00:09<00:31,  2.64it/s]


== Status ==
Current time: 2024-03-07 21:27:37 (running for 00:02:27.00)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (13 PENDING, 1 RUNNING, 1 TERMINATED)
+------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                 |                 |                    |                ch_size |                |             |
|------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00001 | RUNNING    | 172.19.0.1:8293 |     1.57513e-05 | 

 24%|██▍       | 26/108 [00:10<00:30,  2.66it/s]
 25%|██▌       | 27/108 [00:10<00:30,  2.67it/s]
 26%|██▌       | 28/108 [00:10<00:30,  2.66it/s]
 27%|██▋       | 29/108 [00:11<00:29,  2.66it/s]
 28%|██▊       | 30/108 [00:11<00:29,  2.67it/s]
 29%|██▊       | 31/108 [00:11<00:28,  2.68it/s]
 30%|██▉       | 32/108 [00:12<00:28,  2.67it/s]
 31%|███       | 33/108 [00:12<00:28,  2.65it/s]
 31%|███▏      | 34/108 [00:13<00:28,  2.62it/s]
 32%|███▏      | 35/108 [00:13<00:27,  2.63it/s]
 33%|███▎      | 36/108 [00:13<00:26,  2.73it/s]
[36m(_objective pid=8293)[0m 
  0%|          | 0/5 [00:00<?, ?it/s][A
[36m(_objective pid=8293)[0m 
 40%|████      | 2/5 [00:00<00:00,  7.25it/s][A
[36m(_objective pid=8293)[0m 
 60%|██████    | 3/5 [00:00<00:00,  5.15it/s][A
[36m(_objective pid=8293)[0m 
 80%|████████  | 4/5 [00:00<00:00,  4.36it/s][A


== Status ==
Current time: 2024-03-07 21:27:42 (running for 00:02:32.04)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (13 PENDING, 1 RUNNING, 1 TERMINATED)
+------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                 |                 |                    |                ch_size |                |             |
|------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00001 | RUNNING    | 172.19.0.1:8293 |     1.57513e-05 | 

[36m(_objective pid=8293)[0m 
                                                
 33%|███▎      | 36/108 [00:15<00:26,  2.73it/s]
100%|██████████| 5/5 [00:01<00:00,  4.21it/s][A
                                             [A
 34%|███▍      | 37/108 [00:15<00:55,  1.27it/s]
 35%|███▌      | 38/108 [00:15<00:46,  1.51it/s]
 36%|███▌      | 39/108 [00:16<00:39,  1.73it/s]
 37%|███▋      | 40/108 [00:16<00:35,  1.93it/s]
 38%|███▊      | 41/108 [00:17<00:31,  2.10it/s]
 39%|███▉      | 42/108 [00:17<00:29,  2.24it/s]
 40%|███▉      | 43/108 [00:17<00:27,  2.35it/s]
 41%|████      | 44/108 [00:18<00:26,  2.44it/s]
 42%|████▏     | 45/108 [00:18<00:25,  2.50it/s]
 43%|████▎     | 46/108 [00:18<00:24,  2.54it/s]
 44%|████▎     | 47/108 [00:19<00:23,  2.58it/s]
 44%|████▍     | 48/108 [00:19<00:22,  2.62it/s]
 45%|████▌     | 49/108 [00:20<00:22,  2.63it/s]


== Status ==
Current time: 2024-03-07 21:27:48 (running for 00:02:37.11)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (13 PENDING, 1 RUNNING, 1 TERMINATED)
+------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                 |                 |                    |                ch_size |                |             |
|------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00001 | RUNNING    | 172.19.0.1:8293 |     1.57513e-05 | 

 46%|████▋     | 50/108 [00:20<00:21,  2.65it/s]
 47%|████▋     | 51/108 [00:20<00:21,  2.66it/s]
 48%|████▊     | 52/108 [00:21<00:21,  2.66it/s]
 49%|████▉     | 53/108 [00:21<00:20,  2.66it/s]
 50%|█████     | 54/108 [00:21<00:20,  2.66it/s]
 51%|█████     | 55/108 [00:22<00:19,  2.66it/s]
 52%|█████▏    | 56/108 [00:22<00:19,  2.66it/s]
 53%|█████▎    | 57/108 [00:23<00:19,  2.67it/s]
 54%|█████▎    | 58/108 [00:23<00:18,  2.66it/s]
 55%|█████▍    | 59/108 [00:23<00:18,  2.67it/s]
 56%|█████▌    | 60/108 [00:24<00:17,  2.68it/s]
 56%|█████▋    | 61/108 [00:24<00:17,  2.67it/s]
 57%|█████▋    | 62/108 [00:24<00:17,  2.68it/s]


== Status ==
Current time: 2024-03-07 21:27:53 (running for 00:02:42.15)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (13 PENDING, 1 RUNNING, 1 TERMINATED)
+------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                 |                 |                    |                ch_size |                |             |
|------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00001 | RUNNING    | 172.19.0.1:8293 |     1.57513e-05 | 

 58%|█████▊    | 63/108 [00:25<00:16,  2.68it/s]
 59%|█████▉    | 64/108 [00:25<00:16,  2.67it/s]
 60%|██████    | 65/108 [00:26<00:16,  2.67it/s]
 61%|██████    | 66/108 [00:26<00:15,  2.67it/s]
 62%|██████▏   | 67/108 [00:26<00:15,  2.67it/s]
 63%|██████▎   | 68/108 [00:27<00:14,  2.67it/s]
 64%|██████▍   | 69/108 [00:27<00:14,  2.67it/s]
 65%|██████▍   | 70/108 [00:27<00:14,  2.67it/s]
 66%|██████▌   | 71/108 [00:28<00:13,  2.68it/s]
 67%|██████▋   | 72/108 [00:28<00:13,  2.77it/s]
[36m(_objective pid=8293)[0m 
  0%|          | 0/5 [00:00<?, ?it/s][A
[36m(_objective pid=8293)[0m 
 40%|████      | 2/5 [00:00<00:00,  7.31it/s][A
[36m(_objective pid=8293)[0m 
 60%|██████    | 3/5 [00:00<00:00,  5.14it/s][A
[36m(_objective pid=8293)[0m 
 80%|████████  | 4/5 [00:00<00:00,  4.45it/s][A
[36m(_objective pid=8293)[0m 
                                                
 67%|██████▋   | 72/108 [00:29<00:13,  2.77it/s]
100%|██████████| 5/5 [00:01<00:00,  4.30it/s][A
               

[36m(_objective pid=8293)[0m {'eval_loss': 0.6520819067955017, 'eval_accuracy': 0.620253164556962, 'eval_runtime': 1.3529, 'eval_samples_per_second': 58.394, 'eval_steps_per_second': 3.696, 'epoch': 2.0}
== Status ==
Current time: 2024-03-07 21:27:58 (running for 00:02:47.19)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (13 PENDING, 1 RUNNING, 1 TERMINATED)
+------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                 |                 |                    |                ch_size |                |             |
|----------------------

 68%|██████▊   | 73/108 [00:30<00:27,  1.29it/s]
 69%|██████▊   | 74/108 [00:30<00:22,  1.53it/s]
 69%|██████▉   | 75/108 [00:31<00:18,  1.76it/s]
 70%|███████   | 76/108 [00:31<00:16,  1.96it/s]
 71%|███████▏  | 77/108 [00:31<00:14,  2.13it/s]
 72%|███████▏  | 78/108 [00:32<00:13,  2.27it/s]
 73%|███████▎  | 79/108 [00:32<00:12,  2.38it/s]
 74%|███████▍  | 80/108 [00:32<00:11,  2.46it/s]
 75%|███████▌  | 81/108 [00:33<00:10,  2.52it/s]
 76%|███████▌  | 82/108 [00:33<00:10,  2.56it/s]
 77%|███████▋  | 83/108 [00:34<00:09,  2.60it/s]
 78%|███████▊  | 84/108 [00:34<00:09,  2.62it/s]
 79%|███████▊  | 85/108 [00:34<00:08,  2.63it/s]
 80%|███████▉  | 86/108 [00:35<00:08,  2.64it/s]


== Status ==
Current time: 2024-03-07 21:28:03 (running for 00:02:52.23)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (13 PENDING, 1 RUNNING, 1 TERMINATED)
+------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                 |                 |                    |                ch_size |                |             |
|------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00001 | RUNNING    | 172.19.0.1:8293 |     1.57513e-05 | 

 81%|████████  | 87/108 [00:35<00:07,  2.66it/s]
 81%|████████▏ | 88/108 [00:35<00:07,  2.66it/s]
 82%|████████▏ | 89/108 [00:36<00:07,  2.66it/s]
 83%|████████▎ | 90/108 [00:36<00:06,  2.67it/s]
 84%|████████▍ | 91/108 [00:37<00:06,  2.68it/s]
 85%|████████▌ | 92/108 [00:37<00:05,  2.68it/s]
 86%|████████▌ | 93/108 [00:37<00:05,  2.68it/s]
 87%|████████▋ | 94/108 [00:38<00:05,  2.69it/s]
 88%|████████▊ | 95/108 [00:38<00:04,  2.68it/s]
 89%|████████▉ | 96/108 [00:38<00:04,  2.68it/s]
 90%|████████▉ | 97/108 [00:39<00:04,  2.68it/s]
 91%|█████████ | 98/108 [00:39<00:03,  2.68it/s]
 92%|█████████▏| 99/108 [00:40<00:03,  2.68it/s]


== Status ==
Current time: 2024-03-07 21:28:08 (running for 00:02:57.27)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (13 PENDING, 1 RUNNING, 1 TERMINATED)
+------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                 |                 |                    |                ch_size |                |             |
|------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00001 | RUNNING    | 172.19.0.1:8293 |     1.57513e-05 | 

 93%|█████████▎| 100/108 [00:40<00:02,  2.67it/s]
 94%|█████████▎| 101/108 [00:40<00:02,  2.68it/s]
 94%|█████████▍| 102/108 [00:41<00:02,  2.68it/s]
 95%|█████████▌| 103/108 [00:41<00:01,  2.68it/s]
 96%|█████████▋| 104/108 [00:41<00:01,  2.68it/s]
 97%|█████████▋| 105/108 [00:42<00:01,  2.68it/s]
 98%|█████████▊| 106/108 [00:42<00:00,  2.68it/s]
 99%|█████████▉| 107/108 [00:43<00:00,  2.68it/s]
100%|██████████| 108/108 [00:43<00:00,  2.77it/s]
[36m(_objective pid=8293)[0m 
  0%|          | 0/5 [00:00<?, ?it/s][A
[36m(_objective pid=8293)[0m 
 40%|████      | 2/5 [00:00<00:00,  7.33it/s][A
[36m(_objective pid=8293)[0m 
 60%|██████    | 3/5 [00:00<00:00,  5.16it/s][A
[36m(_objective pid=8293)[0m 
 80%|████████  | 4/5 [00:00<00:00,  4.49it/s][A
[36m(_objective pid=8293)[0m 
                                                 
100%|██████████| 108/108 [00:44<00:00,  2.77it/s]
100%|██████████| 5/5 [00:01<00:00,  4.31it/s][A
100%|██████████| 108/108 [00:44<00:00,  2.42it/s]


[36m(_objective pid=8293)[0m {'eval_loss': 0.6383227705955505, 'eval_accuracy': 0.6582278481012658, 'eval_runtime': 1.3484, 'eval_samples_per_second': 58.587, 'eval_steps_per_second': 3.708, 'epoch': 3.0}
[36m(_objective pid=8293)[0m {'train_runtime': 44.7115, 'train_samples_per_second': 19.257, 'train_steps_per_second': 2.415, 'train_loss': 0.6556137226246022, 'epoch': 3.0}
== Status ==
Current time: 2024-03-07 21:28:13 (running for 00:03:02.36)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (13 PENDING, 2 TERMINATED)
+------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|          

[36m(_objective pid=8488)[0m 2024-03-07 21:28:18.638261: E external/local_xla/xla/stream_executor/cuda/cuda_dnn.cc:9261] Unable to register cuDNN factory: Attempting to register factory for plugin cuDNN when one has already been registered
[36m(_objective pid=8488)[0m 2024-03-07 21:28:18.638315: E external/local_xla/xla/stream_executor/cuda/cuda_fft.cc:607] Unable to register cuFFT factory: Attempting to register factory for plugin cuFFT when one has already been registered
[36m(_objective pid=8488)[0m 2024-03-07 21:28:18.639673: E external/local_xla/xla/stream_executor/cuda/cuda_blas.cc:1515] Unable to register cuBLAS factory: Attempting to register factory for plugin cuBLAS when one has already been registered
[36m(_objective pid=8488)[0m Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']

== Status ==
Current time: 2024-03-07 21:28:23 (running for 00:03:12.50)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (12 PENDING, 1 RUNNING, 2 TERMINATED)
+------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                 |                 |                    |                ch_size |                |             |
|------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00002 | RUNNING    | 172.19.0.1:8488 |     1.30667e-06 | 

  1%|▏         | 21/1435 [00:01<01:47, 13.16it/s]
  2%|▏         | 23/1435 [00:01<01:46, 13.21it/s]
  2%|▏         | 25/1435 [00:02<01:47, 13.15it/s]
  2%|▏         | 27/1435 [00:02<01:46, 13.23it/s]
  2%|▏         | 29/1435 [00:02<01:45, 13.27it/s]
  2%|▏         | 31/1435 [00:02<01:45, 13.26it/s]
  2%|▏         | 33/1435 [00:02<01:45, 13.24it/s]
  2%|▏         | 35/1435 [00:02<01:45, 13.29it/s]
  3%|▎         | 37/1435 [00:03<01:45, 13.30it/s]
  3%|▎         | 39/1435 [00:03<01:45, 13.27it/s]
  3%|▎         | 41/1435 [00:03<01:45, 13.22it/s]
  3%|▎         | 43/1435 [00:03<01:45, 13.19it/s]
  3%|▎         | 45/1435 [00:03<01:45, 13.17it/s]
  3%|▎         | 47/1435 [00:03<01:44, 13.25it/s]
  3%|▎         | 49/1435 [00:03<01:44, 13.29it/s]
  4%|▎         | 51/1435 [00:04<01:43, 13.34it/s]
  4%|▎         | 53/1435 [00:04<01:43, 13.29it/s]
  4%|▍         | 55/1435 [00:04<01:43, 13.29it/s]
  4%|▍         | 57/1435 [00:04<01:43, 13.29it/s]
  4%|▍         | 59/1435 [00:04<01:43, 13.30it/s]


== Status ==
Current time: 2024-03-07 21:28:28 (running for 00:03:17.54)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (12 PENDING, 1 RUNNING, 2 TERMINATED)
+------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                 |                 |                    |                ch_size |                |             |
|------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00002 | RUNNING    | 172.19.0.1:8488 |     1.30667e-06 | 

  6%|▌         | 87/1435 [00:06<01:41, 13.32it/s]
  6%|▌         | 89/1435 [00:06<01:41, 13.32it/s]
  6%|▋         | 91/1435 [00:07<01:40, 13.34it/s]
  6%|▋         | 93/1435 [00:07<01:40, 13.33it/s]
  7%|▋         | 95/1435 [00:07<01:40, 13.31it/s]
  7%|▋         | 97/1435 [00:07<01:40, 13.37it/s]
  7%|▋         | 99/1435 [00:07<01:40, 13.34it/s]
  7%|▋         | 101/1435 [00:07<01:40, 13.34it/s]
  7%|▋         | 103/1435 [00:07<01:39, 13.36it/s]
  7%|▋         | 105/1435 [00:08<01:39, 13.39it/s]
  7%|▋         | 107/1435 [00:08<01:39, 13.36it/s]
  8%|▊         | 109/1435 [00:08<01:39, 13.33it/s]
  8%|▊         | 111/1435 [00:08<01:39, 13.31it/s]
  8%|▊         | 113/1435 [00:08<01:39, 13.30it/s]
  8%|▊         | 115/1435 [00:08<01:39, 13.28it/s]
  8%|▊         | 117/1435 [00:09<01:39, 13.25it/s]
  8%|▊         | 119/1435 [00:09<01:38, 13.32it/s]
  8%|▊         | 121/1435 [00:09<01:38, 13.34it/s]
  9%|▊         | 123/1435 [00:09<01:38, 13.37it/s]
  9%|▊         | 125/1435 [00:09<01:38

== Status ==
Current time: 2024-03-07 21:28:33 (running for 00:03:22.58)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (12 PENDING, 1 RUNNING, 2 TERMINATED)
+------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                 |                 |                    |                ch_size |                |             |
|------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00002 | RUNNING    | 172.19.0.1:8488 |     1.30667e-06 | 

 11%|█         | 153/1435 [00:11<01:36, 13.28it/s]
 11%|█         | 155/1435 [00:11<01:35, 13.34it/s]
 11%|█         | 157/1435 [00:12<01:36, 13.29it/s]
 11%|█         | 159/1435 [00:12<01:35, 13.32it/s]
 11%|█         | 161/1435 [00:12<01:35, 13.37it/s]
 11%|█▏        | 163/1435 [00:12<01:35, 13.39it/s]
 11%|█▏        | 165/1435 [00:12<01:35, 13.33it/s]
 12%|█▏        | 167/1435 [00:12<01:34, 13.37it/s]
 12%|█▏        | 169/1435 [00:12<01:34, 13.38it/s]
 12%|█▏        | 171/1435 [00:13<01:34, 13.37it/s]
 12%|█▏        | 173/1435 [00:13<01:34, 13.31it/s]
 12%|█▏        | 175/1435 [00:13<01:34, 13.30it/s]
 12%|█▏        | 177/1435 [00:13<01:34, 13.28it/s]
 12%|█▏        | 179/1435 [00:13<01:34, 13.30it/s]
 13%|█▎        | 181/1435 [00:13<01:34, 13.30it/s]
 13%|█▎        | 183/1435 [00:13<01:34, 13.31it/s]
 13%|█▎        | 185/1435 [00:14<01:33, 13.33it/s]
 13%|█▎        | 187/1435 [00:14<01:33, 13.31it/s]
 13%|█▎        | 189/1435 [00:14<01:33, 13.28it/s]
 13%|█▎        | 191/1435 [00:1

== Status ==
Current time: 2024-03-07 21:28:38 (running for 00:03:27.61)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (12 PENDING, 1 RUNNING, 2 TERMINATED)
+------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                 |                 |                    |                ch_size |                |             |
|------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00002 | RUNNING    | 172.19.0.1:8488 |     1.30667e-06 | 

 16%|█▌        | 223/1435 [00:16<01:30, 13.36it/s]
 16%|█▌        | 225/1435 [00:17<01:30, 13.39it/s]
 16%|█▌        | 227/1435 [00:17<01:30, 13.36it/s]
 16%|█▌        | 229/1435 [00:17<01:30, 13.36it/s]
 16%|█▌        | 231/1435 [00:17<01:30, 13.32it/s]
 16%|█▌        | 233/1435 [00:17<01:30, 13.29it/s]
 16%|█▋        | 235/1435 [00:17<01:30, 13.32it/s]
 17%|█▋        | 237/1435 [00:18<01:29, 13.32it/s]
 17%|█▋        | 239/1435 [00:18<01:29, 13.34it/s]
 17%|█▋        | 241/1435 [00:18<01:29, 13.35it/s]
 17%|█▋        | 243/1435 [00:18<01:29, 13.37it/s]
 17%|█▋        | 245/1435 [00:18<01:29, 13.34it/s]
 17%|█▋        | 247/1435 [00:18<01:29, 13.33it/s]
 17%|█▋        | 249/1435 [00:18<01:29, 13.31it/s]
 17%|█▋        | 251/1435 [00:19<01:28, 13.32it/s]
 18%|█▊        | 253/1435 [00:19<01:28, 13.33it/s]
 18%|█▊        | 255/1435 [00:19<01:28, 13.32it/s]
 18%|█▊        | 257/1435 [00:19<01:28, 13.30it/s]
 18%|█▊        | 259/1435 [00:19<01:28, 13.33it/s]
 18%|█▊        | 261/1435 [00:1

== Status ==
Current time: 2024-03-07 21:28:43 (running for 00:03:32.64)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (12 PENDING, 1 RUNNING, 2 TERMINATED)
+------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                 |                 |                    |                ch_size |                |             |
|------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00002 | RUNNING    | 172.19.0.1:8488 |     1.30667e-06 | 

[36m(_objective pid=8488)[0m 
  0%|          | 0/5 [00:00<?, ?it/s][A
[36m(_objective pid=8488)[0m 
 40%|████      | 2/5 [00:00<00:00,  7.27it/s][A
[36m(_objective pid=8488)[0m 
 60%|██████    | 3/5 [00:00<00:00,  5.17it/s][A
[36m(_objective pid=8488)[0m 
 80%|████████  | 4/5 [00:00<00:00,  4.49it/s][A


[36m(_objective pid=8488)[0m {'eval_loss': 0.6920689940452576, 'eval_accuracy': 0.569620253164557, 'eval_runtime': 1.3604, 'eval_samples_per_second': 58.072, 'eval_steps_per_second': 3.675, 'epoch': 1.0}


[36m(_objective pid=8488)[0m 
                                                  
 20%|██        | 287/1435 [00:23<01:26, 13.29it/s]
100%|██████████| 5/5 [00:01<00:00,  4.31it/s][A
                                             [A
 20%|██        | 289/1435 [00:23<05:20,  3.57it/s]
 20%|██        | 291/1435 [00:23<04:10,  4.58it/s]
 20%|██        | 293/1435 [00:23<03:20,  5.70it/s]
 21%|██        | 295/1435 [00:23<02:45,  6.88it/s]
 21%|██        | 297/1435 [00:23<02:21,  8.04it/s]
 21%|██        | 299/1435 [00:24<02:04,  9.14it/s]
 21%|██        | 301/1435 [00:24<01:52, 10.10it/s]
 21%|██        | 303/1435 [00:24<01:45, 10.78it/s]
 21%|██▏       | 305/1435 [00:24<01:39, 11.31it/s]
 21%|██▏       | 307/1435 [00:24<01:36, 11.73it/s]
 22%|██▏       | 309/1435 [00:24<01:32, 12.16it/s]
 22%|██▏       | 311/1435 [00:24<01:29, 12.49it/s]
 22%|██▏       | 313/1435 [00:25<01:27, 12.76it/s]
 22%|██▏       | 315/1435 [00:25<01:26, 12.92it/s]
 22%|██▏       | 317/1435 [00:25<01:25, 13.07it/s]
 22

== Status ==
Current time: 2024-03-07 21:28:48 (running for 00:03:37.65)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (12 PENDING, 1 RUNNING, 2 TERMINATED)
+------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                 |                 |                    |                ch_size |                |             |
|------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00002 | RUNNING    | 172.19.0.1:8488 |     1.30667e-06 | 

 23%|██▎       | 337/1435 [00:26<01:22, 13.30it/s]
 24%|██▎       | 339/1435 [00:27<01:22, 13.34it/s]
 24%|██▍       | 341/1435 [00:27<01:21, 13.35it/s]
 24%|██▍       | 343/1435 [00:27<01:21, 13.33it/s]
 24%|██▍       | 345/1435 [00:27<01:21, 13.39it/s]
 24%|██▍       | 347/1435 [00:27<01:21, 13.38it/s]
 24%|██▍       | 349/1435 [00:27<01:21, 13.38it/s]
 24%|██▍       | 351/1435 [00:27<01:21, 13.34it/s]
 25%|██▍       | 353/1435 [00:28<01:21, 13.33it/s]
 25%|██▍       | 355/1435 [00:28<01:20, 13.34it/s]
 25%|██▍       | 357/1435 [00:28<01:20, 13.35it/s]
 25%|██▌       | 359/1435 [00:28<01:20, 13.33it/s]
 25%|██▌       | 361/1435 [00:28<01:20, 13.33it/s]
 25%|██▌       | 363/1435 [00:28<01:20, 13.35it/s]
 25%|██▌       | 365/1435 [00:29<01:20, 13.37it/s]
 26%|██▌       | 367/1435 [00:29<01:20, 13.33it/s]
 26%|██▌       | 369/1435 [00:29<01:19, 13.36it/s]
 26%|██▌       | 371/1435 [00:29<01:19, 13.39it/s]
 26%|██▌       | 373/1435 [00:29<01:19, 13.39it/s]
 26%|██▌       | 375/1435 [00:2

== Status ==
Current time: 2024-03-07 21:28:53 (running for 00:03:42.69)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (12 PENDING, 1 RUNNING, 2 TERMINATED)
+------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                 |                 |                    |                ch_size |                |             |
|------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00002 | RUNNING    | 172.19.0.1:8488 |     1.30667e-06 | 

 28%|██▊       | 403/1435 [00:31<01:17, 13.33it/s]
 28%|██▊       | 405/1435 [00:31<01:17, 13.34it/s]
 28%|██▊       | 407/1435 [00:32<01:17, 13.31it/s]
 29%|██▊       | 409/1435 [00:32<01:17, 13.18it/s]
 29%|██▊       | 411/1435 [00:32<01:17, 13.24it/s]
 29%|██▉       | 413/1435 [00:32<01:17, 13.24it/s]
 29%|██▉       | 415/1435 [00:32<01:16, 13.26it/s]
 29%|██▉       | 417/1435 [00:32<01:16, 13.29it/s]
 29%|██▉       | 419/1435 [00:33<01:16, 13.34it/s]
 29%|██▉       | 421/1435 [00:33<01:15, 13.36it/s]
 29%|██▉       | 423/1435 [00:33<01:15, 13.34it/s]
 30%|██▉       | 425/1435 [00:33<01:15, 13.36it/s]
 30%|██▉       | 427/1435 [00:33<01:15, 13.33it/s]
 30%|██▉       | 429/1435 [00:33<01:15, 13.33it/s]
 30%|███       | 431/1435 [00:33<01:15, 13.34it/s]
 30%|███       | 433/1435 [00:34<01:15, 13.33it/s]
 30%|███       | 435/1435 [00:34<01:15, 13.32it/s]
 30%|███       | 437/1435 [00:34<01:14, 13.36it/s]
 31%|███       | 439/1435 [00:34<01:14, 13.37it/s]
 31%|███       | 441/1435 [00:3

== Status ==
Current time: 2024-03-07 21:28:58 (running for 00:03:47.73)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (12 PENDING, 1 RUNNING, 2 TERMINATED)
+------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                 |                 |                    |                ch_size |                |             |
|------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00002 | RUNNING    | 172.19.0.1:8488 |     1.30667e-06 | 

 33%|███▎      | 469/1435 [00:36<01:12, 13.37it/s]
 33%|███▎      | 471/1435 [00:36<01:12, 13.34it/s]
 33%|███▎      | 473/1435 [00:37<01:12, 13.32it/s]
 33%|███▎      | 475/1435 [00:37<01:12, 13.29it/s]
 33%|███▎      | 477/1435 [00:37<01:12, 13.30it/s]
 33%|███▎      | 479/1435 [00:37<01:12, 13.27it/s]
 34%|███▎      | 481/1435 [00:37<01:11, 13.26it/s]
 34%|███▎      | 483/1435 [00:37<01:12, 13.18it/s]
 34%|███▍      | 485/1435 [00:38<01:11, 13.20it/s]
 34%|███▍      | 487/1435 [00:38<01:11, 13.25it/s]
 34%|███▍      | 489/1435 [00:38<01:11, 13.23it/s]
 34%|███▍      | 491/1435 [00:38<01:11, 13.28it/s]
 34%|███▍      | 493/1435 [00:38<01:10, 13.30it/s]
 34%|███▍      | 495/1435 [00:38<01:10, 13.31it/s]
 35%|███▍      | 497/1435 [00:38<01:10, 13.32it/s]


[36m(_objective pid=8488)[0m {'loss': 0.6954, 'grad_norm': 9.359814643859863, 'learning_rate': 8.513868423400589e-07, 'epoch': 1.74}


 35%|███▍      | 500/1435 [00:39<01:10, 13.33it/s]
 35%|███▍      | 501/1435 [00:40<04:55,  3.16it/s]
 35%|███▌      | 503/1435 [00:40<03:47,  4.10it/s]
 35%|███▌      | 505/1435 [00:41<02:59,  5.18it/s]
 35%|███▌      | 507/1435 [00:41<02:26,  6.35it/s]
 35%|███▌      | 509/1435 [00:41<02:02,  7.54it/s]
 36%|███▌      | 511/1435 [00:41<01:46,  8.67it/s]
 36%|███▌      | 513/1435 [00:41<01:35,  9.69it/s]


== Status ==
Current time: 2024-03-07 21:29:03 (running for 00:03:52.77)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (12 PENDING, 1 RUNNING, 2 TERMINATED)
+------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                 |                 |                    |                ch_size |                |             |
|------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00002 | RUNNING    | 172.19.0.1:8488 |     1.30667e-06 | 

 36%|███▌      | 515/1435 [00:41<01:27, 10.55it/s]
 36%|███▌      | 517/1435 [00:42<01:21, 11.26it/s]
 36%|███▌      | 519/1435 [00:42<01:17, 11.83it/s]
 36%|███▋      | 521/1435 [00:42<01:14, 12.20it/s]
 36%|███▋      | 523/1435 [00:42<01:12, 12.54it/s]
 37%|███▋      | 525/1435 [00:42<01:11, 12.74it/s]
 37%|███▋      | 527/1435 [00:42<01:10, 12.92it/s]
 37%|███▋      | 529/1435 [00:42<01:09, 13.04it/s]
 37%|███▋      | 531/1435 [00:43<01:08, 13.10it/s]
 37%|███▋      | 533/1435 [00:43<01:08, 13.19it/s]
 37%|███▋      | 535/1435 [00:43<01:07, 13.24it/s]
 37%|███▋      | 537/1435 [00:43<01:07, 13.25it/s]
 38%|███▊      | 539/1435 [00:43<01:07, 13.29it/s]
 38%|███▊      | 541/1435 [00:43<01:07, 13.32it/s]
 38%|███▊      | 543/1435 [00:43<01:06, 13.32it/s]
 38%|███▊      | 545/1435 [00:44<01:07, 13.26it/s]
 38%|███▊      | 547/1435 [00:44<01:06, 13.28it/s]
 38%|███▊      | 549/1435 [00:44<01:06, 13.32it/s]
 38%|███▊      | 551/1435 [00:44<01:06, 13.30it/s]
 39%|███▊      | 553/1435 [00:4

== Status ==
Current time: 2024-03-07 21:29:08 (running for 00:03:57.80)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (12 PENDING, 1 RUNNING, 2 TERMINATED)
+------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                 |                 |                    |                ch_size |                |             |
|------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00002 | RUNNING    | 172.19.0.1:8488 |     1.30667e-06 | 

[36m(_objective pid=8488)[0m 
 60%|██████    | 3/5 [00:00<00:00,  5.14it/s][A
[36m(_objective pid=8488)[0m 
 80%|████████  | 4/5 [00:00<00:00,  4.47it/s][A


[36m(_objective pid=8488)[0m {'eval_loss': 0.6895374655723572, 'eval_accuracy': 0.5569620253164557, 'eval_runtime': 1.3559, 'eval_samples_per_second': 58.262, 'eval_steps_per_second': 3.687, 'epoch': 2.0}


[36m(_objective pid=8488)[0m 
                                                  
 40%|████      | 574/1435 [00:47<01:04, 13.44it/s]
100%|██████████| 5/5 [00:01<00:00,  4.28it/s][A
 40%|████      | 575/1435 [00:47<03:58,  3.60it/s]
 40%|████      | 577/1435 [00:47<03:06,  4.61it/s]
 40%|████      | 579/1435 [00:48<02:29,  5.74it/s]
 40%|████      | 581/1435 [00:48<02:03,  6.93it/s]
 41%|████      | 583/1435 [00:48<01:45,  8.09it/s]
 41%|████      | 585/1435 [00:48<01:32,  9.17it/s]
 41%|████      | 587/1435 [00:48<01:23, 10.11it/s]
 41%|████      | 589/1435 [00:48<01:17, 10.89it/s]
 41%|████      | 591/1435 [00:48<01:13, 11.49it/s]
 41%|████▏     | 593/1435 [00:49<01:10, 11.99it/s]
 41%|████▏     | 595/1435 [00:49<01:07, 12.37it/s]
 42%|████▏     | 597/1435 [00:49<01:06, 12.65it/s]
 42%|████▏     | 599/1435 [00:49<01:05, 12.85it/s]
 42%|████▏     | 601/1435 [00:49<01:04, 12.99it/s]
 42%|████▏     | 603/1435 [00:49<01:03, 13.13it/s]
 42%|████▏     | 605/1435 [00:49<01:03, 13.17it/s]
 

== Status ==
Current time: 2024-03-07 21:29:13 (running for 00:04:02.85)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (12 PENDING, 1 RUNNING, 2 TERMINATED)
+------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                 |                 |                    |                ch_size |                |             |
|------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00002 | RUNNING    | 172.19.0.1:8488 |     1.30667e-06 | 

 44%|████▍     | 631/1435 [00:51<01:00, 13.28it/s]
 44%|████▍     | 633/1435 [00:52<01:00, 13.28it/s]
 44%|████▍     | 635/1435 [00:52<01:00, 13.30it/s]
 44%|████▍     | 637/1435 [00:52<01:00, 13.26it/s]
 45%|████▍     | 639/1435 [00:52<00:59, 13.27it/s]
 45%|████▍     | 641/1435 [00:52<00:59, 13.25it/s]
 45%|████▍     | 643/1435 [00:52<00:59, 13.30it/s]
 45%|████▍     | 645/1435 [00:52<00:59, 13.33it/s]
 45%|████▌     | 647/1435 [00:53<00:59, 13.33it/s]
 45%|████▌     | 649/1435 [00:53<01:37,  8.10it/s]
 45%|████▌     | 651/1435 [00:53<01:25,  9.16it/s]
 46%|████▌     | 653/1435 [00:53<01:17, 10.10it/s]
 46%|████▌     | 655/1435 [00:54<01:11, 10.86it/s]
 46%|████▌     | 657/1435 [00:54<01:07, 11.47it/s]
 46%|████▌     | 659/1435 [00:54<01:05, 11.80it/s]
 46%|████▌     | 661/1435 [00:54<01:04, 12.01it/s]
 46%|████▌     | 663/1435 [00:54<01:02, 12.34it/s]
 46%|████▋     | 665/1435 [00:54<01:01, 12.62it/s]
 46%|████▋     | 667/1435 [00:54<00:59, 12.87it/s]
 47%|████▋     | 669/1435 [00:5

== Status ==
Current time: 2024-03-07 21:29:18 (running for 00:04:07.86)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (12 PENDING, 1 RUNNING, 2 TERMINATED)
+------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                 |                 |                    |                ch_size |                |             |
|------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00002 | RUNNING    | 172.19.0.1:8488 |     1.30667e-06 | 

 48%|████▊     | 695/1435 [00:57<00:55, 13.22it/s]
 49%|████▊     | 697/1435 [00:57<00:55, 13.23it/s]
 49%|████▊     | 699/1435 [00:57<00:55, 13.22it/s]
 49%|████▉     | 701/1435 [00:57<00:55, 13.24it/s]
 49%|████▉     | 703/1435 [00:57<00:55, 13.25it/s]
 49%|████▉     | 705/1435 [00:57<00:54, 13.28it/s]
 49%|████▉     | 707/1435 [00:57<00:54, 13.27it/s]
 49%|████▉     | 709/1435 [00:58<00:54, 13.24it/s]
 50%|████▉     | 711/1435 [00:58<00:54, 13.25it/s]
 50%|████▉     | 713/1435 [00:58<00:54, 13.26it/s]
 50%|████▉     | 715/1435 [00:58<00:54, 13.23it/s]
 50%|████▉     | 717/1435 [00:58<00:54, 13.26it/s]
 50%|█████     | 719/1435 [00:58<00:53, 13.29it/s]
 50%|█████     | 721/1435 [00:59<00:53, 13.27it/s]
 50%|█████     | 723/1435 [00:59<00:53, 13.23it/s]
 51%|█████     | 725/1435 [00:59<00:53, 13.25it/s]
 51%|█████     | 727/1435 [00:59<00:53, 13.26it/s]
 51%|█████     | 729/1435 [00:59<00:53, 13.27it/s]
 51%|█████     | 731/1435 [00:59<00:52, 13.31it/s]
 51%|█████     | 733/1435 [00:5

== Status ==
Current time: 2024-03-07 21:29:23 (running for 00:04:12.91)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (12 PENDING, 1 RUNNING, 2 TERMINATED)
+------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                 |                 |                    |                ch_size |                |             |
|------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00002 | RUNNING    | 172.19.0.1:8488 |     1.30667e-06 | 

 53%|█████▎    | 761/1435 [01:02<00:50, 13.32it/s]
 53%|█████▎    | 763/1435 [01:02<00:50, 13.29it/s]
 53%|█████▎    | 765/1435 [01:02<00:50, 13.30it/s]
 53%|█████▎    | 767/1435 [01:02<00:50, 13.35it/s]
 54%|█████▎    | 769/1435 [01:02<00:50, 13.28it/s]
 54%|█████▎    | 771/1435 [01:02<00:49, 13.29it/s]
 54%|█████▍    | 773/1435 [01:02<00:49, 13.34it/s]
 54%|█████▍    | 775/1435 [01:03<00:49, 13.33it/s]
 54%|█████▍    | 777/1435 [01:03<00:49, 13.28it/s]
 54%|█████▍    | 779/1435 [01:03<00:49, 13.31it/s]
 54%|█████▍    | 781/1435 [01:03<00:49, 13.30it/s]
 55%|█████▍    | 783/1435 [01:03<00:49, 13.20it/s]
 55%|█████▍    | 785/1435 [01:03<00:49, 13.21it/s]
 55%|█████▍    | 787/1435 [01:04<00:49, 13.07it/s]
 55%|█████▍    | 789/1435 [01:04<00:48, 13.21it/s]
 55%|█████▌    | 791/1435 [01:04<00:48, 13.16it/s]
 55%|█████▌    | 793/1435 [01:04<00:48, 13.23it/s]
 55%|█████▌    | 795/1435 [01:04<00:48, 13.23it/s]
 56%|█████▌    | 797/1435 [01:04<00:47, 13.30it/s]
 56%|█████▌    | 799/1435 [01:0

== Status ==
Current time: 2024-03-07 21:29:28 (running for 00:04:17.95)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (12 PENDING, 1 RUNNING, 2 TERMINATED)
+------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                 |                 |                    |                ch_size |                |             |
|------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00002 | RUNNING    | 172.19.0.1:8488 |     1.30667e-06 | 

 58%|█████▊    | 829/1435 [01:07<00:45, 13.45it/s]
 58%|█████▊    | 831/1435 [01:07<00:44, 13.51it/s]
 58%|█████▊    | 833/1435 [01:07<00:44, 13.58it/s]
 58%|█████▊    | 835/1435 [01:07<00:44, 13.44it/s]
 58%|█████▊    | 837/1435 [01:07<00:45, 13.22it/s]
 58%|█████▊    | 839/1435 [01:07<00:46, 12.94it/s]
 59%|█████▊    | 841/1435 [01:08<00:45, 13.09it/s]
 59%|█████▊    | 843/1435 [01:08<00:45, 13.04it/s]
 59%|█████▉    | 845/1435 [01:08<00:44, 13.12it/s]
 59%|█████▉    | 847/1435 [01:08<00:44, 13.13it/s]
 59%|█████▉    | 849/1435 [01:08<00:44, 13.21it/s]
 59%|█████▉    | 851/1435 [01:08<00:44, 13.23it/s]
 59%|█████▉    | 853/1435 [01:09<00:43, 13.30it/s]
 60%|█████▉    | 855/1435 [01:09<00:43, 13.34it/s]
 60%|█████▉    | 857/1435 [01:09<00:43, 13.35it/s]
 60%|█████▉    | 859/1435 [01:09<00:43, 13.32it/s]
 60%|██████    | 861/1435 [01:09<00:43, 13.31it/s]
[36m(_objective pid=8488)[0m 
  0%|          | 0/5 [00:00<?, ?it/s][A
[36m(_objective pid=8488)[0m 
 40%|████      | 2/5 [00:00<

[36m(_objective pid=8488)[0m {'eval_loss': 0.6817010045051575, 'eval_accuracy': 0.6329113924050633, 'eval_runtime': 1.3569, 'eval_samples_per_second': 58.222, 'eval_steps_per_second': 3.685, 'epoch': 3.0}


[36m(_objective pid=8488)[0m 
                                                  
 60%|██████    | 861/1435 [01:10<00:43, 13.31it/s]
100%|██████████| 5/5 [00:01<00:00,  4.29it/s][A
                                             [A
 60%|██████    | 863/1435 [01:11<02:39,  3.59it/s]
 60%|██████    | 865/1435 [01:11<02:04,  4.59it/s]
 60%|██████    | 867/1435 [01:11<01:39,  5.72it/s]
 61%|██████    | 869/1435 [01:11<01:22,  6.89it/s]
 61%|██████    | 871/1435 [01:11<01:10,  8.05it/s]
 61%|██████    | 873/1435 [01:11<01:01,  9.12it/s]
 61%|██████    | 875/1435 [01:12<00:55, 10.09it/s]


== Status ==
Current time: 2024-03-07 21:29:33 (running for 00:04:22.97)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (12 PENDING, 1 RUNNING, 2 TERMINATED)
+------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                 |                 |                    |                ch_size |                |             |
|------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00002 | RUNNING    | 172.19.0.1:8488 |     1.30667e-06 | 

 61%|██████    | 877/1435 [01:12<00:51, 10.86it/s]
 61%|██████▏   | 879/1435 [01:12<00:48, 11.49it/s]
 61%|██████▏   | 881/1435 [01:12<00:46, 11.96it/s]
 62%|██████▏   | 883/1435 [01:12<00:44, 12.36it/s]
 62%|██████▏   | 885/1435 [01:12<00:43, 12.61it/s]
 62%|██████▏   | 887/1435 [01:12<00:42, 12.83it/s]
 62%|██████▏   | 889/1435 [01:13<00:42, 12.91it/s]
 62%|██████▏   | 891/1435 [01:13<00:41, 13.00it/s]
 62%|██████▏   | 893/1435 [01:13<00:41, 13.07it/s]
 62%|██████▏   | 895/1435 [01:13<00:41, 13.13it/s]
 63%|██████▎   | 897/1435 [01:13<00:41, 13.10it/s]
 63%|██████▎   | 899/1435 [01:13<00:40, 13.19it/s]
 63%|██████▎   | 901/1435 [01:13<00:40, 13.19it/s]
 63%|██████▎   | 903/1435 [01:14<00:40, 13.24it/s]
 63%|██████▎   | 905/1435 [01:14<00:40, 13.18it/s]
 63%|██████▎   | 907/1435 [01:14<00:39, 13.26it/s]
 63%|██████▎   | 909/1435 [01:14<00:39, 13.23it/s]
 63%|██████▎   | 911/1435 [01:14<00:39, 13.24it/s]
 64%|██████▎   | 913/1435 [01:14<00:39, 13.25it/s]
 64%|██████▍   | 915/1435 [01:1

== Status ==
Current time: 2024-03-07 21:29:38 (running for 00:04:28.01)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (12 PENDING, 1 RUNNING, 2 TERMINATED)
+------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                 |                 |                    |                ch_size |                |             |
|------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00002 | RUNNING    | 172.19.0.1:8488 |     1.30667e-06 | 

 66%|██████▌   | 943/1435 [01:17<00:36, 13.30it/s]
 66%|██████▌   | 945/1435 [01:17<00:36, 13.28it/s]
 66%|██████▌   | 947/1435 [01:17<00:36, 13.31it/s]
 66%|██████▌   | 949/1435 [01:17<00:36, 13.22it/s]
 66%|██████▋   | 951/1435 [01:17<00:36, 13.27it/s]
 66%|██████▋   | 953/1435 [01:17<00:36, 13.28it/s]
 67%|██████▋   | 955/1435 [01:18<00:36, 13.27it/s]
 67%|██████▋   | 957/1435 [01:18<00:35, 13.29it/s]
 67%|██████▋   | 959/1435 [01:18<00:35, 13.28it/s]
 67%|██████▋   | 961/1435 [01:18<00:35, 13.29it/s]
 67%|██████▋   | 963/1435 [01:18<00:35, 13.22it/s]
 67%|██████▋   | 965/1435 [01:18<00:35, 13.18it/s]
 67%|██████▋   | 967/1435 [01:18<00:35, 13.25it/s]
 68%|██████▊   | 969/1435 [01:19<00:35, 13.22it/s]
 68%|██████▊   | 971/1435 [01:19<00:35, 13.21it/s]
 68%|██████▊   | 973/1435 [01:19<00:34, 13.21it/s]
 68%|██████▊   | 975/1435 [01:19<00:34, 13.24it/s]
 68%|██████▊   | 977/1435 [01:19<00:34, 13.23it/s]
 68%|██████▊   | 979/1435 [01:19<00:34, 13.25it/s]
 68%|██████▊   | 981/1435 [01:2

[36m(_objective pid=8488)[0m {'loss': 0.6779, 'grad_norm': 12.433586120605469, 'learning_rate': 3.9609976087478676e-07, 'epoch': 3.48}
== Status ==
Current time: 2024-03-07 21:29:43 (running for 00:04:33.05)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (12 PENDING, 1 RUNNING, 2 TERMINATED)
+------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                 |                 |                    |                ch_size |                |             |
|------------------------+------------+-----------------+-----------------+-----------------

 70%|██████▉   | 1001/1435 [01:23<02:18,  3.12it/s]
 70%|██████▉   | 1003/1435 [01:23<01:46,  4.05it/s]
 70%|███████   | 1005/1435 [01:23<01:24,  5.12it/s]
 70%|███████   | 1007/1435 [01:23<01:08,  6.27it/s]
 70%|███████   | 1009/1435 [01:23<00:57,  7.46it/s]
 70%|███████   | 1011/1435 [01:23<00:49,  8.58it/s]
 71%|███████   | 1013/1435 [01:24<00:43,  9.62it/s]
 71%|███████   | 1015/1435 [01:24<00:40, 10.49it/s]
 71%|███████   | 1017/1435 [01:24<00:37, 11.20it/s]
 71%|███████   | 1019/1435 [01:24<00:35, 11.71it/s]
 71%|███████   | 1021/1435 [01:24<00:34, 12.17it/s]
 71%|███████▏  | 1023/1435 [01:24<00:33, 12.46it/s]
 71%|███████▏  | 1025/1435 [01:24<00:32, 12.74it/s]
 72%|███████▏  | 1027/1435 [01:25<00:31, 12.91it/s]
 72%|███████▏  | 1029/1435 [01:25<00:31, 13.05it/s]
 72%|███████▏  | 1031/1435 [01:25<00:30, 13.07it/s]
 72%|███████▏  | 1033/1435 [01:25<00:30, 13.15it/s]
 72%|███████▏  | 1035/1435 [01:25<00:30, 13.12it/s]
 72%|███████▏  | 1037/1435 [01:25<00:30, 13.18it/s]
 72%|███████

== Status ==
Current time: 2024-03-07 21:29:49 (running for 00:04:38.09)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (12 PENDING, 1 RUNNING, 2 TERMINATED)
+------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                 |                 |                    |                ch_size |                |             |
|------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00002 | RUNNING    | 172.19.0.1:8488 |     1.30667e-06 | 

 74%|███████▎  | 1055/1435 [01:27<00:28, 13.27it/s]
 74%|███████▎  | 1057/1435 [01:27<00:28, 13.26it/s]
 74%|███████▍  | 1059/1435 [01:27<00:28, 13.23it/s]
 74%|███████▍  | 1061/1435 [01:27<00:28, 13.26it/s]
 74%|███████▍  | 1063/1435 [01:27<00:28, 13.27it/s]
 74%|███████▍  | 1065/1435 [01:27<00:27, 13.22it/s]
 74%|███████▍  | 1067/1435 [01:28<00:27, 13.23it/s]
 74%|███████▍  | 1069/1435 [01:28<00:27, 13.29it/s]
 75%|███████▍  | 1071/1435 [01:28<00:27, 13.28it/s]
 75%|███████▍  | 1073/1435 [01:28<00:27, 13.30it/s]
 75%|███████▍  | 1075/1435 [01:28<00:27, 13.28it/s]
 75%|███████▌  | 1077/1435 [01:28<00:26, 13.33it/s]
 75%|███████▌  | 1079/1435 [01:29<00:26, 13.34it/s]
 75%|███████▌  | 1081/1435 [01:29<00:26, 13.29it/s]
 75%|███████▌  | 1083/1435 [01:29<00:26, 13.28it/s]
 76%|███████▌  | 1085/1435 [01:29<00:26, 13.28it/s]
 76%|███████▌  | 1087/1435 [01:29<00:26, 13.27it/s]
 76%|███████▌  | 1089/1435 [01:29<00:25, 13.32it/s]
 76%|███████▌  | 1091/1435 [01:29<00:25, 13.27it/s]
 76%|███████

== Status ==
Current time: 2024-03-07 21:29:54 (running for 00:04:43.13)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (12 PENDING, 1 RUNNING, 2 TERMINATED)
+------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                 |                 |                    |                ch_size |                |             |
|------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00002 | RUNNING    | 172.19.0.1:8488 |     1.30667e-06 | 

 78%|███████▊  | 1123/1435 [01:32<00:23, 13.15it/s]
 78%|███████▊  | 1125/1435 [01:32<00:23, 13.18it/s]
 79%|███████▊  | 1127/1435 [01:32<00:23, 13.15it/s]
 79%|███████▊  | 1129/1435 [01:32<00:23, 13.23it/s]
 79%|███████▉  | 1131/1435 [01:32<00:23, 13.21it/s]
 79%|███████▉  | 1133/1435 [01:33<00:22, 13.28it/s]
 79%|███████▉  | 1135/1435 [01:33<00:22, 13.26it/s]
 79%|███████▉  | 1137/1435 [01:33<00:22, 13.29it/s]
 79%|███████▉  | 1139/1435 [01:33<00:22, 13.24it/s]
 80%|███████▉  | 1141/1435 [01:33<00:22, 13.26it/s]
 80%|███████▉  | 1143/1435 [01:33<00:22, 13.23it/s]
 80%|███████▉  | 1145/1435 [01:34<00:21, 13.27it/s]
 80%|███████▉  | 1147/1435 [01:34<00:21, 13.26it/s]
[36m(_objective pid=8488)[0m 
  0%|          | 0/5 [00:00<?, ?it/s][A
[36m(_objective pid=8488)[0m 
 40%|████      | 2/5 [00:00<00:00,  7.29it/s][A
[36m(_objective pid=8488)[0m 
 60%|██████    | 3/5 [00:00<00:00,  5.12it/s][A
[36m(_objective pid=8488)[0m 
 80%|████████  | 4/5 [00:00<00:00,  4.46it/s][A


[36m(_objective pid=8488)[0m {'eval_loss': 0.6829280853271484, 'eval_accuracy': 0.5569620253164557, 'eval_runtime': 1.3605, 'eval_samples_per_second': 58.065, 'eval_steps_per_second': 3.675, 'epoch': 4.0}


[36m(_objective pid=8488)[0m 
                                                   
 80%|████████  | 1148/1435 [01:35<00:21, 13.26it/s]
100%|██████████| 5/5 [00:01<00:00,  4.28it/s][A
                                             [A
 80%|████████  | 1149/1435 [01:35<01:19,  3.59it/s]
 80%|████████  | 1151/1435 [01:35<01:02,  4.57it/s]
 80%|████████  | 1153/1435 [01:35<00:49,  5.69it/s]
 80%|████████  | 1155/1435 [01:36<00:40,  6.88it/s]
 81%|████████  | 1157/1435 [01:36<00:34,  8.03it/s]
 81%|████████  | 1159/1435 [01:36<00:30,  9.14it/s]
 81%|████████  | 1161/1435 [01:36<00:27, 10.04it/s]
 81%|████████  | 1163/1435 [01:36<00:25, 10.87it/s]
 81%|████████  | 1165/1435 [01:36<00:23, 11.48it/s]
 81%|████████▏ | 1167/1435 [01:37<00:22, 12.01it/s]
 81%|████████▏ | 1169/1435 [01:37<00:21, 12.38it/s]


== Status ==
Current time: 2024-03-07 21:29:59 (running for 00:04:48.20)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (12 PENDING, 1 RUNNING, 2 TERMINATED)
+------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                 |                 |                    |                ch_size |                |             |
|------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00002 | RUNNING    | 172.19.0.1:8488 |     1.30667e-06 | 

 82%|████████▏ | 1171/1435 [01:37<00:20, 12.62it/s]
 82%|████████▏ | 1173/1435 [01:37<00:20, 12.74it/s]
 82%|████████▏ | 1175/1435 [01:37<00:20, 12.91it/s]
 82%|████████▏ | 1177/1435 [01:37<00:19, 13.03it/s]
 82%|████████▏ | 1179/1435 [01:37<00:19, 13.10it/s]
 82%|████████▏ | 1181/1435 [01:38<00:19, 13.14it/s]
 82%|████████▏ | 1183/1435 [01:38<00:19, 13.21it/s]
 83%|████████▎ | 1185/1435 [01:38<00:18, 13.19it/s]
 83%|████████▎ | 1187/1435 [01:38<00:18, 13.14it/s]
 83%|████████▎ | 1189/1435 [01:38<00:18, 13.14it/s]
 83%|████████▎ | 1191/1435 [01:38<00:18, 13.21it/s]
 83%|████████▎ | 1193/1435 [01:39<00:18, 13.21it/s]
 83%|████████▎ | 1195/1435 [01:39<00:18, 13.23it/s]
 83%|████████▎ | 1197/1435 [01:39<00:17, 13.23it/s]
 84%|████████▎ | 1199/1435 [01:39<00:17, 13.28it/s]
 84%|████████▎ | 1201/1435 [01:39<00:17, 13.22it/s]
 84%|████████▍ | 1203/1435 [01:39<00:17, 13.20it/s]
 84%|████████▍ | 1205/1435 [01:39<00:17, 13.21it/s]
 84%|████████▍ | 1207/1435 [01:40<00:17, 13.27it/s]
 84%|███████

== Status ==
Current time: 2024-03-07 21:30:04 (running for 00:04:53.24)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (12 PENDING, 1 RUNNING, 2 TERMINATED)
+------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                 |                 |                    |                ch_size |                |             |
|------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00002 | RUNNING    | 172.19.0.1:8488 |     1.30667e-06 | 

 86%|████████▋ | 1239/1435 [01:42<00:14, 13.21it/s]
 86%|████████▋ | 1241/1435 [01:42<00:14, 13.24it/s]
 87%|████████▋ | 1243/1435 [01:42<00:14, 13.23it/s]
 87%|████████▋ | 1245/1435 [01:43<00:14, 13.28it/s]
 87%|████████▋ | 1247/1435 [01:43<00:14, 13.20it/s]
 87%|████████▋ | 1249/1435 [01:43<00:14, 13.26it/s]
 87%|████████▋ | 1251/1435 [01:43<00:13, 13.27it/s]
 87%|████████▋ | 1253/1435 [01:43<00:13, 13.22it/s]
 87%|████████▋ | 1255/1435 [01:43<00:13, 13.23it/s]
 88%|████████▊ | 1257/1435 [01:43<00:13, 13.30it/s]
 88%|████████▊ | 1259/1435 [01:44<00:13, 13.28it/s]
 88%|████████▊ | 1261/1435 [01:44<00:13, 13.25it/s]
 88%|████████▊ | 1263/1435 [01:44<00:13, 13.23it/s]
 88%|████████▊ | 1265/1435 [01:44<00:12, 13.28it/s]
 88%|████████▊ | 1267/1435 [01:44<00:12, 13.19it/s]
 88%|████████▊ | 1269/1435 [01:44<00:12, 13.21it/s]
 89%|████████▊ | 1271/1435 [01:44<00:12, 13.22it/s]
 89%|████████▉ | 1275/1435 [01:45<00:12, 13.21it/s]
 89%|████████▉ | 1277/1435 [01:46<00:25,  6.15it/s]
 89%|███████

== Status ==
Current time: 2024-03-07 21:30:09 (running for 00:04:58.28)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (12 PENDING, 1 RUNNING, 2 TERMINATED)
+------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                 |                 |                    |                ch_size |                |             |
|------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00002 | RUNNING    | 172.19.0.1:8488 |     1.30667e-06 | 

 90%|█████████ | 1295/1435 [01:47<00:11, 12.43it/s]
 90%|█████████ | 1297/1435 [01:47<00:10, 12.72it/s]
 91%|█████████ | 1299/1435 [01:47<00:10, 12.84it/s]
 91%|█████████ | 1301/1435 [01:47<00:10, 12.95it/s]
 91%|█████████ | 1303/1435 [01:47<00:10, 13.05it/s]
 91%|█████████ | 1305/1435 [01:48<00:09, 13.17it/s]
 91%|█████████ | 1307/1435 [01:48<00:09, 13.19it/s]
 91%|█████████ | 1309/1435 [01:48<00:09, 13.24it/s]
 91%|█████████▏| 1311/1435 [01:48<00:09, 13.23it/s]
 91%|█████████▏| 1313/1435 [01:48<00:09, 13.29it/s]
 92%|█████████▏| 1315/1435 [01:48<00:09, 13.28it/s]
 92%|█████████▏| 1317/1435 [01:49<00:08, 13.26it/s]
 92%|█████████▏| 1319/1435 [01:49<00:08, 13.27it/s]
 92%|█████████▏| 1321/1435 [01:49<00:08, 13.31it/s]
 92%|█████████▏| 1323/1435 [01:49<00:08, 13.30it/s]
 92%|█████████▏| 1325/1435 [01:49<00:08, 13.26it/s]
 92%|█████████▏| 1327/1435 [01:49<00:08, 13.24it/s]
 93%|█████████▎| 1329/1435 [01:49<00:07, 13.27it/s]
 93%|█████████▎| 1331/1435 [01:50<00:07, 13.21it/s]
 93%|███████

== Status ==
Current time: 2024-03-07 21:30:14 (running for 00:05:03.32)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (12 PENDING, 1 RUNNING, 2 TERMINATED)
+------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                 |                 |                    |                ch_size |                |             |
|------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00002 | RUNNING    | 172.19.0.1:8488 |     1.30667e-06 | 

 95%|█████████▌| 1365/1435 [01:52<00:05, 13.22it/s]
 95%|█████████▌| 1367/1435 [01:52<00:05, 13.24it/s]
 95%|█████████▌| 1369/1435 [01:52<00:04, 13.25it/s]
 96%|█████████▌| 1371/1435 [01:53<00:04, 13.28it/s]
 96%|█████████▌| 1373/1435 [01:53<00:04, 13.30it/s]
 96%|█████████▌| 1375/1435 [01:53<00:04, 13.30it/s]
 96%|█████████▌| 1377/1435 [01:53<00:04, 13.28it/s]
 96%|█████████▌| 1379/1435 [01:53<00:04, 13.24it/s]
 96%|█████████▌| 1381/1435 [01:53<00:04, 13.26it/s]
 96%|█████████▋| 1383/1435 [01:54<00:03, 13.27it/s]
 97%|█████████▋| 1385/1435 [01:54<00:03, 13.29it/s]
 97%|█████████▋| 1387/1435 [01:54<00:03, 13.28it/s]
 97%|█████████▋| 1389/1435 [01:54<00:03, 13.29it/s]
 97%|█████████▋| 1391/1435 [01:54<00:03, 13.23it/s]
 97%|█████████▋| 1393/1435 [01:54<00:03, 13.24it/s]
 97%|█████████▋| 1395/1435 [01:54<00:03, 13.21it/s]
 97%|█████████▋| 1397/1435 [01:55<00:02, 13.24it/s]
 97%|█████████▋| 1399/1435 [01:55<00:02, 13.20it/s]
 98%|█████████▊| 1401/1435 [01:55<00:02, 13.23it/s]
 98%|███████

== Status ==
Current time: 2024-03-07 21:30:19 (running for 00:05:08.36)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (12 PENDING, 1 RUNNING, 2 TERMINATED)
+------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                 |                 |                    |                ch_size |                |             |
|------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00002 | RUNNING    | 172.19.0.1:8488 |     1.30667e-06 | 

100%|█████████▉| 1431/1435 [01:57<00:00, 13.29it/s]
100%|█████████▉| 1433/1435 [01:57<00:00, 13.29it/s]
100%|██████████| 1435/1435 [01:57<00:00, 13.31it/s]
[36m(_objective pid=8488)[0m 
  0%|          | 0/5 [00:00<?, ?it/s][A
[36m(_objective pid=8488)[0m 
 40%|████      | 2/5 [00:00<00:00,  7.25it/s][A
[36m(_objective pid=8488)[0m 
 60%|██████    | 3/5 [00:00<00:00,  5.10it/s][A
[36m(_objective pid=8488)[0m 
 80%|████████  | 4/5 [00:00<00:00,  4.47it/s][A


[36m(_objective pid=8488)[0m {'eval_loss': 0.6818103790283203, 'eval_accuracy': 0.5822784810126582, 'eval_runtime': 1.3609, 'eval_samples_per_second': 58.051, 'eval_steps_per_second': 3.674, 'epoch': 5.0}
[36m(_objective pid=8488)[0m {'train_runtime': 119.3165, 'train_samples_per_second': 12.027, 'train_steps_per_second': 12.027, 'train_loss': 0.6823294716014264, 'epoch': 5.0}


[36m(_objective pid=8488)[0m 
                                                   
100%|██████████| 1435/1435 [01:59<00:00, 13.31it/s]
100%|██████████| 5/5 [00:01<00:00,  4.28it/s][A
100%|██████████| 1435/1435 [01:59<00:00, 12.03it/s]


== Status ==
Current time: 2024-03-07 21:30:24 (running for 00:05:13.42)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (12 PENDING, 3 TERMINATED)
+------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                 |                 |                    |                ch_size |                |             |
|------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00003 | PENDING    |                 |     8.70602e-05 |            

[36m(_objective pid=9019)[0m 2024-03-07 21:30:26.567418: E external/local_xla/xla/stream_executor/cuda/cuda_dnn.cc:9261] Unable to register cuDNN factory: Attempting to register factory for plugin cuDNN when one has already been registered
[36m(_objective pid=9019)[0m 2024-03-07 21:30:26.567473: E external/local_xla/xla/stream_executor/cuda/cuda_fft.cc:607] Unable to register cuFFT factory: Attempting to register factory for plugin cuFFT when one has already been registered
[36m(_objective pid=9019)[0m 2024-03-07 21:30:26.568815: E external/local_xla/xla/stream_executor/cuda/cuda_blas.cc:1515] Unable to register cuBLAS factory: Attempting to register factory for plugin cuBLAS when one has already been registered


== Status ==
Current time: 2024-03-07 21:30:29 (running for 00:05:18.44)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (11 PENDING, 1 RUNNING, 3 TERMINATED)
+------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                 |                 |                    |                ch_size |                |             |
|------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00003 | RUNNING    | 172.19.0.1:9019 |     8.70602e-05 | 

[36m(_objective pid=9019)[0m Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']
[36m(_objective pid=9019)[0m You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.
  0%|          | 0/216 [00:00<?, ?it/s]
  0%|          | 1/216 [00:00<01:28,  2.44it/s]
  1%|          | 2/216 [00:00<00:59,  3.60it/s]
  1%|▏         | 3/216 [00:00<00:51,  4.11it/s]
  2%|▏         | 4/216 [00:01<00:48,  4.40it/s]
  2%|▏         | 5/216 [00:01<00:46,  4.57it/s]
  3%|▎         | 6/216 [00:01<00:45,  4.66it/s]
  3%|▎         | 7/216 [00:01<00:44,  4.74it/s]
  4%|▎         | 8/216 [00:01<00:43,  4.80it/s]
  4%|▍         | 9/216 [00:02<00:42,  4.84it/s]
  5%|▍         | 10/216 [00:02<00:42,  4.86it/s]
  5%|▌         | 11/216 [00:02<00:41,  4.89it/s]
  6%|▌         

== Status ==
Current time: 2024-03-07 21:30:34 (running for 00:05:23.48)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (11 PENDING, 1 RUNNING, 3 TERMINATED)
+------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                 |                 |                    |                ch_size |                |             |
|------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00003 | RUNNING    | 172.19.0.1:9019 |     8.70602e-05 | 

 10%|█         | 22/216 [00:04<00:39,  4.92it/s]
 11%|█         | 23/216 [00:04<00:39,  4.91it/s]
 11%|█         | 24/216 [00:05<00:38,  4.93it/s]
 12%|█▏        | 25/216 [00:05<00:38,  4.92it/s]
 12%|█▏        | 26/216 [00:05<00:38,  4.93it/s]
 12%|█▎        | 27/216 [00:05<00:38,  4.94it/s]
 13%|█▎        | 28/216 [00:05<00:38,  4.93it/s]
 13%|█▎        | 29/216 [00:06<00:38,  4.91it/s]
 14%|█▍        | 30/216 [00:06<00:37,  4.93it/s]
 14%|█▍        | 31/216 [00:06<00:37,  4.93it/s]
 15%|█▍        | 32/216 [00:06<00:37,  4.93it/s]
 15%|█▌        | 33/216 [00:06<00:37,  4.93it/s]
 16%|█▌        | 34/216 [00:07<00:36,  4.93it/s]
 16%|█▌        | 35/216 [00:07<00:36,  4.91it/s]
 17%|█▋        | 36/216 [00:07<00:36,  4.92it/s]
 17%|█▋        | 37/216 [00:07<00:36,  4.92it/s]
 18%|█▊        | 38/216 [00:07<00:36,  4.92it/s]
 18%|█▊        | 39/216 [00:08<00:35,  4.93it/s]
 19%|█▊        | 40/216 [00:08<00:35,  4.93it/s]
 19%|█▉        | 41/216 [00:08<00:35,  4.92it/s]
 19%|█▉        | 42/

== Status ==
Current time: 2024-03-07 21:30:39 (running for 00:05:28.51)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (11 PENDING, 1 RUNNING, 3 TERMINATED)
+------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                 |                 |                    |                ch_size |                |             |
|------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00003 | RUNNING    | 172.19.0.1:9019 |     8.70602e-05 | 

 22%|██▏       | 47/216 [00:09<00:34,  4.91it/s]
 22%|██▏       | 48/216 [00:09<00:34,  4.90it/s]
 23%|██▎       | 49/216 [00:10<00:33,  4.92it/s]
 23%|██▎       | 50/216 [00:10<00:33,  4.92it/s]
 24%|██▎       | 51/216 [00:10<00:33,  4.90it/s]
 24%|██▍       | 52/216 [00:10<00:33,  4.91it/s]
 25%|██▍       | 53/216 [00:10<00:33,  4.91it/s]
 25%|██▌       | 54/216 [00:11<00:32,  4.91it/s]
 25%|██▌       | 55/216 [00:11<00:32,  4.93it/s]
 26%|██▌       | 56/216 [00:11<00:32,  4.90it/s]
 26%|██▋       | 57/216 [00:11<00:32,  4.90it/s]
 27%|██▋       | 58/216 [00:11<00:32,  4.92it/s]
 27%|██▋       | 59/216 [00:12<00:31,  4.92it/s]
 28%|██▊       | 60/216 [00:12<00:31,  4.93it/s]
 28%|██▊       | 61/216 [00:12<00:31,  4.94it/s]
 29%|██▊       | 62/216 [00:12<00:31,  4.93it/s]
 29%|██▉       | 63/216 [00:12<00:31,  4.92it/s]
 30%|██▉       | 64/216 [00:13<00:30,  4.93it/s]
 30%|███       | 65/216 [00:13<00:30,  4.94it/s]
 31%|███       | 66/216 [00:13<00:30,  4.92it/s]
 31%|███       | 67/

== Status ==
Current time: 2024-03-07 21:30:44 (running for 00:05:33.55)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (11 PENDING, 1 RUNNING, 3 TERMINATED)
+------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                 |                 |                    |                ch_size |                |             |
|------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00003 | RUNNING    | 172.19.0.1:9019 |     8.70602e-05 | 

 33%|███▎      | 71/216 [00:14<00:29,  4.94it/s]
 33%|███▎      | 72/216 [00:14<00:27,  5.25it/s]
[36m(_objective pid=9019)[0m 
  0%|          | 0/5 [00:00<?, ?it/s][A
[36m(_objective pid=9019)[0m 
 40%|████      | 2/5 [00:00<00:00,  7.25it/s][A
[36m(_objective pid=9019)[0m 
 60%|██████    | 3/5 [00:00<00:00,  5.14it/s][A
[36m(_objective pid=9019)[0m 
 80%|████████  | 4/5 [00:00<00:00,  4.47it/s][A
[36m(_objective pid=9019)[0m 
                                                
 33%|███▎      | 72/216 [00:16<00:27,  5.25it/s]
100%|██████████| 5/5 [00:01<00:00,  4.28it/s][A
                                             [A


[36m(_objective pid=9019)[0m {'eval_loss': 0.6790513396263123, 'eval_accuracy': 0.5822784810126582, 'eval_runtime': 1.3601, 'eval_samples_per_second': 58.086, 'eval_steps_per_second': 3.676, 'epoch': 1.0}


 34%|███▍      | 73/216 [00:16<01:26,  1.65it/s]
 34%|███▍      | 74/216 [00:16<01:08,  2.06it/s]
 35%|███▍      | 75/216 [00:16<00:56,  2.50it/s]
 35%|███▌      | 76/216 [00:16<00:47,  2.93it/s]
 36%|███▌      | 77/216 [00:17<00:41,  3.34it/s]
 36%|███▌      | 78/216 [00:17<00:37,  3.67it/s]
 37%|███▋      | 79/216 [00:17<00:34,  3.91it/s]
 37%|███▋      | 80/216 [00:17<00:32,  4.15it/s]
 38%|███▊      | 81/216 [00:18<00:30,  4.36it/s]
 38%|███▊      | 82/216 [00:18<00:29,  4.52it/s]
 38%|███▊      | 83/216 [00:18<00:28,  4.64it/s]
 39%|███▉      | 84/216 [00:18<00:27,  4.73it/s]
 39%|███▉      | 85/216 [00:18<00:27,  4.78it/s]
 40%|███▉      | 86/216 [00:19<00:26,  4.82it/s]
 40%|████      | 87/216 [00:19<00:26,  4.86it/s]
 41%|████      | 88/216 [00:19<00:26,  4.88it/s]
 41%|████      | 89/216 [00:19<00:25,  4.89it/s]


== Status ==
Current time: 2024-03-07 21:30:49 (running for 00:05:38.61)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (11 PENDING, 1 RUNNING, 3 TERMINATED)
+------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                 |                 |                    |                ch_size |                |             |
|------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00003 | RUNNING    | 172.19.0.1:9019 |     8.70602e-05 | 

 42%|████▏     | 90/216 [00:19<00:25,  4.92it/s]
 42%|████▏     | 91/216 [00:20<00:25,  4.91it/s]
 43%|████▎     | 92/216 [00:20<00:25,  4.91it/s]
 43%|████▎     | 93/216 [00:20<00:24,  4.93it/s]
 44%|████▎     | 94/216 [00:20<00:24,  4.93it/s]
 44%|████▍     | 95/216 [00:20<00:24,  4.94it/s]
 44%|████▍     | 96/216 [00:21<00:24,  4.95it/s]
 45%|████▍     | 97/216 [00:21<00:24,  4.92it/s]
 45%|████▌     | 98/216 [00:21<00:23,  4.92it/s]
 46%|████▌     | 99/216 [00:21<00:23,  4.93it/s]
 46%|████▋     | 100/216 [00:21<00:23,  4.92it/s]
 47%|████▋     | 101/216 [00:22<00:23,  4.90it/s]
 47%|████▋     | 102/216 [00:22<00:23,  4.90it/s]
 48%|████▊     | 103/216 [00:22<00:22,  4.91it/s]
 48%|████▊     | 104/216 [00:22<00:22,  4.92it/s]
 49%|████▊     | 105/216 [00:22<00:22,  4.93it/s]
 49%|████▉     | 106/216 [00:23<00:22,  4.92it/s]
 50%|████▉     | 107/216 [00:23<00:22,  4.92it/s]
 50%|█████     | 108/216 [00:23<00:21,  4.93it/s]
 50%|█████     | 109/216 [00:23<00:21,  4.93it/s]
 51%|█████

== Status ==
Current time: 2024-03-07 21:30:54 (running for 00:05:43.64)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (11 PENDING, 1 RUNNING, 3 TERMINATED)
+------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                 |                 |                    |                ch_size |                |             |
|------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00003 | RUNNING    | 172.19.0.1:9019 |     8.70602e-05 | 

 53%|█████▎    | 114/216 [00:24<00:20,  4.88it/s]
 53%|█████▎    | 115/216 [00:24<00:20,  4.91it/s]
 54%|█████▎    | 116/216 [00:25<00:20,  4.91it/s]
 54%|█████▍    | 117/216 [00:25<00:20,  4.91it/s]
 55%|█████▍    | 118/216 [00:25<00:19,  4.92it/s]
 55%|█████▌    | 119/216 [00:25<00:19,  4.91it/s]
 56%|█████▌    | 120/216 [00:25<00:19,  4.91it/s]
 56%|█████▌    | 121/216 [00:26<00:19,  4.92it/s]
 56%|█████▋    | 122/216 [00:26<00:19,  4.92it/s]
 57%|█████▋    | 123/216 [00:26<00:18,  4.92it/s]
 57%|█████▋    | 124/216 [00:26<00:18,  4.94it/s]
 58%|█████▊    | 125/216 [00:26<00:18,  4.93it/s]
 58%|█████▊    | 126/216 [00:27<00:18,  4.92it/s]
 59%|█████▉    | 127/216 [00:27<00:18,  4.94it/s]
 59%|█████▉    | 128/216 [00:27<00:17,  4.94it/s]
 60%|█████▉    | 129/216 [00:27<00:17,  4.93it/s]
 60%|██████    | 130/216 [00:27<00:17,  4.94it/s]
 61%|██████    | 131/216 [00:28<00:17,  4.92it/s]
 61%|██████    | 132/216 [00:28<00:17,  4.92it/s]
 62%|██████▏   | 133/216 [00:28<00:16,  4.92it/s]


== Status ==
Current time: 2024-03-07 21:30:59 (running for 00:05:48.68)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (11 PENDING, 1 RUNNING, 3 TERMINATED)
+------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                 |                 |                    |                ch_size |                |             |
|------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00003 | RUNNING    | 172.19.0.1:9019 |     8.70602e-05 | 

 64%|██████▍   | 139/216 [00:29<00:15,  4.91it/s]
 65%|██████▍   | 140/216 [00:29<00:15,  4.92it/s]
 65%|██████▌   | 141/216 [00:30<00:15,  4.90it/s]
 66%|██████▌   | 142/216 [00:30<00:15,  4.91it/s]
 66%|██████▌   | 143/216 [00:30<00:14,  4.92it/s]
 67%|██████▋   | 144/216 [00:30<00:13,  5.21it/s]
[36m(_objective pid=9019)[0m 
  0%|          | 0/5 [00:00<?, ?it/s][A
[36m(_objective pid=9019)[0m 
 40%|████      | 2/5 [00:00<00:00,  7.21it/s][A
[36m(_objective pid=9019)[0m 
 60%|██████    | 3/5 [00:00<00:00,  5.12it/s][A
[36m(_objective pid=9019)[0m 
 80%|████████  | 4/5 [00:00<00:00,  4.45it/s][A
[36m(_objective pid=9019)[0m 
                                                 
 67%|██████▋   | 144/216 [00:32<00:13,  5.21it/s]
100%|██████████| 5/5 [00:01<00:00,  4.29it/s][A
                                             [A


[36m(_objective pid=9019)[0m {'eval_loss': 0.6784381866455078, 'eval_accuracy': 0.5822784810126582, 'eval_runtime': 1.3576, 'eval_samples_per_second': 58.191, 'eval_steps_per_second': 3.683, 'epoch': 2.0}


 67%|██████▋   | 145/216 [00:32<00:43,  1.65it/s]
 68%|██████▊   | 146/216 [00:32<00:33,  2.06it/s]
 68%|██████▊   | 147/216 [00:32<00:27,  2.49it/s]
 69%|██████▊   | 148/216 [00:32<00:23,  2.93it/s]
 69%|██████▉   | 149/216 [00:33<00:20,  3.33it/s]
 69%|██████▉   | 150/216 [00:33<00:17,  3.69it/s]
 70%|██████▉   | 151/216 [00:33<00:16,  3.99it/s]
 70%|███████   | 152/216 [00:33<00:15,  4.23it/s]
 71%|███████   | 153/216 [00:33<00:14,  4.42it/s]
 71%|███████▏  | 154/216 [00:34<00:13,  4.56it/s]
 72%|███████▏  | 155/216 [00:34<00:13,  4.66it/s]
 72%|███████▏  | 156/216 [00:34<00:12,  4.75it/s]


== Status ==
Current time: 2024-03-07 21:31:04 (running for 00:05:53.68)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (11 PENDING, 1 RUNNING, 3 TERMINATED)
+------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                 |                 |                    |                ch_size |                |             |
|------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00003 | RUNNING    | 172.19.0.1:9019 |     8.70602e-05 | 

 73%|███████▎  | 157/216 [00:34<00:12,  4.78it/s]
 73%|███████▎  | 158/216 [00:34<00:12,  4.82it/s]
 74%|███████▎  | 159/216 [00:35<00:11,  4.85it/s]
 74%|███████▍  | 160/216 [00:35<00:11,  4.87it/s]
 75%|███████▍  | 161/216 [00:35<00:11,  4.89it/s]
 75%|███████▌  | 162/216 [00:35<00:11,  4.91it/s]
 75%|███████▌  | 163/216 [00:35<00:10,  4.91it/s]
 76%|███████▌  | 164/216 [00:36<00:10,  4.90it/s]
 76%|███████▋  | 165/216 [00:36<00:10,  4.91it/s]
 77%|███████▋  | 166/216 [00:36<00:10,  4.91it/s]
 77%|███████▋  | 167/216 [00:36<00:09,  4.90it/s]
 78%|███████▊  | 168/216 [00:37<00:09,  4.93it/s]
 78%|███████▊  | 169/216 [00:37<00:09,  4.91it/s]
 79%|███████▊  | 170/216 [00:37<00:09,  4.91it/s]
 79%|███████▉  | 171/216 [00:37<00:09,  4.92it/s]
 80%|███████▉  | 172/216 [00:37<00:08,  4.93it/s]
 80%|████████  | 173/216 [00:38<00:08,  4.94it/s]
 81%|████████  | 174/216 [00:38<00:08,  4.92it/s]
 81%|████████  | 175/216 [00:38<00:08,  4.92it/s]
 81%|████████▏ | 176/216 [00:38<00:08,  4.92it/s]


== Status ==
Current time: 2024-03-07 21:31:09 (running for 00:05:58.72)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (11 PENDING, 1 RUNNING, 3 TERMINATED)
+------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                 |                 |                    |                ch_size |                |             |
|------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00003 | RUNNING    | 172.19.0.1:9019 |     8.70602e-05 | 

 84%|████████▍ | 182/216 [00:39<00:06,  4.89it/s]
 85%|████████▍ | 183/216 [00:40<00:06,  4.91it/s]
 85%|████████▌ | 184/216 [00:40<00:06,  4.91it/s]
 86%|████████▌ | 185/216 [00:40<00:06,  4.92it/s]
 86%|████████▌ | 186/216 [00:40<00:06,  4.92it/s]
 87%|████████▋ | 187/216 [00:40<00:05,  4.93it/s]
 87%|████████▋ | 188/216 [00:41<00:05,  4.93it/s]
 88%|████████▊ | 189/216 [00:41<00:05,  4.92it/s]
 88%|████████▊ | 190/216 [00:41<00:05,  4.93it/s]
 88%|████████▊ | 191/216 [00:41<00:05,  4.93it/s]
 89%|████████▉ | 192/216 [00:41<00:04,  4.92it/s]
 89%|████████▉ | 193/216 [00:42<00:04,  4.94it/s]
 90%|████████▉ | 194/216 [00:42<00:04,  4.94it/s]
 90%|█████████ | 195/216 [00:42<00:04,  4.94it/s]
 91%|█████████ | 196/216 [00:42<00:04,  4.95it/s]
 91%|█████████ | 197/216 [00:42<00:03,  4.94it/s]
 92%|█████████▏| 198/216 [00:43<00:03,  4.92it/s]
 92%|█████████▏| 199/216 [00:43<00:03,  4.93it/s]
 93%|█████████▎| 200/216 [00:43<00:03,  4.92it/s]
 93%|█████████▎| 201/216 [00:43<00:03,  4.93it/s]


== Status ==
Current time: 2024-03-07 21:31:14 (running for 00:06:03.77)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (11 PENDING, 1 RUNNING, 3 TERMINATED)
+------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                 |                 |                    |                ch_size |                |             |
|------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00003 | RUNNING    | 172.19.0.1:9019 |     8.70602e-05 | 

 96%|█████████▌| 207/216 [00:44<00:01,  4.92it/s]
 96%|█████████▋| 208/216 [00:45<00:01,  4.93it/s]
 97%|█████████▋| 209/216 [00:45<00:01,  4.92it/s]
 97%|█████████▋| 210/216 [00:45<00:01,  4.93it/s]
 98%|█████████▊| 211/216 [00:45<00:01,  4.92it/s]
 98%|█████████▊| 212/216 [00:45<00:00,  4.94it/s]
 99%|█████████▊| 213/216 [00:46<00:00,  4.93it/s]
 99%|█████████▉| 214/216 [00:46<00:00,  4.91it/s]
100%|█████████▉| 215/216 [00:46<00:00,  4.91it/s]
100%|██████████| 216/216 [00:46<00:00,  5.21it/s]
[36m(_objective pid=9019)[0m 
  0%|          | 0/5 [00:00<?, ?it/s][A
[36m(_objective pid=9019)[0m 
 40%|████      | 2/5 [00:00<00:00,  7.27it/s][A
[36m(_objective pid=9019)[0m 
 60%|██████    | 3/5 [00:00<00:00,  5.12it/s][A
[36m(_objective pid=9019)[0m 
 80%|████████  | 4/5 [00:00<00:00,  4.47it/s][A
[36m(_objective pid=9019)[0m 
                                                 
100%|██████████| 216/216 [00:48<00:00,  5.21it/s]
100%|██████████| 5/5 [00:01<00:00,  4.30it/s][A
100

[36m(_objective pid=9019)[0m {'eval_loss': 0.6656137108802795, 'eval_accuracy': 0.6582278481012658, 'eval_runtime': 1.3564, 'eval_samples_per_second': 58.241, 'eval_steps_per_second': 3.686, 'epoch': 3.0}
[36m(_objective pid=9019)[0m {'train_runtime': 48.0977, 'train_samples_per_second': 17.901, 'train_steps_per_second': 4.491, 'train_loss': 0.6878061647768374, 'epoch': 3.0}
== Status ==
Current time: 2024-03-07 21:31:19 (running for 00:06:08.85)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (11 PENDING, 4 TERMINATED)
+------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|          

[36m(_objective pid=9203)[0m 2024-03-07 21:31:23.726897: E external/local_xla/xla/stream_executor/cuda/cuda_dnn.cc:9261] Unable to register cuDNN factory: Attempting to register factory for plugin cuDNN when one has already been registered
[36m(_objective pid=9203)[0m 2024-03-07 21:31:23.726955: E external/local_xla/xla/stream_executor/cuda/cuda_fft.cc:607] Unable to register cuFFT factory: Attempting to register factory for plugin cuFFT when one has already been registered
[36m(_objective pid=9203)[0m 2024-03-07 21:31:23.728359: E external/local_xla/xla/stream_executor/cuda/cuda_blas.cc:1515] Unable to register cuBLAS factory: Attempting to register factory for plugin cuBLAS when one has already been registered


== Status ==
Current time: 2024-03-07 21:31:24 (running for 00:06:13.88)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (10 PENDING, 1 RUNNING, 4 TERMINATED)
+------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                 |                 |                    |                ch_size |                |             |
|------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00004 | RUNNING    | 172.19.0.1:9203 |     9.64769e-05 | 

[36m(_objective pid=9203)[0m Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']
[36m(_objective pid=9203)[0m You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.
  0%|          | 0/861 [00:00<?, ?it/s]
  0%|          | 1/861 [00:00<04:13,  3.40it/s]
  0%|          | 3/861 [00:00<01:52,  7.61it/s]
  1%|          | 5/861 [00:00<01:28,  9.69it/s]
  1%|          | 7/861 [00:00<01:17, 10.95it/s]
  1%|          | 9/861 [00:00<01:12, 11.72it/s]
  1%|▏         | 11/861 [00:01<01:09, 12.15it/s]
  2%|▏         | 13/861 [00:01<01:07, 12.52it/s]
  2%|▏         | 15/861 [00:01<01:06, 12.71it/s]
  2%|▏         | 17/861 [00:01<01:05, 12.85it/s]
  2%|▏         | 19/861 [00:01<01:04, 12.98it/s]
  2%|▏         | 21/861 [00:01<01:04, 13.11it/s]
  3%|▎     

== Status ==
Current time: 2024-03-07 21:31:29 (running for 00:06:18.93)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (10 PENDING, 1 RUNNING, 4 TERMINATED)
+------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                 |                 |                    |                ch_size |                |             |
|------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00004 | RUNNING    | 172.19.0.1:9203 |     9.64769e-05 | 

  4%|▍         | 35/861 [00:02<01:03, 13.00it/s]
  4%|▍         | 37/861 [00:03<01:03, 12.97it/s]
  5%|▍         | 39/861 [00:03<01:03, 13.04it/s]
  5%|▍         | 41/861 [00:03<01:02, 13.05it/s]
  5%|▍         | 43/861 [00:03<01:02, 13.05it/s]
  5%|▌         | 45/861 [00:03<01:02, 13.07it/s]
  5%|▌         | 47/861 [00:03<01:02, 13.05it/s]
  6%|▌         | 49/861 [00:03<01:02, 13.08it/s]
  6%|▌         | 51/861 [00:04<01:01, 13.08it/s]
  6%|▌         | 53/861 [00:04<01:01, 13.11it/s]
  6%|▋         | 55/861 [00:04<01:01, 13.07it/s]
  7%|▋         | 57/861 [00:04<01:01, 13.05it/s]
  7%|▋         | 59/861 [00:04<01:01, 13.02it/s]
  7%|▋         | 61/861 [00:04<01:01, 13.06it/s]
  7%|▋         | 63/861 [00:05<01:01, 13.03it/s]
  8%|▊         | 65/861 [00:05<01:00, 13.12it/s]
  8%|▊         | 67/861 [00:05<01:00, 13.11it/s]
  8%|▊         | 69/861 [00:05<01:00, 13.16it/s]
  8%|▊         | 71/861 [00:05<01:00, 13.10it/s]
  8%|▊         | 73/861 [00:05<00:59, 13.16it/s]
  9%|▊         | 75/

== Status ==
Current time: 2024-03-07 21:31:34 (running for 00:06:23.97)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (10 PENDING, 1 RUNNING, 4 TERMINATED)
+------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                 |                 |                    |                ch_size |                |             |
|------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00004 | RUNNING    | 172.19.0.1:9203 |     9.64769e-05 | 

 12%|█▏        | 101/861 [00:07<00:57, 13.14it/s]
 12%|█▏        | 103/861 [00:08<00:57, 13.16it/s]
 12%|█▏        | 105/861 [00:08<00:57, 13.21it/s]
 12%|█▏        | 107/861 [00:08<00:57, 13.20it/s]
 13%|█▎        | 109/861 [00:08<00:57, 13.19it/s]
 13%|█▎        | 111/861 [00:08<00:56, 13.20it/s]
 13%|█▎        | 113/861 [00:08<00:56, 13.24it/s]
 13%|█▎        | 115/861 [00:08<00:56, 13.20it/s]
 14%|█▎        | 117/861 [00:09<00:56, 13.23it/s]
 14%|█▍        | 119/861 [00:09<00:56, 13.22it/s]
 14%|█▍        | 121/861 [00:09<00:55, 13.23it/s]
 14%|█▍        | 123/861 [00:09<00:55, 13.22it/s]
 15%|█▍        | 125/861 [00:09<00:55, 13.24it/s]
 15%|█▍        | 127/861 [00:09<00:55, 13.21it/s]
 15%|█▍        | 129/861 [00:10<00:55, 13.26it/s]
 15%|█▌        | 131/861 [00:10<00:55, 13.17it/s]
 15%|█▌        | 133/861 [00:10<00:55, 13.19it/s]
 16%|█▌        | 135/861 [00:10<00:55, 13.19it/s]
 16%|█▌        | 137/861 [00:10<00:54, 13.23it/s]
 16%|█▌        | 139/861 [00:10<00:54, 13.19it/s]


== Status ==
Current time: 2024-03-07 21:31:39 (running for 00:06:29.01)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (10 PENDING, 1 RUNNING, 4 TERMINATED)
+------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                 |                 |                    |                ch_size |                |             |
|------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00004 | RUNNING    | 172.19.0.1:9203 |     9.64769e-05 | 

 20%|█▉        | 171/861 [00:13<00:50, 13.64it/s]
 20%|██        | 173/861 [00:13<00:50, 13.74it/s]
 20%|██        | 175/861 [00:13<00:49, 13.79it/s]
 21%|██        | 177/861 [00:13<00:49, 13.82it/s]
 21%|██        | 179/861 [00:13<00:49, 13.87it/s]
 21%|██        | 181/861 [00:13<00:48, 13.91it/s]
 21%|██▏       | 183/861 [00:14<00:48, 13.93it/s]
 21%|██▏       | 185/861 [00:14<00:48, 13.96it/s]
 22%|██▏       | 187/861 [00:14<00:48, 13.99it/s]
 22%|██▏       | 189/861 [00:14<00:48, 13.99it/s]
 22%|██▏       | 191/861 [00:14<00:47, 14.01it/s]
 22%|██▏       | 193/861 [00:14<00:48, 13.87it/s]
 23%|██▎       | 195/861 [00:14<00:47, 13.91it/s]
 23%|██▎       | 197/861 [00:15<00:47, 13.95it/s]
 23%|██▎       | 199/861 [00:15<00:47, 13.97it/s]
 23%|██▎       | 201/861 [00:15<00:47, 13.99it/s]
 24%|██▎       | 203/861 [00:15<00:47, 13.98it/s]
 24%|██▍       | 205/861 [00:15<00:46, 13.99it/s]
 24%|██▍       | 207/861 [00:15<00:46, 13.98it/s]
 24%|██▍       | 209/861 [00:15<00:46, 13.94it/s]


== Status ==
Current time: 2024-03-07 21:31:44 (running for 00:06:34.05)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (10 PENDING, 1 RUNNING, 4 TERMINATED)
+------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                 |                 |                    |                ch_size |                |             |
|------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00004 | RUNNING    | 172.19.0.1:9203 |     9.64769e-05 | 

 28%|██▊       | 241/861 [00:18<00:44, 13.94it/s]
 28%|██▊       | 243/861 [00:18<00:44, 13.90it/s]
 28%|██▊       | 245/861 [00:18<00:44, 13.92it/s]
 29%|██▊       | 247/861 [00:18<00:43, 13.96it/s]
 29%|██▉       | 249/861 [00:18<00:44, 13.84it/s]
 29%|██▉       | 251/861 [00:18<00:43, 13.91it/s]
 29%|██▉       | 253/861 [00:19<00:43, 13.96it/s]
 30%|██▉       | 255/861 [00:19<00:43, 13.97it/s]
 30%|██▉       | 257/861 [00:19<00:43, 13.94it/s]
 30%|███       | 259/861 [00:19<00:43, 13.96it/s]
 30%|███       | 261/861 [00:19<00:42, 13.97it/s]
 31%|███       | 263/861 [00:19<00:42, 13.98it/s]
 31%|███       | 265/861 [00:19<00:42, 14.01it/s]
 31%|███       | 267/861 [00:20<00:42, 14.03it/s]
 31%|███       | 269/861 [00:20<00:42, 14.01it/s]
 31%|███▏      | 271/861 [00:20<00:42, 14.01it/s]
 32%|███▏      | 273/861 [00:20<00:42, 13.96it/s]
 32%|███▏      | 275/861 [00:20<00:41, 13.99it/s]
 32%|███▏      | 277/861 [00:20<00:42, 13.89it/s]
 32%|███▏      | 279/861 [00:20<00:41, 13.94it/s]


[36m(_objective pid=9203)[0m {'eval_loss': 0.6846276521682739, 'eval_accuracy': 0.5822784810126582, 'eval_runtime': 1.3097, 'eval_samples_per_second': 60.32, 'eval_steps_per_second': 3.818, 'epoch': 1.0}


 34%|███▍      | 291/861 [00:23<01:59,  4.78it/s]


== Status ==
Current time: 2024-03-07 21:31:50 (running for 00:06:39.11)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (10 PENDING, 1 RUNNING, 4 TERMINATED)
+------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                 |                 |                    |                ch_size |                |             |
|------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00004 | RUNNING    | 172.19.0.1:9203 |     9.64769e-05 | 

 34%|███▍      | 293/861 [00:23<01:35,  5.96it/s]
 34%|███▍      | 295/861 [00:23<01:18,  7.20it/s]
 34%|███▍      | 297/861 [00:23<01:06,  8.43it/s]
 35%|███▍      | 299/861 [00:23<00:58,  9.57it/s]
 35%|███▍      | 301/861 [00:23<00:53, 10.55it/s]
 35%|███▌      | 303/861 [00:23<00:49, 11.31it/s]
 35%|███▌      | 305/861 [00:24<00:46, 11.92it/s]
 36%|███▌      | 307/861 [00:24<00:44, 12.39it/s]
 36%|███▌      | 309/861 [00:24<00:42, 12.84it/s]
 36%|███▌      | 311/861 [00:24<00:41, 13.13it/s]
 36%|███▋      | 313/861 [00:24<00:40, 13.38it/s]
 37%|███▋      | 315/861 [00:24<00:40, 13.47it/s]
 37%|███▋      | 317/861 [00:24<00:39, 13.62it/s]
 37%|███▋      | 319/861 [00:25<00:39, 13.71it/s]
 37%|███▋      | 321/861 [00:25<00:39, 13.80it/s]
 38%|███▊      | 323/861 [00:25<00:38, 13.85it/s]
 38%|███▊      | 325/861 [00:25<00:38, 13.88it/s]
 38%|███▊      | 327/861 [00:25<00:38, 13.91it/s]
 38%|███▊      | 329/861 [00:25<00:38, 13.96it/s]
 38%|███▊      | 331/861 [00:25<00:37, 13.99it/s]


== Status ==
Current time: 2024-03-07 21:31:55 (running for 00:06:44.15)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (10 PENDING, 1 RUNNING, 4 TERMINATED)
+------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                 |                 |                    |                ch_size |                |             |
|------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00004 | RUNNING    | 172.19.0.1:9203 |     9.64769e-05 | 

 42%|████▏     | 363/861 [00:28<00:35, 13.93it/s]
 42%|████▏     | 365/861 [00:28<00:35, 13.96it/s]
 43%|████▎     | 367/861 [00:28<00:35, 13.93it/s]
 43%|████▎     | 369/861 [00:28<00:35, 13.87it/s]
 43%|████▎     | 371/861 [00:28<00:35, 13.92it/s]
 43%|████▎     | 373/861 [00:28<00:34, 13.97it/s]
 44%|████▎     | 375/861 [00:29<00:34, 13.89it/s]
 44%|████▍     | 377/861 [00:29<00:35, 13.76it/s]
 44%|████▍     | 379/861 [00:29<00:34, 13.84it/s]
 44%|████▍     | 381/861 [00:29<00:34, 13.89it/s]
 44%|████▍     | 383/861 [00:29<00:34, 13.86it/s]
 45%|████▍     | 385/861 [00:29<00:34, 13.92it/s]
 45%|████▍     | 387/861 [00:29<00:33, 13.95it/s]
 45%|████▌     | 389/861 [00:30<00:33, 13.97it/s]
 45%|████▌     | 391/861 [00:30<00:33, 13.99it/s]
 46%|████▌     | 393/861 [00:30<00:33, 14.00it/s]
 46%|████▌     | 395/861 [00:30<00:33, 14.00it/s]
 46%|████▌     | 397/861 [00:30<00:33, 13.88it/s]
 46%|████▋     | 399/861 [00:30<00:33, 13.87it/s]
 47%|████▋     | 401/861 [00:30<00:33, 13.94it/s]


== Status ==
Current time: 2024-03-07 21:32:00 (running for 00:06:49.20)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (10 PENDING, 1 RUNNING, 4 TERMINATED)
+------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                 |                 |                    |                ch_size |                |             |
|------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00004 | RUNNING    | 172.19.0.1:9203 |     9.64769e-05 | 

 50%|█████     | 431/861 [00:33<00:30, 13.93it/s]
 50%|█████     | 433/861 [00:33<00:30, 13.95it/s]
 51%|█████     | 435/861 [00:33<00:30, 13.97it/s]
 51%|█████     | 437/861 [00:33<00:30, 13.97it/s]
 51%|█████     | 439/861 [00:33<00:30, 13.95it/s]
 51%|█████     | 441/861 [00:33<00:30, 13.98it/s]
 51%|█████▏    | 443/861 [00:33<00:29, 14.02it/s]
 52%|█████▏    | 445/861 [00:34<00:29, 14.01it/s]
 52%|█████▏    | 447/861 [00:34<00:29, 14.00it/s]
 52%|█████▏    | 449/861 [00:34<00:29, 14.01it/s]
 52%|█████▏    | 451/861 [00:34<00:29, 14.02it/s]
 53%|█████▎    | 453/861 [00:34<00:29, 13.89it/s]
 53%|█████▎    | 455/861 [00:34<00:29, 13.91it/s]
 53%|█████▎    | 457/861 [00:34<00:28, 13.96it/s]
 53%|█████▎    | 459/861 [00:35<00:28, 13.99it/s]
 54%|█████▎    | 461/861 [00:35<00:28, 14.01it/s]
 54%|█████▍    | 463/861 [00:35<00:28, 13.98it/s]
 54%|█████▍    | 465/861 [00:35<00:28, 13.99it/s]
 54%|█████▍    | 467/861 [00:35<00:28, 13.95it/s]
 54%|█████▍    | 469/861 [00:35<00:28, 13.97it/s]


[36m(_objective pid=9203)[0m {'loss': 0.7706, 'grad_norm': 7.573786735534668, 'learning_rate': 4.045080502131198e-05, 'epoch': 1.74}
== Status ==
Current time: 2024-03-07 21:32:05 (running for 00:06:54.24)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (10 PENDING, 1 RUNNING, 4 TERMINATED)
+------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                 |                 |                    |                ch_size |                |             |
|------------------------+------------+-----------------+-----------------+-------------------

 58%|█████▊    | 501/861 [00:39<01:52,  3.21it/s]
 58%|█████▊    | 503/861 [00:39<01:25,  4.18it/s]
 59%|█████▊    | 505/861 [00:40<01:07,  5.29it/s]
 59%|█████▉    | 507/861 [00:40<00:54,  6.50it/s]
 59%|█████▉    | 509/861 [00:40<00:45,  7.75it/s]
 59%|█████▉    | 511/861 [00:40<00:39,  8.95it/s]
 60%|█████▉    | 513/861 [00:40<00:34, 10.04it/s]
 60%|█████▉    | 515/861 [00:40<00:31, 10.90it/s]
 60%|██████    | 517/861 [00:40<00:29, 11.69it/s]
 60%|██████    | 519/861 [00:41<00:27, 12.31it/s]
 61%|██████    | 521/861 [00:41<00:26, 12.75it/s]
 61%|██████    | 523/861 [00:41<00:25, 13.09it/s]
 61%|██████    | 525/861 [00:41<00:25, 13.38it/s]
 61%|██████    | 527/861 [00:41<00:24, 13.56it/s]
 61%|██████▏   | 529/861 [00:41<00:24, 13.66it/s]
 62%|██████▏   | 531/861 [00:41<00:23, 13.78it/s]
 62%|██████▏   | 533/861 [00:42<00:23, 13.86it/s]
 62%|██████▏   | 535/861 [00:42<00:23, 13.92it/s]
 62%|██████▏   | 537/861 [00:42<00:23, 13.92it/s]
 63%|██████▎   | 539/861 [00:42<00:23, 13.97it/s]


== Status ==
Current time: 2024-03-07 21:32:10 (running for 00:06:59.28)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (10 PENDING, 1 RUNNING, 4 TERMINATED)
+------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                 |                 |                    |                ch_size |                |             |
|------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00004 | RUNNING    | 172.19.0.1:9203 |     9.64769e-05 | 

 64%|██████▍   | 553/861 [00:43<00:22, 13.97it/s]
 64%|██████▍   | 555/861 [00:43<00:21, 13.98it/s]
 65%|██████▍   | 557/861 [00:43<00:21, 13.98it/s]
 65%|██████▍   | 559/861 [00:43<00:21, 13.99it/s]
 65%|██████▌   | 561/861 [00:44<00:21, 14.03it/s]
 65%|██████▌   | 563/861 [00:44<00:21, 14.03it/s]
 66%|██████▌   | 565/861 [00:44<00:21, 14.02it/s]
 66%|██████▌   | 567/861 [00:44<00:20, 14.05it/s]
 66%|██████▌   | 569/861 [00:44<00:20, 14.00it/s]
 66%|██████▋   | 571/861 [00:44<00:20, 13.88it/s]
 67%|██████▋   | 573/861 [00:44<00:20, 13.93it/s]
[36m(_objective pid=9203)[0m 
  0%|          | 0/5 [00:00<?, ?it/s][A
[36m(_objective pid=9203)[0m 
 40%|████      | 2/5 [00:00<00:00,  7.58it/s][A
[36m(_objective pid=9203)[0m 
 60%|██████    | 3/5 [00:00<00:00,  5.33it/s][A
[36m(_objective pid=9203)[0m 
 80%|████████  | 4/5 [00:00<00:00,  4.66it/s][A
[36m(_objective pid=9203)[0m 
                                                 
 67%|██████▋   | 574/861 [00:46<00:20, 13.93it/s]
10

[36m(_objective pid=9203)[0m {'eval_loss': 0.7184261083602905, 'eval_accuracy': 0.4177215189873418, 'eval_runtime': 1.2989, 'eval_samples_per_second': 60.819, 'eval_steps_per_second': 3.849, 'epoch': 2.0}


 67%|██████▋   | 577/861 [00:46<00:59,  4.79it/s]
 67%|██████▋   | 579/861 [00:46<00:47,  5.97it/s]
 67%|██████▋   | 581/861 [00:46<00:39,  7.17it/s]
 68%|██████▊   | 583/861 [00:46<00:33,  8.41it/s]
 68%|██████▊   | 585/861 [00:47<00:28,  9.57it/s]
 68%|██████▊   | 587/861 [00:47<00:25, 10.57it/s]
 68%|██████▊   | 589/861 [00:47<00:23, 11.42it/s]
 69%|██████▊   | 591/861 [00:47<00:22, 12.09it/s]
 69%|██████▉   | 593/861 [00:47<00:21, 12.62it/s]
 69%|██████▉   | 595/861 [00:47<00:20, 13.00it/s]
 69%|██████▉   | 597/861 [00:47<00:19, 13.27it/s]
 70%|██████▉   | 599/861 [00:48<00:19, 13.49it/s]
 70%|██████▉   | 601/861 [00:48<00:19, 13.63it/s]


== Status ==
Current time: 2024-03-07 21:32:15 (running for 00:07:04.29)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (10 PENDING, 1 RUNNING, 4 TERMINATED)
+------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                 |                 |                    |                ch_size |                |             |
|------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00004 | RUNNING    | 172.19.0.1:9203 |     9.64769e-05 | 

 70%|███████   | 603/861 [00:48<00:18, 13.75it/s]
 70%|███████   | 605/861 [00:48<00:18, 13.83it/s]
 70%|███████   | 607/861 [00:48<00:18, 13.87it/s]
 71%|███████   | 609/861 [00:48<00:18, 13.80it/s]
 71%|███████   | 611/861 [00:48<00:18, 13.88it/s]
 71%|███████   | 613/861 [00:49<00:17, 13.90it/s]
 71%|███████▏  | 615/861 [00:49<00:17, 13.92it/s]
 72%|███████▏  | 617/861 [00:49<00:17, 13.96it/s]
 72%|███████▏  | 619/861 [00:49<00:17, 13.97it/s]
 72%|███████▏  | 621/861 [00:49<00:17, 14.00it/s]
 72%|███████▏  | 623/861 [00:49<00:17, 13.99it/s]
 73%|███████▎  | 625/861 [00:49<00:16, 13.99it/s]
 73%|███████▎  | 627/861 [00:50<00:16, 14.01it/s]
 73%|███████▎  | 629/861 [00:50<00:16, 13.95it/s]
 73%|███████▎  | 631/861 [00:50<00:16, 13.97it/s]
 74%|███████▎  | 633/861 [00:50<00:16, 13.98it/s]
 74%|███████▍  | 635/861 [00:50<00:16, 13.99it/s]
 74%|███████▍  | 637/861 [00:50<00:16, 13.87it/s]
 74%|███████▍  | 639/861 [00:50<00:15, 13.94it/s]
 74%|███████▍  | 641/861 [00:51<00:15, 13.96it/s]


== Status ==
Current time: 2024-03-07 21:32:20 (running for 00:07:09.34)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (10 PENDING, 1 RUNNING, 4 TERMINATED)
+------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                 |                 |                    |                ch_size |                |             |
|------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00004 | RUNNING    | 172.19.0.1:9203 |     9.64769e-05 | 

 78%|███████▊  | 673/861 [00:53<00:13, 13.98it/s]
 78%|███████▊  | 675/861 [00:53<00:13, 13.97it/s]
 79%|███████▊  | 677/861 [00:53<00:13, 13.96it/s]
 79%|███████▉  | 679/861 [00:53<00:13, 13.94it/s]
 79%|███████▉  | 681/861 [00:53<00:12, 13.95it/s]
 79%|███████▉  | 683/861 [00:54<00:12, 13.97it/s]
 80%|███████▉  | 685/861 [00:54<00:12, 13.97it/s]
 80%|███████▉  | 687/861 [00:54<00:12, 13.98it/s]
 80%|████████  | 689/861 [00:54<00:12, 13.98it/s]
 80%|████████  | 691/861 [00:54<00:12, 13.99it/s]
 80%|████████  | 693/861 [00:54<00:12, 13.84it/s]
 81%|████████  | 695/861 [00:54<00:11, 13.89it/s]
 81%|████████  | 697/861 [00:55<00:11, 13.94it/s]
 81%|████████  | 699/861 [00:55<00:11, 13.95it/s]
 81%|████████▏ | 701/861 [00:55<00:11, 13.97it/s]
 82%|████████▏ | 703/861 [00:55<00:11, 13.96it/s]
 82%|████████▏ | 705/861 [00:55<00:11, 13.98it/s]
 82%|████████▏ | 707/861 [00:55<00:11, 13.95it/s]
 82%|████████▏ | 709/861 [00:55<00:10, 13.94it/s]
 83%|████████▎ | 711/861 [00:56<00:10, 13.95it/s]


== Status ==
Current time: 2024-03-07 21:32:25 (running for 00:07:14.38)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (10 PENDING, 1 RUNNING, 4 TERMINATED)
+------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                 |                 |                    |                ch_size |                |             |
|------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00004 | RUNNING    | 172.19.0.1:9203 |     9.64769e-05 | 

 86%|████████▋ | 743/861 [00:58<00:08, 13.95it/s]
 87%|████████▋ | 745/861 [00:58<00:08, 13.96it/s]
 87%|████████▋ | 747/861 [00:58<00:08, 13.97it/s]
 87%|████████▋ | 749/861 [00:58<00:08, 13.83it/s]
 87%|████████▋ | 751/861 [00:58<00:07, 13.91it/s]
 87%|████████▋ | 753/861 [00:59<00:07, 13.94it/s]
 88%|████████▊ | 755/861 [00:59<00:07, 13.94it/s]
 88%|████████▊ | 757/861 [00:59<00:07, 13.93it/s]
 88%|████████▊ | 759/861 [00:59<00:07, 13.94it/s]
 88%|████████▊ | 761/861 [00:59<00:07, 13.94it/s]
 89%|████████▊ | 763/861 [00:59<00:07, 13.93it/s]
 89%|████████▉ | 765/861 [00:59<00:06, 13.98it/s]
 89%|████████▉ | 767/861 [01:00<00:06, 14.00it/s]
 89%|████████▉ | 769/861 [01:00<00:06, 13.98it/s]
 90%|████████▉ | 771/861 [01:00<00:06, 13.98it/s]
 90%|████████▉ | 773/861 [01:00<00:06, 13.92it/s]
 90%|█████████ | 775/861 [01:00<00:06, 13.96it/s]
 90%|█████████ | 777/861 [01:00<00:06, 13.86it/s]
 90%|█████████ | 779/861 [01:00<00:05, 13.90it/s]
 91%|█████████ | 781/861 [01:01<00:05, 13.94it/s]


== Status ==
Current time: 2024-03-07 21:32:30 (running for 00:07:19.42)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (10 PENDING, 1 RUNNING, 4 TERMINATED)
+------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                 |                 |                    |                ch_size |                |             |
|------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00004 | RUNNING    | 172.19.0.1:9203 |     9.64769e-05 | 

 95%|█████████▍| 815/861 [01:03<00:03, 13.93it/s]
 95%|█████████▍| 817/861 [01:03<00:03, 13.87it/s]
 95%|█████████▌| 819/861 [01:03<00:03, 13.91it/s]
 95%|█████████▌| 821/861 [01:03<00:02, 13.91it/s]
 96%|█████████▌| 823/861 [01:04<00:02, 13.94it/s]
 96%|█████████▌| 825/861 [01:04<00:02, 13.94it/s]
 96%|█████████▌| 827/861 [01:04<00:02, 13.97it/s]
 96%|█████████▋| 829/861 [01:04<00:02, 13.96it/s]
 97%|█████████▋| 831/861 [01:04<00:02, 13.88it/s]
 97%|█████████▋| 833/861 [01:04<00:02, 13.92it/s]
 97%|█████████▋| 835/861 [01:04<00:01, 13.93it/s]
 97%|█████████▋| 837/861 [01:05<00:01, 13.92it/s]
 97%|█████████▋| 839/861 [01:05<00:01, 13.95it/s]
 98%|█████████▊| 841/861 [01:05<00:01, 13.97it/s]
 98%|█████████▊| 843/861 [01:05<00:01, 13.97it/s]
 98%|█████████▊| 845/861 [01:05<00:01, 13.91it/s]
 98%|█████████▊| 847/861 [01:05<00:01, 13.94it/s]
 99%|█████████▊| 849/861 [01:05<00:00, 13.97it/s]
 99%|█████████▉| 851/861 [01:06<00:00, 13.99it/s]
 99%|█████████▉| 853/861 [01:06<00:00, 13.96it/s]


[36m(_objective pid=9203)[0m {'eval_loss': 0.7290337085723877, 'eval_accuracy': 0.4177215189873418, 'eval_runtime': 1.2957, 'eval_samples_per_second': 60.973, 'eval_steps_per_second': 3.859, 'epoch': 3.0}
[36m(_objective pid=9203)[0m {'train_runtime': 68.159, 'train_samples_per_second': 12.632, 'train_steps_per_second': 12.632, 'train_loss': 0.7492605955897031, 'epoch': 3.0}
== Status ==
Current time: 2024-03-07 21:32:35 (running for 00:07:24.47)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (10 PENDING, 5 TERMINATED)
+------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|          

[36m(_objective pid=9452)[0m 2024-03-07 21:32:40.670383: E external/local_xla/xla/stream_executor/cuda/cuda_dnn.cc:9261] Unable to register cuDNN factory: Attempting to register factory for plugin cuDNN when one has already been registered
[36m(_objective pid=9452)[0m 2024-03-07 21:32:40.670445: E external/local_xla/xla/stream_executor/cuda/cuda_fft.cc:607] Unable to register cuFFT factory: Attempting to register factory for plugin cuFFT when one has already been registered
[36m(_objective pid=9452)[0m 2024-03-07 21:32:40.671762: E external/local_xla/xla/stream_executor/cuda/cuda_blas.cc:1515] Unable to register cuBLAS factory: Attempting to register factory for plugin cuBLAS when one has already been registered
[36m(_objective pid=9452)[0m Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']

== Status ==
Current time: 2024-03-07 21:32:45 (running for 00:07:34.55)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (9 PENDING, 1 RUNNING, 5 TERMINATED)
+------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                 |                 |                    |                ch_size |                |             |
|------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00005 | RUNNING    | 172.19.0.1:9452 |     7.30954e-06 |  

  1%|▏         | 19/1435 [00:01<01:43, 13.71it/s]
  1%|▏         | 21/1435 [00:01<01:42, 13.78it/s]
  2%|▏         | 23/1435 [00:01<01:42, 13.74it/s]
  2%|▏         | 25/1435 [00:01<01:41, 13.86it/s]
  2%|▏         | 27/1435 [00:02<01:41, 13.90it/s]
  2%|▏         | 29/1435 [00:02<01:40, 13.94it/s]
  2%|▏         | 31/1435 [00:02<01:40, 13.97it/s]
  2%|▏         | 33/1435 [00:02<01:40, 13.98it/s]
  2%|▏         | 35/1435 [00:02<01:40, 13.99it/s]
  3%|▎         | 37/1435 [00:02<01:40, 13.92it/s]
  3%|▎         | 39/1435 [00:02<01:39, 13.98it/s]
  3%|▎         | 41/1435 [00:03<01:40, 13.92it/s]
  3%|▎         | 43/1435 [00:03<01:39, 13.94it/s]
  3%|▎         | 45/1435 [00:03<01:39, 13.96it/s]
  3%|▎         | 47/1435 [00:03<01:39, 13.97it/s]
  3%|▎         | 49/1435 [00:03<01:40, 13.86it/s]
  4%|▎         | 51/1435 [00:03<01:40, 13.81it/s]
  4%|▎         | 53/1435 [00:04<01:39, 13.87it/s]
  4%|▍         | 55/1435 [00:04<01:39, 13.91it/s]
  4%|▍         | 57/1435 [00:04<01:39, 13.91it/s]


== Status ==
Current time: 2024-03-07 21:32:50 (running for 00:07:39.59)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (9 PENDING, 1 RUNNING, 5 TERMINATED)
+------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                 |                 |                    |                ch_size |                |             |
|------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00005 | RUNNING    | 172.19.0.1:9452 |     7.30954e-06 |  

  6%|▌         | 89/1435 [00:06<01:36, 13.94it/s]
  6%|▋         | 91/1435 [00:06<01:36, 13.91it/s]
  6%|▋         | 93/1435 [00:06<01:36, 13.94it/s]
  7%|▋         | 95/1435 [00:07<01:35, 13.97it/s]
  7%|▋         | 97/1435 [00:07<01:35, 13.99it/s]
  7%|▋         | 99/1435 [00:07<01:35, 14.00it/s]
  7%|▋         | 101/1435 [00:07<01:35, 14.02it/s]
  7%|▋         | 103/1435 [00:07<01:35, 14.02it/s]
  7%|▋         | 105/1435 [00:07<01:35, 13.92it/s]
  7%|▋         | 107/1435 [00:07<01:35, 13.95it/s]
  8%|▊         | 109/1435 [00:08<01:34, 13.98it/s]
  8%|▊         | 111/1435 [00:08<01:34, 14.00it/s]
  8%|▊         | 113/1435 [00:08<01:34, 14.01it/s]
  8%|▊         | 115/1435 [00:08<01:34, 14.02it/s]
  8%|▊         | 117/1435 [00:08<01:34, 13.99it/s]
  8%|▊         | 119/1435 [00:08<01:34, 13.93it/s]
  8%|▊         | 121/1435 [00:08<01:34, 13.91it/s]
  9%|▊         | 123/1435 [00:09<01:34, 13.95it/s]
  9%|▊         | 125/1435 [00:09<01:33, 13.98it/s]
  9%|▉         | 127/1435 [00:09<01:3

== Status ==
Current time: 2024-03-07 21:32:55 (running for 00:07:44.63)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (9 PENDING, 1 RUNNING, 5 TERMINATED)
+------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                 |                 |                    |                ch_size |                |             |
|------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00005 | RUNNING    | 172.19.0.1:9452 |     7.30954e-06 |  

 11%|█         | 159/1435 [00:11<01:31, 13.98it/s]
 11%|█         | 161/1435 [00:11<01:31, 13.91it/s]
 11%|█▏        | 163/1435 [00:11<01:31, 13.94it/s]
 11%|█▏        | 165/1435 [00:12<01:30, 13.98it/s]
 12%|█▏        | 167/1435 [00:12<01:30, 13.99it/s]
 12%|█▏        | 169/1435 [00:12<01:30, 13.95it/s]
 12%|█▏        | 171/1435 [00:12<01:30, 13.97it/s]
 12%|█▏        | 173/1435 [00:12<01:30, 13.97it/s]
 12%|█▏        | 175/1435 [00:12<01:30, 13.92it/s]
 12%|█▏        | 177/1435 [00:12<01:30, 13.94it/s]
 12%|█▏        | 179/1435 [00:13<01:29, 13.97it/s]
 13%|█▎        | 181/1435 [00:13<01:29, 13.99it/s]
 13%|█▎        | 183/1435 [00:13<01:29, 14.01it/s]
 13%|█▎        | 185/1435 [00:13<01:29, 13.97it/s]
 13%|█▎        | 187/1435 [00:13<01:29, 13.94it/s]
 13%|█▎        | 189/1435 [00:13<01:29, 13.87it/s]
 13%|█▎        | 191/1435 [00:13<01:29, 13.92it/s]
 13%|█▎        | 193/1435 [00:14<01:29, 13.95it/s]
 14%|█▎        | 195/1435 [00:14<01:29, 13.83it/s]
 14%|█▎        | 197/1435 [00:1

== Status ==
Current time: 2024-03-07 21:33:00 (running for 00:07:49.67)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (9 PENDING, 1 RUNNING, 5 TERMINATED)
+------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                 |                 |                    |                ch_size |                |             |
|------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00005 | RUNNING    | 172.19.0.1:9452 |     7.30954e-06 |  

 16%|█▌        | 231/1435 [00:16<01:26, 13.93it/s]
 16%|█▌        | 233/1435 [00:16<01:26, 13.94it/s]
 16%|█▋        | 235/1435 [00:17<01:25, 13.98it/s]
 17%|█▋        | 237/1435 [00:17<01:25, 13.98it/s]
 17%|█▋        | 239/1435 [00:17<01:25, 13.98it/s]
 17%|█▋        | 241/1435 [00:17<01:25, 14.01it/s]
 17%|█▋        | 243/1435 [00:17<01:25, 14.00it/s]
 17%|█▋        | 245/1435 [00:17<01:25, 13.92it/s]
 17%|█▋        | 247/1435 [00:17<01:25, 13.95it/s]
 17%|█▋        | 249/1435 [00:18<01:25, 13.95it/s]
 17%|█▋        | 251/1435 [00:18<01:24, 13.96it/s]
 18%|█▊        | 253/1435 [00:18<01:24, 13.94it/s]
 18%|█▊        | 255/1435 [00:18<01:24, 13.99it/s]
 18%|█▊        | 257/1435 [00:18<01:24, 13.96it/s]
 18%|█▊        | 259/1435 [00:18<01:24, 13.93it/s]
 18%|█▊        | 261/1435 [00:18<01:24, 13.96it/s]
 18%|█▊        | 263/1435 [00:19<01:23, 13.98it/s]
 18%|█▊        | 265/1435 [00:19<01:23, 13.96it/s]
 19%|█▊        | 267/1435 [00:19<01:23, 13.94it/s]
 19%|█▊        | 269/1435 [00:1

== Status ==
Current time: 2024-03-07 21:33:05 (running for 00:07:54.71)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (9 PENDING, 1 RUNNING, 5 TERMINATED)
+------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                 |                 |                    |                ch_size |                |             |
|------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00005 | RUNNING    | 172.19.0.1:9452 |     7.30954e-06 |  

[36m(_objective pid=9452)[0m 
 80%|████████  | 4/5 [00:00<00:00,  4.64it/s][A
[36m(_objective pid=9452)[0m 
                                                  
 20%|██        | 287/1435 [00:22<01:22, 13.96it/s]
100%|██████████| 5/5 [00:01<00:00,  4.48it/s][A
                                             [A


[36m(_objective pid=9452)[0m {'eval_loss': 0.7077564597129822, 'eval_accuracy': 0.4050632911392405, 'eval_runtime': 1.3046, 'eval_samples_per_second': 60.556, 'eval_steps_per_second': 3.833, 'epoch': 1.0}


 20%|██        | 289/1435 [00:22<05:07,  3.73it/s]
 20%|██        | 291/1435 [00:22<04:00,  4.76it/s]
 20%|██        | 293/1435 [00:22<03:12,  5.93it/s]
 21%|██        | 295/1435 [00:22<02:39,  7.16it/s]
 21%|██        | 297/1435 [00:22<02:15,  8.37it/s]
 21%|██        | 299/1435 [00:22<01:59,  9.52it/s]
 21%|██        | 301/1435 [00:23<01:47, 10.54it/s]
 21%|██        | 303/1435 [00:23<01:40, 11.30it/s]
 21%|██▏       | 305/1435 [00:23<01:34, 11.92it/s]
 21%|██▏       | 307/1435 [00:23<01:31, 12.39it/s]
 22%|██▏       | 309/1435 [00:23<01:27, 12.84it/s]
 22%|██▏       | 311/1435 [00:23<01:26, 13.05it/s]
 22%|██▏       | 313/1435 [00:23<01:24, 13.34it/s]
 22%|██▏       | 315/1435 [00:24<01:22, 13.55it/s]
 22%|██▏       | 317/1435 [00:24<01:21, 13.68it/s]
 22%|██▏       | 319/1435 [00:24<01:20, 13.78it/s]
 22%|██▏       | 321/1435 [00:24<01:20, 13.83it/s]
 23%|██▎       | 323/1435 [00:24<01:19, 13.92it/s]
 23%|██▎       | 325/1435 [00:24<01:20, 13.87it/s]
 23%|██▎       | 327/1435 [00:2

== Status ==
Current time: 2024-03-07 21:33:10 (running for 00:07:59.79)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (9 PENDING, 1 RUNNING, 5 TERMINATED)
+------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                 |                 |                    |                ch_size |                |             |
|------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00005 | RUNNING    | 172.19.0.1:9452 |     7.30954e-06 |  

 25%|██▍       | 353/1435 [00:26<01:17, 13.93it/s]
 25%|██▍       | 355/1435 [00:26<01:17, 13.98it/s]
 25%|██▍       | 357/1435 [00:27<01:17, 13.99it/s]
 25%|██▌       | 359/1435 [00:27<01:16, 13.99it/s]
 25%|██▌       | 361/1435 [00:27<01:16, 13.99it/s]
 25%|██▌       | 363/1435 [00:27<01:16, 13.98it/s]
 25%|██▌       | 365/1435 [00:27<01:16, 13.98it/s]
 26%|██▌       | 367/1435 [00:27<01:16, 13.92it/s]
 26%|██▌       | 369/1435 [00:27<01:16, 13.96it/s]
 26%|██▌       | 371/1435 [00:28<01:16, 13.98it/s]
 26%|██▌       | 373/1435 [00:28<01:15, 13.99it/s]
 26%|██▌       | 375/1435 [00:28<01:15, 13.96it/s]
 26%|██▋       | 377/1435 [00:28<01:15, 13.95it/s]
 26%|██▋       | 379/1435 [00:28<01:15, 13.97it/s]
 27%|██▋       | 381/1435 [00:28<01:15, 13.94it/s]
 27%|██▋       | 383/1435 [00:28<01:15, 13.97it/s]
 27%|██▋       | 385/1435 [00:29<01:15, 14.00it/s]
 27%|██▋       | 387/1435 [00:29<01:14, 14.02it/s]
 27%|██▋       | 389/1435 [00:29<01:14, 14.02it/s]
 27%|██▋       | 391/1435 [00:2

== Status ==
Current time: 2024-03-07 21:33:15 (running for 00:08:04.84)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (9 PENDING, 1 RUNNING, 5 TERMINATED)
+------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                 |                 |                    |                ch_size |                |             |
|------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00005 | RUNNING    | 172.19.0.1:9452 |     7.30954e-06 |  

 30%|██▉       | 425/1435 [00:31<01:12, 13.93it/s]
 30%|██▉       | 427/1435 [00:32<01:12, 13.97it/s]
 30%|██▉       | 429/1435 [00:32<01:11, 13.98it/s]
 30%|███       | 431/1435 [00:32<01:11, 13.95it/s]
 30%|███       | 433/1435 [00:32<01:11, 13.96it/s]
 30%|███       | 435/1435 [00:32<01:11, 13.96it/s]
 30%|███       | 437/1435 [00:32<01:11, 13.92it/s]
 31%|███       | 439/1435 [00:32<01:11, 13.92it/s]
 31%|███       | 441/1435 [00:33<01:11, 13.97it/s]
 31%|███       | 443/1435 [00:33<01:10, 13.98it/s]
 31%|███       | 445/1435 [00:33<01:10, 13.98it/s]
 31%|███       | 447/1435 [00:33<01:11, 13.91it/s]
 31%|███▏      | 449/1435 [00:33<01:10, 13.93it/s]
 31%|███▏      | 451/1435 [00:33<01:10, 13.87it/s]
 32%|███▏      | 453/1435 [00:33<01:10, 13.93it/s]
 32%|███▏      | 455/1435 [00:34<01:10, 13.97it/s]
 32%|███▏      | 457/1435 [00:34<01:10, 13.93it/s]
 32%|███▏      | 459/1435 [00:34<01:09, 13.95it/s]
 32%|███▏      | 461/1435 [00:34<01:10, 13.91it/s]
 32%|███▏      | 463/1435 [00:3

== Status ==
Current time: 2024-03-07 21:33:20 (running for 00:08:09.88)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (9 PENDING, 1 RUNNING, 5 TERMINATED)
+------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                 |                 |                    |                ch_size |                |             |
|------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00005 | RUNNING    | 172.19.0.1:9452 |     7.30954e-06 |  

 34%|███▍      | 495/1435 [00:37<01:07, 13.99it/s]
 35%|███▍      | 497/1435 [00:37<01:06, 14.00it/s]
 35%|███▍      | 500/1435 [00:37<01:06, 14.00it/s]


[36m(_objective pid=9452)[0m {'loss': 0.7396, 'grad_norm': 23.060691833496094, 'learning_rate': 4.762661844305631e-06, 'epoch': 1.74}


 35%|███▍      | 501/1435 [00:39<04:54,  3.18it/s]
 35%|███▌      | 503/1435 [00:39<03:45,  4.14it/s]
 35%|███▌      | 505/1435 [00:39<02:57,  5.24it/s]
 35%|███▌      | 507/1435 [00:39<02:23,  6.45it/s]
 35%|███▌      | 509/1435 [00:39<02:00,  7.70it/s]
 36%|███▌      | 511/1435 [00:39<01:44,  8.87it/s]
 36%|███▌      | 513/1435 [00:39<01:32,  9.95it/s]
 36%|███▌      | 515/1435 [00:40<01:24, 10.90it/s]
 36%|███▌      | 517/1435 [00:40<01:18, 11.69it/s]
 36%|███▌      | 519/1435 [00:40<01:14, 12.30it/s]
 36%|███▋      | 521/1435 [00:40<01:11, 12.75it/s]
 36%|███▋      | 523/1435 [00:40<01:09, 13.10it/s]
 37%|███▋      | 525/1435 [00:40<01:08, 13.31it/s]
 37%|███▋      | 527/1435 [00:40<01:07, 13.52it/s]
 37%|███▋      | 529/1435 [00:41<01:06, 13.67it/s]
 37%|███▋      | 531/1435 [00:41<01:06, 13.61it/s]
 37%|███▋      | 533/1435 [00:41<01:06, 13.62it/s]
 37%|███▋      | 535/1435 [00:41<01:05, 13.75it/s]
 37%|███▋      | 537/1435 [00:41<01:05, 13.77it/s]
 38%|███▊      | 539/1435 [00:4

== Status ==
Current time: 2024-03-07 21:33:25 (running for 00:08:14.92)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (9 PENDING, 1 RUNNING, 5 TERMINATED)
+------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                 |                 |                    |                ch_size |                |             |
|------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00005 | RUNNING    | 172.19.0.1:9452 |     7.30954e-06 |  

 38%|███▊      | 543/1435 [00:42<01:04, 13.89it/s]
 38%|███▊      | 545/1435 [00:42<01:03, 13.93it/s]
 38%|███▊      | 547/1435 [00:42<01:03, 13.92it/s]
 38%|███▊      | 549/1435 [00:42<01:03, 13.98it/s]
 38%|███▊      | 551/1435 [00:42<01:03, 13.96it/s]
 39%|███▊      | 553/1435 [00:42<01:03, 13.91it/s]
 39%|███▊      | 555/1435 [00:42<01:03, 13.97it/s]
 39%|███▉      | 557/1435 [00:43<01:02, 14.00it/s]
 39%|███▉      | 559/1435 [00:43<01:02, 14.01it/s]
 39%|███▉      | 561/1435 [00:43<01:02, 13.99it/s]
 39%|███▉      | 563/1435 [00:43<01:02, 13.98it/s]
 39%|███▉      | 565/1435 [00:43<01:02, 13.99it/s]
 40%|███▉      | 567/1435 [00:43<01:02, 13.92it/s]
 40%|███▉      | 569/1435 [00:43<01:02, 13.95it/s]
 40%|███▉      | 571/1435 [00:44<01:01, 13.99it/s]
 40%|███▉      | 573/1435 [00:44<01:01, 13.98it/s]
[36m(_objective pid=9452)[0m 
  0%|          | 0/5 [00:00<?, ?it/s][A
 40%|████      | 2/5 [00:00<00:00,  7.48it/s][A
[36m(_objective pid=9452)[0m 
 60%|██████    | 3/5 [00:00<00

[36m(_objective pid=9452)[0m {'eval_loss': 0.671744167804718, 'eval_accuracy': 0.5822784810126582, 'eval_runtime': 1.5372, 'eval_samples_per_second': 51.393, 'eval_steps_per_second': 3.253, 'epoch': 2.0}


 40%|████      | 577/1435 [00:46<03:20,  4.28it/s]
 40%|████      | 579/1435 [00:46<02:38,  5.41it/s]
 40%|████      | 581/1435 [00:46<02:08,  6.63it/s]
 41%|████      | 583/1435 [00:46<01:48,  7.87it/s]
 41%|████      | 585/1435 [00:46<01:33,  9.06it/s]
 41%|████      | 587/1435 [00:46<01:24, 10.09it/s]
 41%|████      | 589/1435 [00:46<01:16, 11.03it/s]


== Status ==
Current time: 2024-03-07 21:33:30 (running for 00:08:20.00)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (9 PENDING, 1 RUNNING, 5 TERMINATED)
+------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                 |                 |                    |                ch_size |                |             |
|------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00005 | RUNNING    | 172.19.0.1:9452 |     7.30954e-06 |  

 41%|████      | 591/1435 [00:47<01:11, 11.76it/s]
 41%|████▏     | 593/1435 [00:47<01:08, 12.35it/s]
 41%|████▏     | 595/1435 [00:47<01:05, 12.81it/s]
 42%|████▏     | 597/1435 [00:47<01:03, 13.16it/s]
 42%|████▏     | 599/1435 [00:47<01:02, 13.39it/s]
 42%|████▏     | 601/1435 [00:47<01:01, 13.48it/s]
 42%|████▏     | 603/1435 [00:47<01:01, 13.63it/s]
 42%|████▏     | 605/1435 [00:48<01:00, 13.75it/s]
 42%|████▏     | 607/1435 [00:48<00:59, 13.81it/s]
 42%|████▏     | 609/1435 [00:48<00:59, 13.83it/s]
 43%|████▎     | 611/1435 [00:48<00:59, 13.88it/s]
 43%|████▎     | 613/1435 [00:48<00:59, 13.88it/s]
 43%|████▎     | 615/1435 [00:48<00:59, 13.84it/s]
 43%|████▎     | 617/1435 [00:48<00:58, 13.90it/s]
 43%|████▎     | 619/1435 [00:49<00:58, 13.94it/s]
 43%|████▎     | 621/1435 [00:49<00:58, 13.96it/s]
 43%|████▎     | 623/1435 [00:49<00:58, 13.94it/s]
 44%|████▎     | 625/1435 [00:49<00:58, 13.96it/s]
 44%|████▎     | 627/1435 [00:49<00:57, 13.98it/s]
 44%|████▍     | 629/1435 [00:4

== Status ==
Current time: 2024-03-07 21:33:35 (running for 00:08:25.04)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (9 PENDING, 1 RUNNING, 5 TERMINATED)
+------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                 |                 |                    |                ch_size |                |             |
|------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00005 | RUNNING    | 172.19.0.1:9452 |     7.30954e-06 |  

 46%|████▌     | 663/1435 [00:52<00:55, 13.98it/s]
 46%|████▋     | 665/1435 [00:52<00:55, 14.00it/s]
 46%|████▋     | 667/1435 [00:52<00:54, 14.01it/s]
 47%|████▋     | 669/1435 [00:52<00:54, 13.97it/s]
 47%|████▋     | 671/1435 [00:52<00:54, 13.90it/s]
 47%|████▋     | 673/1435 [00:52<00:54, 13.93it/s]
 47%|████▋     | 675/1435 [00:53<00:54, 13.96it/s]
 47%|████▋     | 677/1435 [00:53<00:54, 13.98it/s]
 47%|████▋     | 679/1435 [00:53<00:53, 14.00it/s]
 47%|████▋     | 681/1435 [00:53<00:53, 13.99it/s]
 48%|████▊     | 683/1435 [00:53<00:53, 13.99it/s]
 48%|████▊     | 685/1435 [00:53<00:53, 13.93it/s]
 48%|████▊     | 687/1435 [00:53<00:53, 13.93it/s]
 48%|████▊     | 689/1435 [00:54<00:53, 13.96it/s]
 48%|████▊     | 691/1435 [00:54<00:53, 13.99it/s]
 48%|████▊     | 693/1435 [00:54<00:52, 14.00it/s]
 48%|████▊     | 695/1435 [00:54<00:52, 14.00it/s]
 49%|████▊     | 697/1435 [00:54<00:52, 13.97it/s]
 49%|████▊     | 699/1435 [00:54<00:52, 13.92it/s]
 49%|████▉     | 701/1435 [00:5

== Status ==
Current time: 2024-03-07 21:33:41 (running for 00:08:30.09)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (9 PENDING, 1 RUNNING, 5 TERMINATED)
+------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                 |                 |                    |                ch_size |                |             |
|------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00005 | RUNNING    | 172.19.0.1:9452 |     7.30954e-06 |  

 51%|█████     | 733/1435 [00:57<00:50, 14.01it/s]
 51%|█████     | 735/1435 [00:57<00:50, 13.96it/s]
 51%|█████▏    | 737/1435 [00:57<00:50, 13.95it/s]
 51%|█████▏    | 739/1435 [00:57<00:49, 13.96it/s]
 52%|█████▏    | 741/1435 [00:57<00:49, 13.91it/s]
 52%|█████▏    | 743/1435 [00:57<00:49, 13.94it/s]
 52%|█████▏    | 745/1435 [00:58<00:49, 13.95it/s]
 52%|█████▏    | 747/1435 [00:58<00:49, 13.97it/s]
 52%|█████▏    | 749/1435 [00:58<00:49, 13.96it/s]
 52%|█████▏    | 751/1435 [00:58<00:49, 13.92it/s]
 52%|█████▏    | 753/1435 [00:58<00:49, 13.90it/s]
 53%|█████▎    | 755/1435 [00:58<00:48, 13.90it/s]
 53%|█████▎    | 757/1435 [00:58<00:48, 13.95it/s]
 53%|█████▎    | 759/1435 [00:59<00:48, 13.96it/s]
 53%|█████▎    | 761/1435 [00:59<00:48, 13.98it/s]
 53%|█████▎    | 763/1435 [00:59<00:48, 13.98it/s]
 53%|█████▎    | 765/1435 [00:59<00:47, 13.98it/s]
 53%|█████▎    | 767/1435 [00:59<00:47, 13.95it/s]
 54%|█████▎    | 769/1435 [00:59<00:47, 13.90it/s]
 54%|█████▎    | 771/1435 [00:5

== Status ==
Current time: 2024-03-07 21:33:46 (running for 00:08:35.13)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (9 PENDING, 1 RUNNING, 5 TERMINATED)
+------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                 |                 |                    |                ch_size |                |             |
|------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00005 | RUNNING    | 172.19.0.1:9452 |     7.30954e-06 |  

 56%|█████▌    | 801/1435 [01:02<00:45, 13.94it/s]
 56%|█████▌    | 803/1435 [01:02<00:45, 13.94it/s]
 56%|█████▌    | 805/1435 [01:02<00:44, 14.00it/s]
 56%|█████▌    | 807/1435 [01:02<00:44, 13.97it/s]
 56%|█████▋    | 809/1435 [01:02<00:44, 13.99it/s]
 57%|█████▋    | 811/1435 [01:02<00:44, 13.95it/s]
 57%|█████▋    | 813/1435 [01:02<00:44, 13.98it/s]
 57%|█████▋    | 815/1435 [01:03<00:44, 13.96it/s]
 57%|█████▋    | 817/1435 [01:03<00:44, 13.96it/s]
 57%|█████▋    | 819/1435 [01:03<00:44, 14.00it/s]
 57%|█████▋    | 821/1435 [01:03<00:43, 13.98it/s]
 57%|█████▋    | 823/1435 [01:03<00:43, 13.97it/s]
 57%|█████▋    | 825/1435 [01:03<00:43, 13.89it/s]
 58%|█████▊    | 827/1435 [01:03<00:43, 13.94it/s]
 58%|█████▊    | 829/1435 [01:04<00:43, 13.97it/s]
 58%|█████▊    | 831/1435 [01:04<00:43, 13.91it/s]
 58%|█████▊    | 833/1435 [01:04<00:43, 13.96it/s]
 58%|█████▊    | 835/1435 [01:04<00:43, 13.94it/s]
 58%|█████▊    | 837/1435 [01:04<00:42, 13.95it/s]
 58%|█████▊    | 839/1435 [01:0

== Status ==
Current time: 2024-03-07 21:33:51 (running for 00:08:40.17)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (9 PENDING, 1 RUNNING, 5 TERMINATED)
+------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                 |                 |                    |                ch_size |                |             |
|------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00005 | RUNNING    | 172.19.0.1:9452 |     7.30954e-06 |  

[36m(_objective pid=9452)[0m 
 80%|████████  | 4/5 [00:00<00:00,  4.65it/s][A
[36m(_objective pid=9452)[0m 
                                                  
 60%|██████    | 861/1435 [01:07<00:40, 14.01it/s]
100%|██████████| 5/5 [00:01<00:00,  4.46it/s][A
                                             [A


[36m(_objective pid=9452)[0m {'eval_loss': 0.6615515351295471, 'eval_accuracy': 0.6329113924050633, 'eval_runtime': 1.3002, 'eval_samples_per_second': 60.758, 'eval_steps_per_second': 3.845, 'epoch': 3.0}


 60%|██████    | 863/1435 [01:07<02:33,  3.74it/s]
 60%|██████    | 865/1435 [01:07<01:59,  4.77it/s]
 60%|██████    | 867/1435 [01:08<01:35,  5.94it/s]
 61%|██████    | 869/1435 [01:08<01:18,  7.18it/s]
 61%|██████    | 871/1435 [01:08<01:07,  8.41it/s]
 61%|██████    | 873/1435 [01:08<00:58,  9.55it/s]
 61%|██████    | 875/1435 [01:08<00:53, 10.56it/s]
 61%|██████    | 877/1435 [01:08<00:49, 11.35it/s]
 61%|██████▏   | 879/1435 [01:08<00:46, 12.02it/s]
 61%|██████▏   | 881/1435 [01:09<00:44, 12.55it/s]
 62%|██████▏   | 883/1435 [01:09<00:42, 12.96it/s]
 62%|██████▏   | 885/1435 [01:09<00:41, 13.26it/s]
 62%|██████▏   | 887/1435 [01:09<00:40, 13.47it/s]
 62%|██████▏   | 889/1435 [01:09<00:40, 13.60it/s]
 62%|██████▏   | 891/1435 [01:09<00:39, 13.64it/s]
 62%|██████▏   | 893/1435 [01:09<00:39, 13.75it/s]
 62%|██████▏   | 895/1435 [01:10<00:39, 13.78it/s]
 63%|██████▎   | 897/1435 [01:10<00:38, 13.84it/s]
 63%|██████▎   | 899/1435 [01:10<00:38, 13.90it/s]
 63%|██████▎   | 901/1435 [01:1

== Status ==
Current time: 2024-03-07 21:33:56 (running for 00:08:45.19)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (9 PENDING, 1 RUNNING, 5 TERMINATED)
+------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                 |                 |                    |                ch_size |                |             |
|------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00005 | RUNNING    | 172.19.0.1:9452 |     7.30954e-06 |  

 64%|██████▍   | 925/1435 [01:12<00:36, 13.95it/s]
 65%|██████▍   | 927/1435 [01:12<00:36, 13.98it/s]
 65%|██████▍   | 929/1435 [01:12<00:36, 13.97it/s]
 65%|██████▍   | 931/1435 [01:12<00:36, 13.97it/s]
 65%|██████▌   | 933/1435 [01:12<00:36, 13.94it/s]
 65%|██████▌   | 935/1435 [01:13<00:35, 13.96it/s]
 65%|██████▌   | 937/1435 [01:13<00:35, 13.98it/s]
 65%|██████▌   | 939/1435 [01:13<00:35, 13.99it/s]
 66%|██████▌   | 941/1435 [01:13<00:35, 14.00it/s]
 66%|██████▌   | 943/1435 [01:13<00:35, 13.95it/s]
 66%|██████▌   | 945/1435 [01:13<00:35, 13.92it/s]
 66%|██████▌   | 947/1435 [01:13<00:35, 13.91it/s]
 66%|██████▌   | 949/1435 [01:14<00:34, 13.95it/s]
 66%|██████▋   | 951/1435 [01:14<00:34, 13.98it/s]
 66%|██████▋   | 953/1435 [01:14<00:34, 13.99it/s]
 67%|██████▋   | 955/1435 [01:14<00:34, 14.00it/s]
 67%|██████▋   | 957/1435 [01:14<00:34, 13.98it/s]
 67%|██████▋   | 959/1435 [01:14<00:34, 13.91it/s]
 67%|██████▋   | 961/1435 [01:14<00:34, 13.94it/s]
 67%|██████▋   | 963/1435 [01:1

== Status ==
Current time: 2024-03-07 21:34:01 (running for 00:08:50.24)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (9 PENDING, 1 RUNNING, 5 TERMINATED)
+------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                 |                 |                    |                ch_size |                |             |
|------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00005 | RUNNING    | 172.19.0.1:9452 |     7.30954e-06 |  

 69%|██████▉   | 995/1435 [01:17<00:31, 13.94it/s]
 69%|██████▉   | 997/1435 [01:17<00:31, 13.96it/s]
 70%|██████▉   | 999/1435 [01:17<00:31, 13.95it/s]
 70%|██████▉   | 1000/1435 [01:17<00:31, 13.95it/s]


[36m(_objective pid=9452)[0m {'loss': 0.6302, 'grad_norm': 17.61677360534668, 'learning_rate': 2.215783852698342e-06, 'epoch': 3.48}


 70%|██████▉   | 1001/1435 [01:19<02:16,  3.18it/s]
 70%|██████▉   | 1003/1435 [01:19<01:44,  4.15it/s]
 70%|███████   | 1005/1435 [01:19<01:21,  5.25it/s]
 70%|███████   | 1007/1435 [01:19<01:06,  6.44it/s]
 70%|███████   | 1009/1435 [01:19<00:55,  7.69it/s]
 70%|███████   | 1011/1435 [01:20<00:47,  8.90it/s]
 71%|███████   | 1013/1435 [01:20<00:42,  9.99it/s]
 71%|███████   | 1015/1435 [01:20<00:38, 10.92it/s]
 71%|███████   | 1017/1435 [01:20<00:35, 11.70it/s]
 71%|███████   | 1019/1435 [01:20<00:33, 12.27it/s]
 71%|███████   | 1021/1435 [01:20<00:32, 12.71it/s]
 71%|███████▏  | 1023/1435 [01:20<00:31, 13.08it/s]
 71%|███████▏  | 1025/1435 [01:21<00:30, 13.36it/s]
 72%|███████▏  | 1027/1435 [01:21<00:30, 13.55it/s]
 72%|███████▏  | 1029/1435 [01:21<00:29, 13.68it/s]
 72%|███████▏  | 1031/1435 [01:21<00:29, 13.74it/s]
 72%|███████▏  | 1033/1435 [01:21<00:29, 13.80it/s]
 72%|███████▏  | 1035/1435 [01:21<00:29, 13.79it/s]
 72%|███████▏  | 1037/1435 [01:21<00:28, 13.84it/s]
 72%|███████

== Status ==
Current time: 2024-03-07 21:34:06 (running for 00:08:55.28)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (9 PENDING, 1 RUNNING, 5 TERMINATED)
+------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                 |                 |                    |                ch_size |                |             |
|------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00005 | RUNNING    | 172.19.0.1:9452 |     7.30954e-06 |  

 73%|███████▎  | 1041/1435 [01:22<00:28, 13.92it/s]
 73%|███████▎  | 1043/1435 [01:22<00:28, 13.96it/s]
 73%|███████▎  | 1045/1435 [01:22<00:27, 13.98it/s]
 73%|███████▎  | 1047/1435 [01:22<00:27, 13.92it/s]
 73%|███████▎  | 1049/1435 [01:22<00:27, 13.89it/s]
 73%|███████▎  | 1051/1435 [01:22<00:27, 13.94it/s]
 73%|███████▎  | 1053/1435 [01:23<00:27, 13.97it/s]
 74%|███████▎  | 1055/1435 [01:23<00:27, 13.98it/s]
 74%|███████▎  | 1057/1435 [01:23<00:27, 13.98it/s]
 74%|███████▍  | 1059/1435 [01:23<00:26, 13.98it/s]
 74%|███████▍  | 1061/1435 [01:23<00:26, 13.95it/s]
 74%|███████▍  | 1063/1435 [01:23<00:26, 13.84it/s]
 74%|███████▍  | 1065/1435 [01:23<00:26, 13.90it/s]
 74%|███████▍  | 1067/1435 [01:24<00:26, 13.94it/s]
 74%|███████▍  | 1069/1435 [01:24<00:26, 13.97it/s]
 75%|███████▍  | 1071/1435 [01:24<00:26, 13.99it/s]
 75%|███████▍  | 1073/1435 [01:24<00:25, 13.99it/s]
 75%|███████▍  | 1075/1435 [01:24<00:25, 13.93it/s]
 75%|███████▌  | 1077/1435 [01:24<00:25, 13.90it/s]
 75%|███████

== Status ==
Current time: 2024-03-07 21:34:11 (running for 00:09:00.33)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (9 PENDING, 1 RUNNING, 5 TERMINATED)
+------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                 |                 |                    |                ch_size |                |             |
|------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00005 | RUNNING    | 172.19.0.1:9452 |     7.30954e-06 |  

 78%|███████▊  | 1115/1435 [01:27<00:22, 13.94it/s]
 78%|███████▊  | 1117/1435 [01:27<00:22, 13.97it/s]
 78%|███████▊  | 1119/1435 [01:27<00:22, 13.92it/s]
 78%|███████▊  | 1121/1435 [01:27<00:22, 13.96it/s]
 78%|███████▊  | 1123/1435 [01:28<00:22, 13.98it/s]
 78%|███████▊  | 1125/1435 [01:28<00:22, 13.91it/s]
 79%|███████▊  | 1127/1435 [01:28<00:22, 13.94it/s]
 79%|███████▊  | 1129/1435 [01:28<00:21, 13.96it/s]
 79%|███████▉  | 1131/1435 [01:28<00:21, 13.98it/s]
 79%|███████▉  | 1133/1435 [01:28<00:21, 13.96it/s]
 79%|███████▉  | 1135/1435 [01:28<00:21, 13.85it/s]
 79%|███████▉  | 1137/1435 [01:29<00:21, 13.72it/s]
 79%|███████▉  | 1139/1435 [01:29<00:21, 13.80it/s]
 80%|███████▉  | 1141/1435 [01:29<00:21, 13.83it/s]
 80%|███████▉  | 1143/1435 [01:29<00:21, 13.88it/s]
 80%|███████▉  | 1145/1435 [01:29<00:20, 13.91it/s]
 80%|███████▉  | 1147/1435 [01:29<00:20, 13.87it/s]
[36m(_objective pid=9452)[0m 
  0%|          | 0/5 [00:00<?, ?it/s][A
[36m(_objective pid=9452)[0m 
 40%|████  

[36m(_objective pid=9452)[0m {'eval_loss': 0.856070876121521, 'eval_accuracy': 0.6329113924050633, 'eval_runtime': 1.9609, 'eval_samples_per_second': 40.287, 'eval_steps_per_second': 2.55, 'epoch': 4.0}


 80%|████████  | 1151/1435 [01:32<01:18,  3.60it/s]
 80%|████████  | 1153/1435 [01:32<01:00,  4.63it/s]
 80%|████████  | 1155/1435 [01:32<00:48,  5.79it/s]


== Status ==
Current time: 2024-03-07 21:34:16 (running for 00:09:05.36)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (9 PENDING, 1 RUNNING, 5 TERMINATED)
+------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                 |                 |                    |                ch_size |                |             |
|------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00005 | RUNNING    | 172.19.0.1:9452 |     7.30954e-06 |  

 81%|████████  | 1157/1435 [01:32<00:39,  7.02it/s]
 81%|████████  | 1159/1435 [01:32<00:33,  8.25it/s]
 81%|████████  | 1161/1435 [01:32<00:29,  9.30it/s]
 81%|████████  | 1163/1435 [01:32<00:26, 10.22it/s]
 81%|████████  | 1165/1435 [01:33<00:24, 11.13it/s]
 81%|████████▏ | 1167/1435 [01:33<00:22, 11.84it/s]
 81%|████████▏ | 1169/1435 [01:33<00:21, 12.40it/s]
 82%|████████▏ | 1171/1435 [01:33<00:20, 12.83it/s]
 82%|████████▏ | 1173/1435 [01:33<00:19, 13.15it/s]
 82%|████████▏ | 1175/1435 [01:33<00:19, 13.32it/s]
 82%|████████▏ | 1177/1435 [01:33<00:19, 13.50it/s]
 82%|████████▏ | 1179/1435 [01:34<00:18, 13.65it/s]
 82%|████████▏ | 1181/1435 [01:34<00:18, 13.73it/s]
 82%|████████▏ | 1183/1435 [01:34<00:18, 13.73it/s]
 83%|████████▎ | 1185/1435 [01:34<00:18, 13.84it/s]
 83%|████████▎ | 1187/1435 [01:34<00:17, 13.89it/s]
 83%|████████▎ | 1189/1435 [01:34<00:17, 13.89it/s]
 83%|████████▎ | 1191/1435 [01:34<00:17, 13.94it/s]
 83%|████████▎ | 1193/1435 [01:35<00:17, 13.93it/s]
 83%|███████

== Status ==
Current time: 2024-03-07 21:34:21 (running for 00:09:10.41)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (9 PENDING, 1 RUNNING, 5 TERMINATED)
+------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                 |                 |                    |                ch_size |                |             |
|------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00005 | RUNNING    | 172.19.0.1:9452 |     7.30954e-06 |  

 85%|████████▌ | 1225/1435 [01:37<00:15, 13.93it/s]
 86%|████████▌ | 1227/1435 [01:37<00:14, 13.94it/s]
 86%|████████▌ | 1229/1435 [01:37<00:14, 13.97it/s]
 86%|████████▌ | 1231/1435 [01:37<00:14, 13.89it/s]
 86%|████████▌ | 1233/1435 [01:38<00:14, 13.90it/s]
 86%|████████▌ | 1235/1435 [01:38<00:14, 13.94it/s]
 86%|████████▌ | 1237/1435 [01:38<00:14, 13.97it/s]
 86%|████████▋ | 1239/1435 [01:38<00:14, 13.95it/s]
 86%|████████▋ | 1241/1435 [01:38<00:13, 13.91it/s]
 87%|████████▋ | 1243/1435 [01:38<00:13, 13.90it/s]
 87%|████████▋ | 1245/1435 [01:38<00:13, 13.90it/s]
 87%|████████▋ | 1247/1435 [01:39<00:13, 13.93it/s]
 87%|████████▋ | 1249/1435 [01:39<00:13, 13.92it/s]
 87%|████████▋ | 1251/1435 [01:39<00:13, 13.94it/s]
 87%|████████▋ | 1253/1435 [01:39<00:13, 13.96it/s]
 87%|████████▋ | 1255/1435 [01:39<00:12, 13.97it/s]
 88%|████████▊ | 1257/1435 [01:39<00:12, 13.95it/s]
 88%|████████▊ | 1259/1435 [01:39<00:12, 13.92it/s]
 88%|████████▊ | 1261/1435 [01:40<00:12, 13.93it/s]
 88%|███████

== Status ==
Current time: 2024-03-07 21:34:26 (running for 00:09:15.45)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (9 PENDING, 1 RUNNING, 5 TERMINATED)
+------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                 |                 |                    |                ch_size |                |             |
|------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00005 | RUNNING    | 172.19.0.1:9452 |     7.30954e-06 |  

 90%|█████████ | 1295/1435 [01:42<00:10, 13.97it/s]
 90%|█████████ | 1297/1435 [01:42<00:09, 13.96it/s]
 91%|█████████ | 1299/1435 [01:42<00:09, 13.91it/s]
 91%|█████████ | 1301/1435 [01:42<00:09, 13.96it/s]
 91%|█████████ | 1303/1435 [01:43<00:09, 13.94it/s]
 91%|█████████ | 1305/1435 [01:43<00:09, 13.93it/s]
 91%|█████████ | 1307/1435 [01:43<00:09, 13.95it/s]
 91%|█████████ | 1309/1435 [01:43<00:09, 13.98it/s]
 91%|█████████▏| 1311/1435 [01:43<00:08, 13.94it/s]
 91%|█████████▏| 1313/1435 [01:43<00:08, 13.84it/s]
 92%|█████████▏| 1315/1435 [01:43<00:08, 13.91it/s]
 92%|█████████▏| 1317/1435 [01:44<00:08, 13.92it/s]
 92%|█████████▏| 1319/1435 [01:44<00:08, 13.95it/s]
 92%|█████████▏| 1321/1435 [01:44<00:08, 13.93it/s]
 92%|█████████▏| 1323/1435 [01:44<00:08, 13.96it/s]
 92%|█████████▏| 1325/1435 [01:44<00:07, 13.96it/s]
 92%|█████████▏| 1327/1435 [01:44<00:07, 13.90it/s]
 93%|█████████▎| 1329/1435 [01:44<00:07, 13.94it/s]
 93%|█████████▎| 1331/1435 [01:45<00:07, 13.96it/s]
 93%|███████

== Status ==
Current time: 2024-03-07 21:34:31 (running for 00:09:20.50)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (9 PENDING, 1 RUNNING, 5 TERMINATED)
+------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                 |                 |                    |                ch_size |                |             |
|------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00005 | RUNNING    | 172.19.0.1:9452 |     7.30954e-06 |  

 95%|█████████▌| 1367/1435 [01:47<00:04, 13.94it/s]
 95%|█████████▌| 1369/1435 [01:47<00:04, 13.85it/s]
 96%|█████████▌| 1371/1435 [01:47<00:04, 13.91it/s]
 96%|█████████▌| 1373/1435 [01:48<00:04, 13.82it/s]
 96%|█████████▌| 1375/1435 [01:48<00:04, 13.77it/s]
 96%|█████████▌| 1377/1435 [01:48<00:04, 13.84it/s]
 96%|█████████▌| 1379/1435 [01:48<00:04, 13.89it/s]
 96%|█████████▌| 1381/1435 [01:48<00:03, 13.87it/s]
 96%|█████████▋| 1383/1435 [01:48<00:03, 13.83it/s]
 97%|█████████▋| 1385/1435 [01:48<00:03, 13.89it/s]
 97%|█████████▋| 1387/1435 [01:49<00:03, 13.95it/s]
 97%|█████████▋| 1389/1435 [01:49<00:03, 13.98it/s]
 97%|█████████▋| 1391/1435 [01:49<00:03, 13.99it/s]
 97%|█████████▋| 1393/1435 [01:49<00:03, 13.99it/s]
 97%|█████████▋| 1395/1435 [01:49<00:02, 13.93it/s]
 97%|█████████▋| 1397/1435 [01:49<00:02, 13.86it/s]
 97%|█████████▋| 1399/1435 [01:49<00:02, 13.90it/s]
 98%|█████████▊| 1401/1435 [01:50<00:02, 13.88it/s]
 98%|█████████▊| 1403/1435 [01:50<00:02, 13.91it/s]
 98%|███████

== Status ==
Current time: 2024-03-07 21:34:36 (running for 00:09:25.54)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (9 PENDING, 1 RUNNING, 5 TERMINATED)
+------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                 |                 |                    |                ch_size |                |             |
|------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00005 | RUNNING    | 172.19.0.1:9452 |     7.30954e-06 |  

100%|██████████| 1435/1435 [01:52<00:00, 13.98it/s]
[36m(_objective pid=9452)[0m 
  0%|          | 0/5 [00:00<?, ?it/s][A
[36m(_objective pid=9452)[0m 
 40%|████      | 2/5 [00:00<00:00,  7.62it/s][A
[36m(_objective pid=9452)[0m 
 60%|██████    | 3/5 [00:00<00:00,  5.36it/s][A
[36m(_objective pid=9452)[0m 
 80%|████████  | 4/5 [00:00<00:00,  4.64it/s][A
[36m(_objective pid=9452)[0m 
                                                   
100%|██████████| 1435/1435 [01:53<00:00, 13.98it/s]
100%|██████████| 5/5 [00:01<00:00,  4.45it/s][A
100%|██████████| 1435/1435 [01:53<00:00, 12.61it/s]


[36m(_objective pid=9452)[0m {'eval_loss': 0.9786921739578247, 'eval_accuracy': 0.6455696202531646, 'eval_runtime': 1.3023, 'eval_samples_per_second': 60.664, 'eval_steps_per_second': 3.839, 'epoch': 5.0}
[36m(_objective pid=9452)[0m {'train_runtime': 113.8161, 'train_samples_per_second': 12.608, 'train_steps_per_second': 12.608, 'train_loss': 0.6675413125068053, 'epoch': 5.0}
== Status ==
Current time: 2024-03-07 21:34:41 (running for 00:09:30.62)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (9 PENDING, 6 TERMINATED)
+------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|         

[36m(_objective pid=9810)[0m 2024-03-07 21:34:43.637111: E external/local_xla/xla/stream_executor/cuda/cuda_dnn.cc:9261] Unable to register cuDNN factory: Attempting to register factory for plugin cuDNN when one has already been registered
[36m(_objective pid=9810)[0m 2024-03-07 21:34:43.637164: E external/local_xla/xla/stream_executor/cuda/cuda_fft.cc:607] Unable to register cuFFT factory: Attempting to register factory for plugin cuFFT when one has already been registered
[36m(_objective pid=9810)[0m 2024-03-07 21:34:43.638537: E external/local_xla/xla/stream_executor/cuda/cuda_blas.cc:1515] Unable to register cuBLAS factory: Attempting to register factory for plugin cuBLAS when one has already been registered
[36m(_objective pid=9810)[0m Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']

== Status ==
Current time: 2024-03-07 21:34:46 (running for 00:09:35.70)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (8 PENDING, 1 RUNNING, 6 TERMINATED)
+------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                 |                 |                    |                ch_size |                |             |
|------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00006 | RUNNING    | 172.19.0.1:9810 |     1.90102e-06 |  

  0%|          | 0/108 [00:00<?, ?it/s]
  1%|          | 1/108 [00:00<00:58,  1.81it/s]
  2%|▏         | 2/108 [00:00<00:45,  2.35it/s]
  3%|▎         | 3/108 [00:01<00:41,  2.54it/s]
  4%|▎         | 4/108 [00:01<00:39,  2.64it/s]
  5%|▍         | 5/108 [00:01<00:38,  2.69it/s]
  6%|▌         | 6/108 [00:02<00:37,  2.74it/s]
  6%|▋         | 7/108 [00:02<00:36,  2.75it/s]
  7%|▋         | 8/108 [00:03<00:36,  2.77it/s]
  8%|▊         | 9/108 [00:03<00:35,  2.78it/s]
  9%|▉         | 10/108 [00:03<00:35,  2.79it/s]
 10%|█         | 11/108 [00:04<00:34,  2.79it/s]
 11%|█         | 12/108 [00:04<00:34,  2.80it/s]


== Status ==
Current time: 2024-03-07 21:34:51 (running for 00:09:40.75)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (8 PENDING, 1 RUNNING, 6 TERMINATED)
+------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                 |                 |                    |                ch_size |                |             |
|------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00006 | RUNNING    | 172.19.0.1:9810 |     1.90102e-06 |  

 12%|█▏        | 13/108 [00:04<00:33,  2.80it/s]
 13%|█▎        | 14/108 [00:05<00:33,  2.80it/s]
 14%|█▍        | 15/108 [00:05<00:33,  2.81it/s]
 15%|█▍        | 16/108 [00:05<00:32,  2.80it/s]
 16%|█▌        | 17/108 [00:06<00:32,  2.81it/s]
 17%|█▋        | 18/108 [00:06<00:32,  2.81it/s]
 18%|█▊        | 19/108 [00:06<00:31,  2.81it/s]
 19%|█▊        | 20/108 [00:07<00:31,  2.81it/s]
 19%|█▉        | 21/108 [00:07<00:31,  2.79it/s]
 20%|██        | 22/108 [00:08<00:30,  2.80it/s]
 21%|██▏       | 23/108 [00:08<00:30,  2.80it/s]
 22%|██▏       | 24/108 [00:08<00:30,  2.80it/s]
 23%|██▎       | 25/108 [00:09<00:29,  2.81it/s]
 24%|██▍       | 26/108 [00:09<00:29,  2.81it/s]


== Status ==
Current time: 2024-03-07 21:34:56 (running for 00:09:45.80)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (8 PENDING, 1 RUNNING, 6 TERMINATED)
+------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                 |                 |                    |                ch_size |                |             |
|------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00006 | RUNNING    | 172.19.0.1:9810 |     1.90102e-06 |  

 25%|██▌       | 27/108 [00:09<00:28,  2.80it/s]
 26%|██▌       | 28/108 [00:10<00:28,  2.80it/s]
 27%|██▋       | 29/108 [00:10<00:28,  2.81it/s]
 28%|██▊       | 30/108 [00:10<00:27,  2.80it/s]
 29%|██▊       | 31/108 [00:11<00:27,  2.81it/s]
 30%|██▉       | 32/108 [00:11<00:27,  2.80it/s]
 31%|███       | 33/108 [00:11<00:26,  2.80it/s]
 31%|███▏      | 34/108 [00:12<00:26,  2.80it/s]
 32%|███▏      | 35/108 [00:12<00:25,  2.81it/s]
 33%|███▎      | 36/108 [00:12<00:24,  2.91it/s]
[36m(_objective pid=9810)[0m 
  0%|          | 0/5 [00:00<?, ?it/s][A
[36m(_objective pid=9810)[0m 
 40%|████      | 2/5 [00:00<00:00,  7.62it/s][A
[36m(_objective pid=9810)[0m 
 60%|██████    | 3/5 [00:00<00:00,  5.34it/s][A
[36m(_objective pid=9810)[0m 
 80%|████████  | 4/5 [00:00<00:00,  4.67it/s][A


[36m(_objective pid=9810)[0m {'eval_loss': 0.6912899613380432, 'eval_accuracy': 0.5949367088607594, 'eval_runtime': 1.2951, 'eval_samples_per_second': 61.001, 'eval_steps_per_second': 3.861, 'epoch': 1.0}


[36m(_objective pid=9810)[0m 
                                                
 33%|███▎      | 36/108 [00:14<00:24,  2.91it/s]
100%|██████████| 5/5 [00:01<00:00,  4.49it/s][A
                                             [A
 34%|███▍      | 37/108 [00:14<00:52,  1.35it/s]


== Status ==
Current time: 2024-03-07 21:35:01 (running for 00:09:50.85)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (8 PENDING, 1 RUNNING, 6 TERMINATED)
+------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                 |                 |                    |                ch_size |                |             |
|------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00006 | RUNNING    | 172.19.0.1:9810 |     1.90102e-06 |  

 35%|███▌      | 38/108 [00:14<00:43,  1.60it/s]
 36%|███▌      | 39/108 [00:15<00:37,  1.83it/s]
 37%|███▋      | 40/108 [00:15<00:33,  2.03it/s]
 38%|███▊      | 41/108 [00:16<00:30,  2.21it/s]
 39%|███▉      | 42/108 [00:16<00:27,  2.37it/s]
 40%|███▉      | 43/108 [00:16<00:26,  2.48it/s]
 41%|████      | 44/108 [00:17<00:24,  2.57it/s]
 42%|████▏     | 45/108 [00:17<00:23,  2.64it/s]
 43%|████▎     | 46/108 [00:17<00:23,  2.68it/s]
 44%|████▎     | 47/108 [00:18<00:22,  2.72it/s]
 44%|████▍     | 48/108 [00:18<00:21,  2.74it/s]
 45%|████▌     | 49/108 [00:18<00:21,  2.76it/s]
 46%|████▋     | 50/108 [00:19<00:20,  2.77it/s]
 47%|████▋     | 51/108 [00:19<00:20,  2.78it/s]


== Status ==
Current time: 2024-03-07 21:35:06 (running for 00:09:55.89)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (8 PENDING, 1 RUNNING, 6 TERMINATED)
+------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                 |                 |                    |                ch_size |                |             |
|------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00006 | RUNNING    | 172.19.0.1:9810 |     1.90102e-06 |  

 48%|████▊     | 52/108 [00:20<00:20,  2.79it/s]
 49%|████▉     | 53/108 [00:20<00:19,  2.80it/s]
 50%|█████     | 54/108 [00:20<00:19,  2.80it/s]
 51%|█████     | 55/108 [00:21<00:18,  2.79it/s]
 52%|█████▏    | 56/108 [00:21<00:18,  2.80it/s]
 53%|█████▎    | 57/108 [00:21<00:18,  2.79it/s]
 54%|█████▎    | 58/108 [00:22<00:17,  2.80it/s]
 55%|█████▍    | 59/108 [00:22<00:20,  2.40it/s]
 56%|█████▌    | 60/108 [00:23<00:19,  2.52it/s]
 56%|█████▋    | 61/108 [00:23<00:18,  2.60it/s]
 57%|█████▋    | 62/108 [00:23<00:17,  2.65it/s]
 58%|█████▊    | 63/108 [00:24<00:16,  2.69it/s]
 59%|█████▉    | 64/108 [00:24<00:16,  2.73it/s]
 60%|██████    | 65/108 [00:24<00:15,  2.74it/s]


== Status ==
Current time: 2024-03-07 21:35:11 (running for 00:10:00.93)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (8 PENDING, 1 RUNNING, 6 TERMINATED)
+------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                 |                 |                    |                ch_size |                |             |
|------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00006 | RUNNING    | 172.19.0.1:9810 |     1.90102e-06 |  

 61%|██████    | 66/108 [00:25<00:15,  2.76it/s]
 62%|██████▏   | 67/108 [00:25<00:14,  2.78it/s]
 63%|██████▎   | 68/108 [00:25<00:14,  2.78it/s]
 64%|██████▍   | 69/108 [00:26<00:13,  2.79it/s]
 65%|██████▍   | 70/108 [00:26<00:13,  2.79it/s]
 66%|██████▌   | 71/108 [00:26<00:13,  2.79it/s]
 67%|██████▋   | 72/108 [00:27<00:12,  2.89it/s]
[36m(_objective pid=9810)[0m 
  0%|          | 0/5 [00:00<?, ?it/s][A
[36m(_objective pid=9810)[0m 
 40%|████      | 2/5 [00:00<00:00,  7.55it/s][A
[36m(_objective pid=9810)[0m 
 60%|██████    | 3/5 [00:00<00:00,  5.35it/s][A
[36m(_objective pid=9810)[0m 
 80%|████████  | 4/5 [00:00<00:00,  4.64it/s][A


[36m(_objective pid=9810)[0m {'eval_loss': 0.6935284733772278, 'eval_accuracy': 0.4936708860759494, 'eval_runtime': 1.3003, 'eval_samples_per_second': 60.756, 'eval_steps_per_second': 3.845, 'epoch': 2.0}


[36m(_objective pid=9810)[0m 
                                                
 67%|██████▋   | 72/108 [00:28<00:12,  2.89it/s]
100%|██████████| 5/5 [00:01<00:00,  4.47it/s][A
                                             [A
 68%|██████▊   | 73/108 [00:28<00:26,  1.34it/s]
 69%|██████▊   | 74/108 [00:29<00:21,  1.59it/s]
 69%|██████▉   | 75/108 [00:29<00:18,  1.83it/s]


== Status ==
Current time: 2024-03-07 21:35:16 (running for 00:10:05.98)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (8 PENDING, 1 RUNNING, 6 TERMINATED)
+------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                 |                 |                    |                ch_size |                |             |
|------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00006 | RUNNING    | 172.19.0.1:9810 |     1.90102e-06 |  

 70%|███████   | 76/108 [00:30<00:15,  2.05it/s]
 71%|███████▏  | 77/108 [00:30<00:13,  2.22it/s]
 72%|███████▏  | 78/108 [00:30<00:12,  2.37it/s]
 73%|███████▎  | 79/108 [00:31<00:11,  2.49it/s]
 74%|███████▍  | 80/108 [00:31<00:10,  2.58it/s]
 75%|███████▌  | 81/108 [00:31<00:10,  2.63it/s]
 76%|███████▌  | 82/108 [00:32<00:09,  2.68it/s]
 77%|███████▋  | 83/108 [00:32<00:09,  2.73it/s]
 78%|███████▊  | 84/108 [00:32<00:08,  2.74it/s]
 79%|███████▊  | 85/108 [00:33<00:08,  2.76it/s]
 80%|███████▉  | 86/108 [00:33<00:07,  2.77it/s]
 81%|████████  | 87/108 [00:33<00:07,  2.78it/s]
 81%|████████▏ | 88/108 [00:34<00:07,  2.79it/s]
 82%|████████▏ | 89/108 [00:34<00:06,  2.79it/s]


== Status ==
Current time: 2024-03-07 21:35:21 (running for 00:10:11.03)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (8 PENDING, 1 RUNNING, 6 TERMINATED)
+------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                 |                 |                    |                ch_size |                |             |
|------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00006 | RUNNING    | 172.19.0.1:9810 |     1.90102e-06 |  

 83%|████████▎ | 90/108 [00:35<00:06,  2.79it/s]
 84%|████████▍ | 91/108 [00:35<00:06,  2.79it/s]
 85%|████████▌ | 92/108 [00:35<00:05,  2.80it/s]
 86%|████████▌ | 93/108 [00:36<00:05,  2.79it/s]
 87%|████████▋ | 94/108 [00:36<00:05,  2.80it/s]
 88%|████████▊ | 95/108 [00:36<00:04,  2.79it/s]
 89%|████████▉ | 96/108 [00:37<00:04,  2.80it/s]
 90%|████████▉ | 97/108 [00:37<00:03,  2.80it/s]
 91%|█████████ | 98/108 [00:37<00:03,  2.80it/s]
 92%|█████████▏| 99/108 [00:38<00:03,  2.81it/s]
 93%|█████████▎| 100/108 [00:38<00:02,  2.80it/s]
 94%|█████████▎| 101/108 [00:38<00:02,  2.79it/s]
 94%|█████████▍| 102/108 [00:39<00:02,  2.80it/s]
 95%|█████████▌| 103/108 [00:39<00:01,  2.80it/s]
 96%|█████████▋| 104/108 [00:40<00:01,  2.80it/s]


== Status ==
Current time: 2024-03-07 21:35:26 (running for 00:10:16.07)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (8 PENDING, 1 RUNNING, 6 TERMINATED)
+------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                 |                 |                    |                ch_size |                |             |
|------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00006 | RUNNING    | 172.19.0.1:9810 |     1.90102e-06 |  

 97%|█████████▋| 105/108 [00:40<00:01,  2.80it/s]
 98%|█████████▊| 106/108 [00:40<00:00,  2.80it/s]
 99%|█████████▉| 107/108 [00:41<00:00,  2.80it/s]
100%|██████████| 108/108 [00:41<00:00,  2.90it/s]
[36m(_objective pid=9810)[0m 
  0%|          | 0/5 [00:00<?, ?it/s][A
[36m(_objective pid=9810)[0m 
 40%|████      | 2/5 [00:00<00:00,  7.44it/s][A
[36m(_objective pid=9810)[0m 
 60%|██████    | 3/5 [00:00<00:00,  5.31it/s][A
[36m(_objective pid=9810)[0m 
 80%|████████  | 4/5 [00:00<00:00,  4.65it/s][A


[36m(_objective pid=9810)[0m {'eval_loss': 0.6913886666297913, 'eval_accuracy': 0.5569620253164557, 'eval_runtime': 1.304, 'eval_samples_per_second': 60.585, 'eval_steps_per_second': 3.834, 'epoch': 3.0}
[36m(_objective pid=9810)[0m {'train_runtime': 42.7397, 'train_samples_per_second': 20.145, 'train_steps_per_second': 2.527, 'train_loss': 0.6902463701036241, 'epoch': 3.0}


[36m(_objective pid=9810)[0m 
                                                 
100%|██████████| 108/108 [00:42<00:00,  2.90it/s]
100%|██████████| 5/5 [00:01<00:00,  4.46it/s][A
100%|██████████| 108/108 [00:42<00:00,  2.53it/s]


== Status ==
Current time: 2024-03-07 21:35:32 (running for 00:10:21.14)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (8 PENDING, 7 TERMINATED)
+------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc             |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                 |                 |                    |                ch_size |                |             |
|------------------------+------------+-----------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00007 | PENDING    |                 |     1.72493e-05 |             

[36m(_objective pid=10009)[0m 2024-03-07 21:35:35.648792: E external/local_xla/xla/stream_executor/cuda/cuda_dnn.cc:9261] Unable to register cuDNN factory: Attempting to register factory for plugin cuDNN when one has already been registered
[36m(_objective pid=10009)[0m 2024-03-07 21:35:35.648845: E external/local_xla/xla/stream_executor/cuda/cuda_fft.cc:607] Unable to register cuFFT factory: Attempting to register factory for plugin cuFFT when one has already been registered
[36m(_objective pid=10009)[0m 2024-03-07 21:35:35.650222: E external/local_xla/xla/stream_executor/cuda/cuda_blas.cc:1515] Unable to register cuBLAS factory: Attempting to register factory for plugin cuBLAS when one has already been registered


== Status ==
Current time: 2024-03-07 21:35:37 (running for 00:10:26.21)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (7 PENDING, 1 RUNNING, 7 TERMINATED)
+------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc              |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                  |                 |                    |                ch_size |                |             |
|------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00007 | RUNNING    | 172.19.0.1:10009 |     1.72493e-0

[36m(_objective pid=10009)[0m Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']
[36m(_objective pid=10009)[0m You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.
  0%|          | 0/36 [00:00<?, ?it/s]
  3%|▎         | 1/36 [00:00<00:20,  1.72it/s]
  6%|▌         | 2/36 [00:00<00:14,  2.28it/s]
  8%|▊         | 3/36 [00:01<00:13,  2.49it/s]
 11%|█         | 4/36 [00:01<00:12,  2.60it/s]
 14%|█▍        | 5/36 [00:01<00:11,  2.68it/s]
 17%|█▋        | 6/36 [00:02<00:11,  2.72it/s]
 19%|█▉        | 7/36 [00:02<00:10,  2.75it/s]
 22%|██▏       | 8/36 [00:03<00:10,  2.76it/s]


== Status ==
Current time: 2024-03-07 21:35:42 (running for 00:10:31.25)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (7 PENDING, 1 RUNNING, 7 TERMINATED)
+------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc              |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                  |                 |                    |                ch_size |                |             |
|------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00007 | RUNNING    | 172.19.0.1:10009 |     1.72493e-0

 25%|██▌       | 9/36 [00:03<00:09,  2.79it/s]
 28%|██▊       | 10/36 [00:03<00:09,  2.79it/s]
 31%|███       | 11/36 [00:04<00:08,  2.80it/s]
 33%|███▎      | 12/36 [00:04<00:08,  2.80it/s]
 36%|███▌      | 13/36 [00:04<00:08,  2.80it/s]
 39%|███▉      | 14/36 [00:05<00:07,  2.81it/s]
 42%|████▏     | 15/36 [00:05<00:07,  2.81it/s]
 44%|████▍     | 16/36 [00:05<00:07,  2.81it/s]
 47%|████▋     | 17/36 [00:06<00:06,  2.80it/s]
 50%|█████     | 18/36 [00:06<00:06,  2.80it/s]
 53%|█████▎    | 19/36 [00:06<00:06,  2.80it/s]
 56%|█████▌    | 20/36 [00:07<00:05,  2.80it/s]
 58%|█████▊    | 21/36 [00:07<00:05,  2.81it/s]
 61%|██████    | 22/36 [00:08<00:04,  2.80it/s]


== Status ==
Current time: 2024-03-07 21:35:47 (running for 00:10:36.29)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (7 PENDING, 1 RUNNING, 7 TERMINATED)
+------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc              |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                  |                 |                    |                ch_size |                |             |
|------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00007 | RUNNING    | 172.19.0.1:10009 |     1.72493e-0

 64%|██████▍   | 23/36 [00:08<00:04,  2.81it/s]
 67%|██████▋   | 24/36 [00:08<00:04,  2.80it/s]
 69%|██████▉   | 25/36 [00:09<00:03,  2.81it/s]
 72%|███████▏  | 26/36 [00:09<00:03,  2.80it/s]
 75%|███████▌  | 27/36 [00:09<00:03,  2.80it/s]
 78%|███████▊  | 28/36 [00:10<00:02,  2.81it/s]
 81%|████████  | 29/36 [00:10<00:02,  2.81it/s]
 83%|████████▎ | 30/36 [00:10<00:02,  2.80it/s]
 86%|████████▌ | 31/36 [00:11<00:01,  2.80it/s]
 89%|████████▉ | 32/36 [00:11<00:01,  2.80it/s]
 92%|█████████▏| 33/36 [00:11<00:01,  2.80it/s]
 94%|█████████▍| 34/36 [00:12<00:00,  2.81it/s]
 97%|█████████▋| 35/36 [00:12<00:00,  2.81it/s]
100%|██████████| 36/36 [00:12<00:00,  2.90it/s]
[36m(_objective pid=10009)[0m 
  0%|          | 0/5 [00:00<?, ?it/s][A


== Status ==
Current time: 2024-03-07 21:35:52 (running for 00:10:41.34)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (7 PENDING, 1 RUNNING, 7 TERMINATED)
+------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc              |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                  |                 |                    |                ch_size |                |             |
|------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00007 | RUNNING    | 172.19.0.1:10009 |     1.72493e-0

[36m(_objective pid=10009)[0m 
 40%|████      | 2/5 [00:00<00:00,  7.59it/s][A
[36m(_objective pid=10009)[0m 
 60%|██████    | 3/5 [00:00<00:00,  5.38it/s][A
[36m(_objective pid=10009)[0m 
 80%|████████  | 4/5 [00:00<00:00,  4.68it/s][A
[36m(_objective pid=10009)[0m 
                                               A
100%|██████████| 36/36 [00:14<00:00,  2.90it/s]
100%|██████████| 5/5 [00:01<00:00,  4.50it/s][A
100%|██████████| 36/36 [00:14<00:00,  2.52it/s]A


[36m(_objective pid=10009)[0m {'eval_loss': 0.686077356338501, 'eval_accuracy': 0.5949367088607594, 'eval_runtime': 1.2951, 'eval_samples_per_second': 60.998, 'eval_steps_per_second': 3.861, 'epoch': 1.0}
[36m(_objective pid=10009)[0m {'train_runtime': 14.3112, 'train_samples_per_second': 20.054, 'train_steps_per_second': 2.516, 'train_loss': 0.695738262600369, 'epoch': 1.0}
== Status ==
Current time: 2024-03-07 21:35:57 (running for 00:10:46.36)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (7 PENDING, 8 TERMINATED)
+------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc              |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|         

[36m(_objective pid=10128)[0m 2024-03-07 21:35:58.665500: E external/local_xla/xla/stream_executor/cuda/cuda_dnn.cc:9261] Unable to register cuDNN factory: Attempting to register factory for plugin cuDNN when one has already been registered
[36m(_objective pid=10128)[0m 2024-03-07 21:35:58.665555: E external/local_xla/xla/stream_executor/cuda/cuda_fft.cc:607] Unable to register cuFFT factory: Attempting to register factory for plugin cuFFT when one has already been registered
[36m(_objective pid=10128)[0m 2024-03-07 21:35:58.666899: E external/local_xla/xla/stream_executor/cuda/cuda_blas.cc:1515] Unable to register cuBLAS factory: Attempting to register factory for plugin cuBLAS when one has already been registered
[36m(_objective pid=10128)[0m Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weig

== Status ==
Current time: 2024-03-07 21:36:02 (running for 00:10:51.46)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (6 PENDING, 1 RUNNING, 8 TERMINATED)
+------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc              |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                  |                 |                    |                ch_size |                |             |
|------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00008 | RUNNING    | 172.19.0.1:10128 |     1.64093e-0

  2%|▏         | 5/287 [00:00<00:26, 10.52it/s]
  2%|▏         | 7/287 [00:00<00:23, 11.74it/s]
  3%|▎         | 9/287 [00:00<00:22, 12.39it/s]
  4%|▍         | 11/287 [00:00<00:21, 12.90it/s]
  5%|▍         | 13/287 [00:01<00:20, 13.24it/s]
  5%|▌         | 15/287 [00:01<00:20, 13.43it/s]
  6%|▌         | 17/287 [00:01<00:19, 13.61it/s]
  7%|▋         | 19/287 [00:01<00:19, 13.75it/s]
  7%|▋         | 21/287 [00:01<00:19, 13.81it/s]
  8%|▊         | 23/287 [00:01<00:19, 13.76it/s]
  9%|▊         | 25/287 [00:01<00:18, 13.83it/s]
  9%|▉         | 27/287 [00:02<00:18, 13.87it/s]
 10%|█         | 29/287 [00:02<00:18, 13.91it/s]
 11%|█         | 31/287 [00:02<00:18, 13.94it/s]
 11%|█▏        | 33/287 [00:02<00:18, 13.92it/s]
 12%|█▏        | 35/287 [00:02<00:18, 13.92it/s]
 13%|█▎        | 37/287 [00:02<00:18, 13.87it/s]
 14%|█▎        | 39/287 [00:02<00:17, 13.91it/s]
 14%|█▍        | 41/287 [00:03<00:17, 13.93it/s]
 15%|█▍        | 43/287 [00:03<00:17, 13.95it/s]
 16%|█▌        | 45/287

== Status ==
Current time: 2024-03-07 21:36:07 (running for 00:10:56.50)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (6 PENDING, 1 RUNNING, 8 TERMINATED)
+------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc              |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                  |                 |                    |                ch_size |                |             |
|------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00008 | RUNNING    | 172.19.0.1:10128 |     1.64093e-0

 27%|██▋       | 77/287 [00:05<00:15, 13.94it/s]
 28%|██▊       | 79/287 [00:05<00:14, 13.88it/s]
 28%|██▊       | 81/287 [00:06<00:14, 13.88it/s]
 29%|██▉       | 83/287 [00:06<00:14, 13.92it/s]
 30%|██▉       | 85/287 [00:06<00:14, 13.94it/s]
 30%|███       | 87/287 [00:06<00:14, 13.96it/s]
 31%|███       | 89/287 [00:06<00:14, 13.98it/s]
 32%|███▏      | 91/287 [00:06<00:14, 13.95it/s]
 32%|███▏      | 93/287 [00:06<00:13, 13.91it/s]
 33%|███▎      | 95/287 [00:07<00:13, 13.94it/s]
 34%|███▍      | 97/287 [00:07<00:13, 13.92it/s]
 34%|███▍      | 99/287 [00:07<00:13, 13.96it/s]
 35%|███▌      | 101/287 [00:07<00:13, 13.95it/s]
 36%|███▌      | 103/287 [00:07<00:13, 13.99it/s]
 37%|███▋      | 105/287 [00:07<00:13, 13.95it/s]
 37%|███▋      | 107/287 [00:07<00:12, 13.88it/s]
 38%|███▊      | 109/287 [00:08<00:12, 13.93it/s]
 39%|███▊      | 111/287 [00:08<00:12, 13.96it/s]
 39%|███▉      | 113/287 [00:08<00:12, 13.91it/s]
 40%|████      | 115/287 [00:08<00:12, 13.92it/s]
 41%|████   

== Status ==
Current time: 2024-03-07 21:36:12 (running for 00:11:01.55)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (6 PENDING, 1 RUNNING, 8 TERMINATED)
+------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc              |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                  |                 |                    |                ch_size |                |             |
|------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00008 | RUNNING    | 172.19.0.1:10128 |     1.64093e-0

 51%|█████     | 147/287 [00:10<00:10, 13.92it/s]
 52%|█████▏    | 149/287 [00:10<00:09, 13.90it/s]
 53%|█████▎    | 151/287 [00:11<00:09, 13.94it/s]
 53%|█████▎    | 153/287 [00:11<00:09, 13.93it/s]
 54%|█████▍    | 155/287 [00:11<00:09, 13.94it/s]
 55%|█████▍    | 157/287 [00:11<00:09, 13.95it/s]
 55%|█████▌    | 159/287 [00:11<00:09, 13.95it/s]
 56%|█████▌    | 161/287 [00:11<00:09, 13.96it/s]
 57%|█████▋    | 163/287 [00:11<00:08, 13.86it/s]
 57%|█████▋    | 165/287 [00:12<00:08, 13.91it/s]
 58%|█████▊    | 167/287 [00:12<00:08, 13.93it/s]
 59%|█████▉    | 169/287 [00:12<00:08, 13.93it/s]
 60%|█████▉    | 171/287 [00:12<00:08, 13.95it/s]
 60%|██████    | 173/287 [00:12<00:08, 13.97it/s]
 61%|██████    | 175/287 [00:12<00:08, 13.97it/s]
 62%|██████▏   | 177/287 [00:12<00:07, 13.93it/s]
 62%|██████▏   | 179/287 [00:13<00:07, 13.91it/s]
 63%|██████▎   | 181/287 [00:13<00:07, 13.93it/s]
 64%|██████▍   | 183/287 [00:13<00:07, 13.93it/s]
 64%|██████▍   | 185/287 [00:13<00:07, 13.95it/s]


== Status ==
Current time: 2024-03-07 21:36:17 (running for 00:11:06.59)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (6 PENDING, 1 RUNNING, 8 TERMINATED)
+------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc              |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                  |                 |                    |                ch_size |                |             |
|------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00008 | RUNNING    | 172.19.0.1:10128 |     1.64093e-0

 76%|███████▌  | 217/287 [00:15<00:05, 13.97it/s]
 76%|███████▋  | 219/287 [00:15<00:04, 13.88it/s]
 77%|███████▋  | 221/287 [00:16<00:04, 13.90it/s]
 78%|███████▊  | 223/287 [00:16<00:04, 13.93it/s]
 78%|███████▊  | 225/287 [00:16<00:04, 13.89it/s]
 79%|███████▉  | 227/287 [00:16<00:04, 13.93it/s]
 80%|███████▉  | 229/287 [00:16<00:04, 13.94it/s]
 80%|████████  | 231/287 [00:16<00:04, 13.96it/s]
 81%|████████  | 233/287 [00:16<00:03, 13.90it/s]
 82%|████████▏ | 235/287 [00:17<00:03, 13.92it/s]
 83%|████████▎ | 237/287 [00:17<00:03, 13.94it/s]
 83%|████████▎ | 239/287 [00:17<00:03, 13.96it/s]
 84%|████████▍ | 241/287 [00:17<00:03, 13.94it/s]
 85%|████████▍ | 243/287 [00:17<00:03, 13.97it/s]
 85%|████████▌ | 245/287 [00:17<00:03, 13.98it/s]
 86%|████████▌ | 247/287 [00:17<00:02, 13.89it/s]
 87%|████████▋ | 249/287 [00:18<00:02, 13.91it/s]
 87%|████████▋ | 251/287 [00:18<00:02, 13.93it/s]
 88%|████████▊ | 253/287 [00:18<00:02, 13.95it/s]
 89%|████████▉ | 255/287 [00:18<00:02, 13.98it/s]


== Status ==
Current time: 2024-03-07 21:36:22 (running for 00:11:11.63)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (6 PENDING, 1 RUNNING, 8 TERMINATED)
+------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc              |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                  |                 |                    |                ch_size |                |             |
|------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00008 | RUNNING    | 172.19.0.1:10128 |     1.64093e-0

[36m(_objective pid=10128)[0m 
  0%|          | 0/5 [00:00<?, ?it/s][A
[36m(_objective pid=10128)[0m 
 40%|████      | 2/5 [00:00<00:00,  7.70it/s][A
[36m(_objective pid=10128)[0m 
 60%|██████    | 3/5 [00:00<00:00,  5.39it/s][A
[36m(_objective pid=10128)[0m 
 80%|████████  | 4/5 [00:00<00:00,  4.65it/s][A


[36m(_objective pid=10128)[0m {'eval_loss': 0.6764014363288879, 'eval_accuracy': 0.5949367088607594, 'eval_runtime': 1.307, 'eval_samples_per_second': 60.444, 'eval_steps_per_second': 3.826, 'epoch': 1.0}
[36m(_objective pid=10128)[0m {'train_runtime': 22.1217, 'train_samples_per_second': 12.974, 'train_steps_per_second': 12.974, 'train_loss': 0.745698829145797, 'epoch': 1.0}


[36m(_objective pid=10128)[0m 
                                                 
100%|██████████| 287/287 [00:22<00:00, 13.96it/s]
100%|██████████| 5/5 [00:01<00:00,  4.47it/s][A
100%|██████████| 287/287 [00:22<00:00, 12.97it/s]


== Status ==
Current time: 2024-03-07 21:36:27 (running for 00:11:16.73)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (6 PENDING, 9 TERMINATED)
+------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc              |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                  |                 |                    |                ch_size |                |             |
|------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00009 | PENDING    |                  |     7.90262e-05 |        

[36m(_objective pid=10255)[0m 2024-03-07 21:36:29.596149: E external/local_xla/xla/stream_executor/cuda/cuda_dnn.cc:9261] Unable to register cuDNN factory: Attempting to register factory for plugin cuDNN when one has already been registered
[36m(_objective pid=10255)[0m 2024-03-07 21:36:29.596206: E external/local_xla/xla/stream_executor/cuda/cuda_fft.cc:607] Unable to register cuFFT factory: Attempting to register factory for plugin cuFFT when one has already been registered
[36m(_objective pid=10255)[0m 2024-03-07 21:36:29.597563: E external/local_xla/xla/stream_executor/cuda/cuda_blas.cc:1515] Unable to register cuBLAS factory: Attempting to register factory for plugin cuBLAS when one has already been registered
[36m(_objective pid=10255)[0m Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weig

== Status ==
Current time: 2024-03-07 21:36:32 (running for 00:11:21.79)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (5 PENDING, 1 RUNNING, 9 TERMINATED)
+------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc              |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                  |                 |                    |                ch_size |                |             |
|------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00009 | RUNNING    | 172.19.0.1:10255 |     7.90262e-0

  0%|          | 1/216 [00:00<01:28,  2.43it/s]
  1%|          | 2/216 [00:00<00:58,  3.63it/s]
  1%|▏         | 3/216 [00:00<00:50,  4.22it/s]
  2%|▏         | 4/216 [00:00<00:46,  4.54it/s]
  2%|▏         | 5/216 [00:01<00:44,  4.76it/s]
  3%|▎         | 6/216 [00:01<00:42,  4.91it/s]
  3%|▎         | 7/216 [00:01<00:41,  5.00it/s]
  4%|▎         | 8/216 [00:01<00:41,  5.05it/s]
  4%|▍         | 9/216 [00:01<00:40,  5.08it/s]
  5%|▍         | 10/216 [00:02<00:40,  5.11it/s]
  5%|▌         | 11/216 [00:02<00:39,  5.14it/s]
  6%|▌         | 12/216 [00:02<00:39,  5.16it/s]
  6%|▌         | 13/216 [00:02<00:39,  5.18it/s]
  6%|▋         | 14/216 [00:02<00:39,  5.17it/s]
  7%|▋         | 15/216 [00:03<00:38,  5.16it/s]
  7%|▋         | 16/216 [00:03<00:38,  5.16it/s]
  8%|▊         | 17/216 [00:03<00:38,  5.17it/s]
  8%|▊         | 18/216 [00:03<00:38,  5.18it/s]
  9%|▉         | 19/216 [00:03<00:37,  5.19it/s]
  9%|▉         | 20/216 [00:04<00:37,  5.16it/s]
 10%|▉         | 21/216 [00:0

== Status ==
Current time: 2024-03-07 21:36:37 (running for 00:11:26.84)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (5 PENDING, 1 RUNNING, 9 TERMINATED)
+------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc              |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                  |                 |                    |                ch_size |                |             |
|------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00009 | RUNNING    | 172.19.0.1:10255 |     7.90262e-0

 12%|█▏        | 25/216 [00:05<00:36,  5.17it/s]
 12%|█▏        | 26/216 [00:05<00:36,  5.19it/s]
 12%|█▎        | 27/216 [00:05<00:36,  5.19it/s]
 13%|█▎        | 28/216 [00:05<00:36,  5.19it/s]
 13%|█▎        | 29/216 [00:05<00:36,  5.18it/s]
 14%|█▍        | 30/216 [00:05<00:36,  5.17it/s]
 14%|█▍        | 31/216 [00:06<00:35,  5.16it/s]
 15%|█▍        | 32/216 [00:06<00:35,  5.16it/s]
 15%|█▌        | 33/216 [00:06<00:35,  5.18it/s]
 16%|█▌        | 34/216 [00:06<00:35,  5.19it/s]
 16%|█▌        | 35/216 [00:06<00:34,  5.18it/s]
 17%|█▋        | 36/216 [00:07<00:34,  5.19it/s]
 17%|█▋        | 37/216 [00:07<00:34,  5.18it/s]
 18%|█▊        | 38/216 [00:07<00:34,  5.19it/s]
 18%|█▊        | 39/216 [00:07<00:34,  5.20it/s]
 19%|█▊        | 40/216 [00:07<00:33,  5.18it/s]
 19%|█▉        | 41/216 [00:08<00:33,  5.19it/s]
 19%|█▉        | 42/216 [00:08<00:33,  5.19it/s]
 20%|█▉        | 43/216 [00:08<00:33,  5.18it/s]
 20%|██        | 44/216 [00:08<00:33,  5.18it/s]
 21%|██        | 45/

== Status ==
Current time: 2024-03-07 21:36:42 (running for 00:11:31.89)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (5 PENDING, 1 RUNNING, 9 TERMINATED)
+------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc              |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                  |                 |                    |                ch_size |                |             |
|------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00009 | RUNNING    | 172.19.0.1:10255 |     7.90262e-0

 24%|██▍       | 52/216 [00:10<00:31,  5.19it/s]
 25%|██▍       | 53/216 [00:10<00:31,  5.20it/s]
 25%|██▌       | 54/216 [00:10<00:31,  5.20it/s]
 25%|██▌       | 55/216 [00:10<00:30,  5.20it/s]
 26%|██▌       | 56/216 [00:11<00:30,  5.16it/s]
 26%|██▋       | 57/216 [00:11<00:30,  5.18it/s]
 27%|██▋       | 58/216 [00:11<00:30,  5.17it/s]
 27%|██▋       | 59/216 [00:11<00:30,  5.17it/s]
 28%|██▊       | 60/216 [00:11<00:30,  5.19it/s]
 28%|██▊       | 61/216 [00:11<00:29,  5.17it/s]
 29%|██▊       | 62/216 [00:12<00:29,  5.18it/s]
 29%|██▉       | 63/216 [00:12<00:29,  5.19it/s]
 30%|██▉       | 64/216 [00:12<00:29,  5.19it/s]
 30%|███       | 65/216 [00:12<00:29,  5.20it/s]
 31%|███       | 66/216 [00:12<00:29,  5.16it/s]
 31%|███       | 67/216 [00:13<00:28,  5.16it/s]
 31%|███▏      | 68/216 [00:13<00:28,  5.18it/s]
 32%|███▏      | 69/216 [00:13<00:28,  5.19it/s]
 32%|███▏      | 70/216 [00:13<00:28,  5.19it/s]
 33%|███▎      | 71/216 [00:13<00:27,  5.19it/s]
 33%|███▎      | 72/

== Status ==
Current time: 2024-03-07 21:36:47 (running for 00:11:36.93)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (5 PENDING, 1 RUNNING, 9 TERMINATED)
+------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc              |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                  |                 |                    |                ch_size |                |             |
|------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00009 | RUNNING    | 172.19.0.1:10255 |     7.90262e-0

[36m(_objective pid=10255)[0m 
 80%|████████  | 4/5 [00:00<00:00,  4.65it/s][A


[36m(_objective pid=10255)[0m {'eval_loss': 0.6811774969100952, 'eval_accuracy': 0.5822784810126582, 'eval_runtime': 1.2997, 'eval_samples_per_second': 60.782, 'eval_steps_per_second': 3.847, 'epoch': 1.0}


[36m(_objective pid=10255)[0m 
                                                
 33%|███▎      | 72/216 [00:15<00:26,  5.48it/s]
100%|██████████| 5/5 [00:01<00:00,  4.47it/s][A
                                             [A
 34%|███▍      | 73/216 [00:15<01:22,  1.73it/s]
 34%|███▍      | 74/216 [00:15<01:05,  2.16it/s]
 35%|███▍      | 75/216 [00:15<00:53,  2.61it/s]
 35%|███▌      | 76/216 [00:16<00:45,  3.07it/s]
 36%|███▌      | 77/216 [00:16<00:39,  3.50it/s]
 36%|███▌      | 78/216 [00:16<00:35,  3.86it/s]
 37%|███▋      | 79/216 [00:16<00:32,  4.16it/s]
 37%|███▋      | 80/216 [00:16<00:30,  4.39it/s]
 38%|███▊      | 81/216 [00:17<00:29,  4.61it/s]
 38%|███▊      | 82/216 [00:17<00:28,  4.78it/s]
 38%|███▊      | 83/216 [00:17<00:27,  4.90it/s]
 39%|███▉      | 84/216 [00:17<00:26,  4.96it/s]
 39%|███▉      | 85/216 [00:17<00:26,  5.03it/s]
 40%|███▉      | 86/216 [00:18<00:25,  5.06it/s]
 40%|████      | 87/216 [00:18<00:25,  5.09it/s]
 41%|████      | 88/216 [00:18<00:24

== Status ==
Current time: 2024-03-07 21:36:52 (running for 00:11:41.99)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (5 PENDING, 1 RUNNING, 9 TERMINATED)
+------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc              |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                  |                 |                    |                ch_size |                |             |
|------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00009 | RUNNING    | 172.19.0.1:10255 |     7.90262e-0

 45%|████▍     | 97/216 [00:20<00:22,  5.18it/s]
 45%|████▌     | 98/216 [00:20<00:22,  5.18it/s]
 46%|████▌     | 99/216 [00:20<00:22,  5.18it/s]
 46%|████▋     | 100/216 [00:20<00:22,  5.19it/s]
 47%|████▋     | 101/216 [00:20<00:22,  5.17it/s]
 47%|████▋     | 102/216 [00:21<00:22,  5.17it/s]
 48%|████▊     | 103/216 [00:21<00:21,  5.19it/s]
 48%|████▊     | 104/216 [00:21<00:21,  5.19it/s]
 49%|████▊     | 105/216 [00:21<00:21,  5.20it/s]
 49%|████▉     | 106/216 [00:21<00:21,  5.19it/s]
 50%|████▉     | 107/216 [00:22<00:21,  5.14it/s]
 50%|█████     | 108/216 [00:22<00:20,  5.15it/s]
 50%|█████     | 109/216 [00:22<00:20,  5.17it/s]
 51%|█████     | 110/216 [00:22<00:20,  5.19it/s]
 51%|█████▏    | 111/216 [00:22<00:20,  5.17it/s]
 52%|█████▏    | 112/216 [00:23<00:20,  5.17it/s]
 52%|█████▏    | 113/216 [00:23<00:19,  5.15it/s]
 53%|█████▎    | 114/216 [00:23<00:19,  5.11it/s]
 53%|█████▎    | 115/216 [00:23<00:19,  5.13it/s]
 54%|█████▎    | 116/216 [00:23<00:19,  5.15it/s]
 54

== Status ==
Current time: 2024-03-07 21:36:57 (running for 00:11:47.03)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (5 PENDING, 1 RUNNING, 9 TERMINATED)
+------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc              |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                  |                 |                    |                ch_size |                |             |
|------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00009 | RUNNING    | 172.19.0.1:10255 |     7.90262e-0

 57%|█████▋    | 123/216 [00:25<00:17,  5.19it/s]
 57%|█████▋    | 124/216 [00:25<00:17,  5.20it/s]
 58%|█████▊    | 125/216 [00:25<00:17,  5.21it/s]
 58%|█████▊    | 126/216 [00:25<00:17,  5.20it/s]
 59%|█████▉    | 127/216 [00:26<00:17,  5.15it/s]
 59%|█████▉    | 128/216 [00:26<00:17,  5.16it/s]
 60%|█████▉    | 129/216 [00:26<00:16,  5.17it/s]
 60%|██████    | 130/216 [00:26<00:16,  5.18it/s]
 61%|██████    | 131/216 [00:26<00:16,  5.19it/s]
 61%|██████    | 132/216 [00:26<00:16,  5.15it/s]
 62%|██████▏   | 133/216 [00:27<00:16,  5.17it/s]
 62%|██████▏   | 134/216 [00:27<00:15,  5.18it/s]
 62%|██████▎   | 135/216 [00:27<00:15,  5.19it/s]
 63%|██████▎   | 136/216 [00:27<00:15,  5.20it/s]
 63%|██████▎   | 137/216 [00:27<00:15,  5.18it/s]
 64%|██████▍   | 138/216 [00:28<00:15,  5.18it/s]
 64%|██████▍   | 139/216 [00:28<00:14,  5.19it/s]
 65%|██████▍   | 140/216 [00:28<00:14,  5.20it/s]
 65%|██████▌   | 141/216 [00:28<00:14,  5.19it/s]
 66%|██████▌   | 142/216 [00:28<00:14,  5.18it/s]


== Status ==
Current time: 2024-03-07 21:37:02 (running for 00:11:52.07)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (5 PENDING, 1 RUNNING, 9 TERMINATED)
+------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc              |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                  |                 |                    |                ch_size |                |             |
|------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00009 | RUNNING    | 172.19.0.1:10255 |     7.90262e-0

[36m(_objective pid=10255)[0m 
 80%|████████  | 4/5 [00:00<00:00,  4.70it/s][A


[36m(_objective pid=10255)[0m {'eval_loss': 0.6821705102920532, 'eval_accuracy': 0.5822784810126582, 'eval_runtime': 1.2932, 'eval_samples_per_second': 61.089, 'eval_steps_per_second': 3.866, 'epoch': 2.0}


[36m(_objective pid=10255)[0m 
                                                 
 67%|██████▋   | 144/216 [00:30<00:13,  5.48it/s]
100%|██████████| 5/5 [00:01<00:00,  4.49it/s][A
                                             [A
 67%|██████▋   | 145/216 [00:30<00:40,  1.73it/s]
 68%|██████▊   | 146/216 [00:30<00:32,  2.16it/s]
 68%|██████▊   | 147/216 [00:31<00:26,  2.62it/s]
 69%|██████▊   | 148/216 [00:31<00:22,  3.08it/s]
 69%|██████▉   | 149/216 [00:31<00:19,  3.51it/s]
 69%|██████▉   | 150/216 [00:31<00:16,  3.89it/s]
 70%|██████▉   | 151/216 [00:31<00:15,  4.20it/s]
 70%|███████   | 152/216 [00:32<00:14,  4.44it/s]
 71%|███████   | 153/216 [00:32<00:13,  4.64it/s]
 71%|███████▏  | 154/216 [00:32<00:12,  4.79it/s]
 72%|███████▏  | 155/216 [00:32<00:12,  4.90it/s]
 72%|███████▏  | 156/216 [00:32<00:12,  4.98it/s]
 73%|███████▎  | 157/216 [00:33<00:11,  5.03it/s]
 73%|███████▎  | 158/216 [00:33<00:11,  5.09it/s]
 74%|███████▎  | 159/216 [00:33<00:11,  5.13it/s]
 74%|███████▍  | 16

== Status ==
Current time: 2024-03-07 21:37:08 (running for 00:11:57.17)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (5 PENDING, 1 RUNNING, 9 TERMINATED)
+------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc              |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                  |                 |                    |                ch_size |                |             |
|------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00009 | RUNNING    | 172.19.0.1:10255 |     7.90262e-0

 79%|███████▊  | 170/216 [00:35<00:08,  5.17it/s]
 79%|███████▉  | 171/216 [00:35<00:08,  5.17it/s]
 80%|███████▉  | 172/216 [00:35<00:08,  5.17it/s]
 80%|████████  | 173/216 [00:36<00:08,  5.17it/s]
 81%|████████  | 174/216 [00:36<00:08,  5.18it/s]
 81%|████████  | 175/216 [00:36<00:07,  5.19it/s]
 81%|████████▏ | 176/216 [00:36<00:07,  5.20it/s]
 82%|████████▏ | 177/216 [00:36<00:07,  5.18it/s]
 82%|████████▏ | 178/216 [00:37<00:07,  5.19it/s]
 83%|████████▎ | 179/216 [00:37<00:07,  5.18it/s]
 83%|████████▎ | 180/216 [00:37<00:06,  5.18it/s]
 84%|████████▍ | 181/216 [00:37<00:06,  5.18it/s]
 84%|████████▍ | 182/216 [00:37<00:06,  5.17it/s]
 85%|████████▍ | 183/216 [00:38<00:06,  5.16it/s]
 85%|████████▌ | 184/216 [00:38<00:06,  5.17it/s]
 86%|████████▌ | 185/216 [00:38<00:06,  5.17it/s]
 86%|████████▌ | 186/216 [00:38<00:05,  5.18it/s]
 87%|████████▋ | 187/216 [00:38<00:05,  5.20it/s]
 87%|████████▋ | 188/216 [00:39<00:05,  5.18it/s]
 88%|████████▊ | 189/216 [00:39<00:05,  5.19it/s]


== Status ==
Current time: 2024-03-07 21:37:13 (running for 00:12:02.21)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (5 PENDING, 1 RUNNING, 9 TERMINATED)
+------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc              |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                  |                 |                    |                ch_size |                |             |
|------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00009 | RUNNING    | 172.19.0.1:10255 |     7.90262e-0

 90%|█████████ | 195/216 [00:40<00:04,  5.17it/s]
 91%|█████████ | 196/216 [00:40<00:03,  5.17it/s]
 91%|█████████ | 197/216 [00:40<00:03,  5.16it/s]
 92%|█████████▏| 198/216 [00:40<00:03,  5.14it/s]
 92%|█████████▏| 199/216 [00:41<00:03,  5.16it/s]
 93%|█████████▎| 200/216 [00:41<00:03,  5.17it/s]
 93%|█████████▎| 201/216 [00:41<00:02,  5.18it/s]
 94%|█████████▎| 202/216 [00:41<00:02,  5.19it/s]
 94%|█████████▍| 203/216 [00:41<00:02,  5.17it/s]
 94%|█████████▍| 204/216 [00:42<00:02,  5.18it/s]
 95%|█████████▍| 205/216 [00:42<00:02,  5.19it/s]
 95%|█████████▌| 206/216 [00:42<00:01,  5.20it/s]
 96%|█████████▌| 207/216 [00:42<00:01,  5.20it/s]
 96%|█████████▋| 208/216 [00:42<00:01,  5.17it/s]
 97%|█████████▋| 209/216 [00:43<00:01,  5.16it/s]
 97%|█████████▋| 210/216 [00:43<00:01,  5.16it/s]
 98%|█████████▊| 211/216 [00:43<00:00,  5.17it/s]
 98%|█████████▊| 212/216 [00:43<00:00,  5.17it/s]
 99%|█████████▊| 213/216 [00:43<00:00,  5.18it/s]
 99%|█████████▉| 214/216 [00:44<00:00,  5.17it/s]


== Status ==
Current time: 2024-03-07 21:37:18 (running for 00:12:07.24)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (5 PENDING, 1 RUNNING, 9 TERMINATED)
+------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc              |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                  |                 |                    |                ch_size |                |             |
|------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00009 | RUNNING    | 172.19.0.1:10255 |     7.90262e-0

[36m(_objective pid=10255)[0m 
 80%|████████  | 4/5 [00:00<00:00,  4.64it/s][A


[36m(_objective pid=10255)[0m {'eval_loss': 0.6885003447532654, 'eval_accuracy': 0.5822784810126582, 'eval_runtime': 1.2959, 'eval_samples_per_second': 60.962, 'eval_steps_per_second': 3.858, 'epoch': 3.0}
[36m(_objective pid=10255)[0m {'train_runtime': 45.7369, 'train_samples_per_second': 18.825, 'train_steps_per_second': 4.723, 'train_loss': 0.7042249750207972, 'epoch': 3.0}


[36m(_objective pid=10255)[0m 
                                                 
100%|██████████| 216/216 [00:45<00:00,  5.51it/s]
100%|██████████| 5/5 [00:01<00:00,  4.48it/s][A
                                             [A
100%|██████████| 216/216 [00:45<00:00,  4.72it/s]


== Status ==
Current time: 2024-03-07 21:37:23 (running for 00:12:12.26)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (5 PENDING, 10 TERMINATED)
+------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc              |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                  |                 |                    |                ch_size |                |             |
|------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00010 | PENDING    |                  |     1.0763e-06  |       

[36m(_objective pid=10434)[0m 2024-03-07 21:37:24.651219: E external/local_xla/xla/stream_executor/cuda/cuda_dnn.cc:9261] Unable to register cuDNN factory: Attempting to register factory for plugin cuDNN when one has already been registered
[36m(_objective pid=10434)[0m 2024-03-07 21:37:24.651279: E external/local_xla/xla/stream_executor/cuda/cuda_fft.cc:607] Unable to register cuFFT factory: Attempting to register factory for plugin cuFFT when one has already been registered
[36m(_objective pid=10434)[0m 2024-03-07 21:37:24.652619: E external/local_xla/xla/stream_executor/cuda/cuda_blas.cc:1515] Unable to register cuBLAS factory: Attempting to register factory for plugin cuBLAS when one has already been registered
[36m(_objective pid=10434)[0m Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weig

== Status ==
Current time: 2024-03-07 21:37:28 (running for 00:12:17.34)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (4 PENDING, 1 RUNNING, 10 TERMINATED)
+------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc              |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                  |                 |                    |                ch_size |                |             |
|------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00010 | RUNNING    | 172.19.0.1:10434 |     1.0763e-0

  0%|          | 1/360 [00:00<02:28,  2.42it/s]
  1%|          | 2/360 [00:00<01:38,  3.62it/s]
  1%|          | 3/360 [00:00<01:25,  4.20it/s]
  1%|          | 4/360 [00:00<01:18,  4.54it/s]
  1%|▏         | 5/360 [00:01<01:14,  4.76it/s]
  2%|▏         | 6/360 [00:01<01:12,  4.91it/s]
  2%|▏         | 7/360 [00:01<01:10,  5.01it/s]
  2%|▏         | 8/360 [00:01<01:09,  5.04it/s]
  2%|▎         | 9/360 [00:01<01:09,  5.02it/s]
  3%|▎         | 10/360 [00:02<01:08,  5.07it/s]
  3%|▎         | 11/360 [00:02<01:08,  5.12it/s]
  3%|▎         | 12/360 [00:02<01:07,  5.14it/s]
  4%|▎         | 13/360 [00:02<01:07,  5.16it/s]
  4%|▍         | 14/360 [00:02<01:07,  5.16it/s]
  4%|▍         | 15/360 [00:03<01:06,  5.17it/s]
  4%|▍         | 16/360 [00:03<01:06,  5.18it/s]
  5%|▍         | 17/360 [00:03<01:06,  5.18it/s]
  5%|▌         | 18/360 [00:03<01:06,  5.18it/s]
  5%|▌         | 19/360 [00:03<01:06,  5.16it/s]
  6%|▌         | 20/360 [00:04<01:05,  5.16it/s]
  6%|▌         | 21/360 [00:0

== Status ==
Current time: 2024-03-07 21:37:33 (running for 00:12:22.39)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (4 PENDING, 1 RUNNING, 10 TERMINATED)
+------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc              |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                  |                 |                    |                ch_size |                |             |
|------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00010 | RUNNING    | 172.19.0.1:10434 |     1.0763e-0

  8%|▊         | 28/360 [00:05<01:03,  5.19it/s]
  8%|▊         | 29/360 [00:05<01:03,  5.18it/s]
  8%|▊         | 30/360 [00:06<01:03,  5.18it/s]
  9%|▊         | 31/360 [00:06<01:03,  5.17it/s]
  9%|▉         | 32/360 [00:06<01:03,  5.15it/s]
  9%|▉         | 33/360 [00:06<01:03,  5.16it/s]
  9%|▉         | 34/360 [00:06<01:03,  5.16it/s]
 10%|▉         | 35/360 [00:06<01:03,  5.15it/s]
 10%|█         | 36/360 [00:07<01:02,  5.17it/s]
 10%|█         | 37/360 [00:07<01:02,  5.18it/s]
 11%|█         | 38/360 [00:07<01:02,  5.19it/s]
 11%|█         | 39/360 [00:07<01:01,  5.19it/s]
 11%|█         | 40/360 [00:07<01:01,  5.18it/s]
 11%|█▏        | 41/360 [00:08<01:01,  5.19it/s]
 12%|█▏        | 42/360 [00:08<01:01,  5.19it/s]
 12%|█▏        | 43/360 [00:08<01:01,  5.19it/s]
 12%|█▏        | 44/360 [00:08<01:00,  5.19it/s]
 12%|█▎        | 45/360 [00:08<01:00,  5.17it/s]
 13%|█▎        | 46/360 [00:09<01:00,  5.17it/s]
 13%|█▎        | 47/360 [00:09<01:00,  5.17it/s]
 13%|█▎        | 48/

== Status ==
Current time: 2024-03-07 21:37:38 (running for 00:12:27.43)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (4 PENDING, 1 RUNNING, 10 TERMINATED)
+------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc              |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                  |                 |                    |                ch_size |                |             |
|------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00010 | RUNNING    | 172.19.0.1:10434 |     1.0763e-0

 15%|█▌        | 54/360 [00:10<00:58,  5.19it/s]
 15%|█▌        | 55/360 [00:10<00:58,  5.17it/s]
 16%|█▌        | 56/360 [00:11<00:58,  5.19it/s]
 16%|█▌        | 57/360 [00:11<00:58,  5.20it/s]
 16%|█▌        | 58/360 [00:11<00:58,  5.20it/s]
 16%|█▋        | 59/360 [00:11<00:57,  5.20it/s]
 17%|█▋        | 60/360 [00:11<00:58,  5.17it/s]
 17%|█▋        | 61/360 [00:11<00:57,  5.16it/s]
 17%|█▋        | 62/360 [00:12<00:57,  5.16it/s]
 18%|█▊        | 63/360 [00:12<00:57,  5.17it/s]
 18%|█▊        | 64/360 [00:12<00:57,  5.17it/s]
 18%|█▊        | 65/360 [00:12<00:56,  5.18it/s]
 18%|█▊        | 66/360 [00:12<00:56,  5.17it/s]
 19%|█▊        | 67/360 [00:13<00:56,  5.17it/s]
 19%|█▉        | 68/360 [00:13<00:56,  5.18it/s]
 19%|█▉        | 69/360 [00:13<00:56,  5.19it/s]
 19%|█▉        | 70/360 [00:13<00:55,  5.20it/s]
 20%|█▉        | 71/360 [00:13<00:55,  5.18it/s]
 20%|██        | 72/360 [00:14<00:52,  5.51it/s]
[36m(_objective pid=10434)[0m 
  0%|          | 0/5 [00:00<?, ?it/s

[36m(_objective pid=10434)[0m {'eval_loss': 0.6905133724212646, 'eval_accuracy': 0.5949367088607594, 'eval_runtime': 1.2978, 'eval_samples_per_second': 60.87, 'eval_steps_per_second': 3.853, 'epoch': 1.0}


[36m(_objective pid=10434)[0m 
                                                
 20%|██        | 72/360 [00:15<00:52,  5.51it/s]
100%|██████████| 5/5 [00:01<00:00,  4.48it/s][A
                                             [A
 20%|██        | 73/360 [00:15<02:45,  1.73it/s]


== Status ==
Current time: 2024-03-07 21:37:43 (running for 00:12:32.49)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (4 PENDING, 1 RUNNING, 10 TERMINATED)
+------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc              |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                  |                 |                    |                ch_size |                |             |
|------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00010 | RUNNING    | 172.19.0.1:10434 |     1.0763e-0

 21%|██        | 74/360 [00:15<02:12,  2.16it/s]
 21%|██        | 75/360 [00:15<01:48,  2.61it/s]
 21%|██        | 76/360 [00:16<01:32,  3.08it/s]
 21%|██▏       | 77/360 [00:16<01:20,  3.51it/s]
 22%|██▏       | 78/360 [00:16<01:12,  3.87it/s]
 22%|██▏       | 79/360 [00:16<01:07,  4.16it/s]
 22%|██▏       | 80/360 [00:16<01:03,  4.40it/s]
 22%|██▎       | 81/360 [00:17<01:00,  4.62it/s]
 23%|██▎       | 82/360 [00:17<00:58,  4.78it/s]
 23%|██▎       | 83/360 [00:17<00:56,  4.90it/s]
 23%|██▎       | 84/360 [00:17<00:55,  4.98it/s]
 24%|██▎       | 85/360 [00:17<00:55,  5.00it/s]
 24%|██▍       | 86/360 [00:18<00:54,  5.05it/s]
 24%|██▍       | 87/360 [00:18<00:53,  5.08it/s]
 24%|██▍       | 88/360 [00:18<00:53,  5.10it/s]
 25%|██▍       | 89/360 [00:18<00:52,  5.12it/s]
 25%|██▌       | 90/360 [00:18<00:52,  5.11it/s]
 25%|██▌       | 91/360 [00:19<00:52,  5.14it/s]
 26%|██▌       | 92/360 [00:19<00:51,  5.16it/s]
 26%|██▌       | 93/360 [00:19<00:51,  5.17it/s]
 26%|██▌       | 94/

== Status ==
Current time: 2024-03-07 21:37:48 (running for 00:12:37.53)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (4 PENDING, 1 RUNNING, 10 TERMINATED)
+------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc              |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                  |                 |                    |                ch_size |                |             |
|------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00010 | RUNNING    | 172.19.0.1:10434 |     1.0763e-0

 28%|██▊       | 99/360 [00:20<00:50,  5.20it/s]
 28%|██▊       | 100/360 [00:20<00:50,  5.18it/s]
 28%|██▊       | 101/360 [00:21<00:50,  5.17it/s]
 28%|██▊       | 102/360 [00:21<00:49,  5.17it/s]
 29%|██▊       | 103/360 [00:21<00:49,  5.18it/s]
 29%|██▉       | 104/360 [00:21<00:49,  5.18it/s]
 29%|██▉       | 105/360 [00:21<00:49,  5.18it/s]
 29%|██▉       | 106/360 [00:21<00:49,  5.17it/s]
 30%|██▉       | 107/360 [00:22<00:48,  5.19it/s]
 30%|███       | 108/360 [00:22<00:48,  5.18it/s]
 30%|███       | 109/360 [00:22<00:48,  5.19it/s]
 31%|███       | 110/360 [00:22<00:48,  5.20it/s]
 31%|███       | 111/360 [00:22<00:48,  5.18it/s]
 31%|███       | 112/360 [00:23<00:47,  5.19it/s]
 31%|███▏      | 113/360 [00:23<00:47,  5.20it/s]
 32%|███▏      | 114/360 [00:23<00:47,  5.19it/s]
 32%|███▏      | 115/360 [00:23<00:47,  5.18it/s]
 32%|███▏      | 116/360 [00:23<00:47,  5.16it/s]
 32%|███▎      | 117/360 [00:24<00:47,  5.16it/s]
 33%|███▎      | 118/360 [00:24<00:46,  5.16it/s]
 

== Status ==
Current time: 2024-03-07 21:37:53 (running for 00:12:42.58)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (4 PENDING, 1 RUNNING, 10 TERMINATED)
+------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc              |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                  |                 |                    |                ch_size |                |             |
|------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00010 | RUNNING    | 172.19.0.1:10434 |     1.0763e-0

 35%|███▌      | 126/360 [00:25<00:45,  5.17it/s]
 35%|███▌      | 127/360 [00:26<00:44,  5.18it/s]
 36%|███▌      | 128/360 [00:26<00:44,  5.18it/s]
 36%|███▌      | 129/360 [00:26<00:44,  5.18it/s]
 36%|███▌      | 130/360 [00:26<00:44,  5.17it/s]
 36%|███▋      | 131/360 [00:26<00:44,  5.14it/s]
 37%|███▋      | 132/360 [00:26<00:44,  5.09it/s]
 37%|███▋      | 133/360 [00:27<00:44,  5.12it/s]
 37%|███▋      | 134/360 [00:27<00:44,  5.13it/s]
 38%|███▊      | 135/360 [00:27<00:43,  5.15it/s]
 38%|███▊      | 136/360 [00:27<00:43,  5.16it/s]
 38%|███▊      | 137/360 [00:27<00:43,  5.14it/s]
 38%|███▊      | 138/360 [00:28<00:43,  5.16it/s]
 39%|███▊      | 139/360 [00:28<00:42,  5.18it/s]
 39%|███▉      | 140/360 [00:28<00:42,  5.19it/s]
 39%|███▉      | 141/360 [00:28<00:42,  5.19it/s]
 39%|███▉      | 142/360 [00:28<00:42,  5.18it/s]
 40%|███▉      | 143/360 [00:29<00:41,  5.20it/s]
 40%|████      | 144/360 [00:29<00:39,  5.52it/s]
[36m(_objective pid=10434)[0m 
  0%|          | 

[36m(_objective pid=10434)[0m {'eval_loss': 0.6924998164176941, 'eval_accuracy': 0.5189873417721519, 'eval_runtime': 1.3022, 'eval_samples_per_second': 60.667, 'eval_steps_per_second': 3.84, 'epoch': 2.0}
== Status ==
Current time: 2024-03-07 21:37:58 (running for 00:12:47.59)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (4 PENDING, 1 RUNNING, 10 TERMINATED)
+------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc              |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                  |                 |                    |                ch_size |                |             |
|------------------

[36m(_objective pid=10434)[0m 
                                                 
 40%|████      | 144/360 [00:30<00:39,  5.52it/s]
100%|██████████| 5/5 [00:01<00:00,  4.47it/s][A
                                             [A
 40%|████      | 145/360 [00:30<02:04,  1.73it/s]
 41%|████      | 146/360 [00:30<01:39,  2.16it/s]
 41%|████      | 147/360 [00:31<01:21,  2.62it/s]
 41%|████      | 148/360 [00:31<01:08,  3.08it/s]
 41%|████▏     | 149/360 [00:31<01:00,  3.50it/s]
 42%|████▏     | 150/360 [00:31<00:54,  3.88it/s]
 42%|████▏     | 151/360 [00:31<00:49,  4.19it/s]
 42%|████▏     | 152/360 [00:32<00:46,  4.45it/s]
 42%|████▎     | 153/360 [00:32<00:44,  4.65it/s]
 43%|████▎     | 154/360 [00:32<00:42,  4.81it/s]
 43%|████▎     | 155/360 [00:32<00:41,  4.91it/s]
 43%|████▎     | 156/360 [00:32<00:41,  4.97it/s]
 44%|████▎     | 157/360 [00:33<00:40,  5.02it/s]
 44%|████▍     | 158/360 [00:33<00:39,  5.06it/s]
 44%|████▍     | 159/360 [00:33<00:39,  5.10it/s]
 44%|████▍     | 16

== Status ==
Current time: 2024-03-07 21:38:03 (running for 00:12:52.63)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (4 PENDING, 1 RUNNING, 10 TERMINATED)
+------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc              |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                  |                 |                    |                ch_size |                |             |
|------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00010 | RUNNING    | 172.19.0.1:10434 |     1.0763e-0

 48%|████▊     | 171/360 [00:35<00:36,  5.15it/s]
 48%|████▊     | 172/360 [00:35<00:36,  5.17it/s]
 48%|████▊     | 173/360 [00:36<00:36,  5.17it/s]
 48%|████▊     | 174/360 [00:36<00:35,  5.17it/s]
 49%|████▊     | 175/360 [00:36<00:35,  5.18it/s]
 49%|████▉     | 176/360 [00:36<00:35,  5.18it/s]
 49%|████▉     | 177/360 [00:36<00:35,  5.18it/s]
 49%|████▉     | 178/360 [00:37<00:35,  5.18it/s]
 50%|████▉     | 179/360 [00:37<00:34,  5.19it/s]
 50%|█████     | 180/360 [00:37<00:34,  5.20it/s]
 50%|█████     | 181/360 [00:37<00:34,  5.21it/s]
 51%|█████     | 182/360 [00:37<00:34,  5.18it/s]
 51%|█████     | 183/360 [00:38<00:34,  5.19it/s]
 51%|█████     | 184/360 [00:38<00:33,  5.18it/s]
 51%|█████▏    | 185/360 [00:38<00:33,  5.17it/s]
 52%|█████▏    | 186/360 [00:38<00:33,  5.18it/s]
 52%|█████▏    | 187/360 [00:38<00:33,  5.17it/s]
 52%|█████▏    | 188/360 [00:39<00:33,  5.17it/s]
 52%|█████▎    | 189/360 [00:39<00:33,  5.18it/s]
 53%|█████▎    | 190/360 [00:39<00:32,  5.18it/s]


== Status ==
Current time: 2024-03-07 21:38:08 (running for 00:12:57.68)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (4 PENDING, 1 RUNNING, 10 TERMINATED)
+------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc              |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                  |                 |                    |                ch_size |                |             |
|------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00010 | RUNNING    | 172.19.0.1:10434 |     1.0763e-0

 55%|█████▍    | 197/360 [00:40<00:31,  5.18it/s]
 55%|█████▌    | 198/360 [00:41<00:31,  5.18it/s]
 55%|█████▌    | 199/360 [00:41<00:31,  5.18it/s]
 56%|█████▌    | 200/360 [00:41<00:30,  5.18it/s]
 56%|█████▌    | 201/360 [00:41<00:30,  5.19it/s]
 56%|█████▌    | 202/360 [00:41<00:30,  5.17it/s]
 56%|█████▋    | 203/360 [00:41<00:30,  5.15it/s]
 57%|█████▋    | 204/360 [00:42<00:30,  5.17it/s]
 57%|█████▋    | 205/360 [00:42<00:29,  5.18it/s]
 57%|█████▋    | 206/360 [00:42<00:29,  5.18it/s]
 57%|█████▊    | 207/360 [00:42<00:29,  5.19it/s]
 58%|█████▊    | 208/360 [00:42<00:29,  5.17it/s]
 58%|█████▊    | 209/360 [00:43<00:29,  5.19it/s]
 58%|█████▊    | 210/360 [00:43<00:28,  5.19it/s]
 59%|█████▊    | 211/360 [00:43<00:28,  5.20it/s]
 59%|█████▉    | 212/360 [00:43<00:28,  5.18it/s]
 59%|█████▉    | 213/360 [00:43<00:28,  5.17it/s]
 59%|█████▉    | 214/360 [00:44<00:28,  5.16it/s]
 60%|█████▉    | 215/360 [00:44<00:28,  5.17it/s]
 60%|██████    | 216/360 [00:44<00:26,  5.49it/s]


[36m(_objective pid=10434)[0m {'eval_loss': 0.6895282864570618, 'eval_accuracy': 0.569620253164557, 'eval_runtime': 1.2969, 'eval_samples_per_second': 60.913, 'eval_steps_per_second': 3.855, 'epoch': 3.0}
== Status ==
Current time: 2024-03-07 21:38:13 (running for 00:13:02.76)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (4 PENDING, 1 RUNNING, 10 TERMINATED)
+------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc              |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                  |                 |                    |                ch_size |                |             |
|------------------

[36m(_objective pid=10434)[0m 
                                                 
 60%|██████    | 216/360 [00:45<00:26,  5.49it/s]
100%|██████████| 5/5 [00:01<00:00,  4.48it/s][A
                                             [A
 60%|██████    | 217/360 [00:45<01:22,  1.73it/s]
 61%|██████    | 218/360 [00:46<01:05,  2.16it/s]
 61%|██████    | 219/360 [00:46<00:53,  2.62it/s]
 61%|██████    | 220/360 [00:46<00:45,  3.07it/s]
 61%|██████▏   | 221/360 [00:46<00:39,  3.51it/s]
 62%|██████▏   | 222/360 [00:46<00:35,  3.88it/s]
 62%|██████▏   | 223/360 [00:47<00:32,  4.19it/s]
 62%|██████▏   | 224/360 [00:47<00:30,  4.44it/s]
 62%|██████▎   | 225/360 [00:47<00:29,  4.63it/s]
 63%|██████▎   | 226/360 [00:47<00:28,  4.78it/s]
 63%|██████▎   | 227/360 [00:47<00:27,  4.88it/s]
 63%|██████▎   | 228/360 [00:48<00:26,  4.97it/s]
 64%|██████▎   | 229/360 [00:48<00:26,  5.03it/s]
 64%|██████▍   | 230/360 [00:48<00:25,  5.08it/s]
 64%|██████▍   | 231/360 [00:48<00:25,  5.10it/s]
 64%|██████▍   | 23

== Status ==
Current time: 2024-03-07 21:38:18 (running for 00:13:07.80)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (4 PENDING, 1 RUNNING, 10 TERMINATED)
+------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc              |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                  |                 |                    |                ch_size |                |             |
|------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00010 | RUNNING    | 172.19.0.1:10434 |     1.0763e-0

 68%|██████▊   | 243/360 [00:50<00:22,  5.15it/s]
 68%|██████▊   | 244/360 [00:51<00:22,  5.16it/s]
 68%|██████▊   | 245/360 [00:51<00:22,  5.18it/s]
 68%|██████▊   | 246/360 [00:51<00:21,  5.19it/s]
 69%|██████▊   | 247/360 [00:51<00:21,  5.19it/s]
 69%|██████▉   | 248/360 [00:51<00:21,  5.18it/s]
 69%|██████▉   | 249/360 [00:52<00:21,  5.18it/s]
 69%|██████▉   | 250/360 [00:52<00:21,  5.19it/s]
 70%|██████▉   | 251/360 [00:52<00:20,  5.19it/s]
 70%|███████   | 252/360 [00:52<00:20,  5.18it/s]
 70%|███████   | 253/360 [00:52<00:20,  5.17it/s]
 71%|███████   | 254/360 [00:53<00:20,  5.17it/s]
 71%|███████   | 255/360 [00:53<00:20,  5.15it/s]
 71%|███████   | 256/360 [00:53<00:20,  5.15it/s]
 71%|███████▏  | 257/360 [00:53<00:19,  5.16it/s]
 72%|███████▏  | 258/360 [00:53<00:19,  5.14it/s]
 72%|███████▏  | 259/360 [00:54<00:19,  5.16it/s]
 72%|███████▏  | 260/360 [00:54<00:19,  5.18it/s]
 72%|███████▎  | 261/360 [00:54<00:19,  5.19it/s]
 73%|███████▎  | 262/360 [00:54<00:18,  5.20it/s]


== Status ==
Current time: 2024-03-07 21:38:23 (running for 00:13:12.85)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (4 PENDING, 1 RUNNING, 10 TERMINATED)
+------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc              |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                  |                 |                    |                ch_size |                |             |
|------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00010 | RUNNING    | 172.19.0.1:10434 |     1.0763e-0

 75%|███████▍  | 269/360 [00:56<00:17,  5.14it/s]
 75%|███████▌  | 270/360 [00:56<00:17,  5.16it/s]
 75%|███████▌  | 271/360 [00:56<00:17,  5.17it/s]
 76%|███████▌  | 272/360 [00:56<00:17,  5.17it/s]
 76%|███████▌  | 273/360 [00:56<00:16,  5.16it/s]
 76%|███████▌  | 274/360 [00:56<00:16,  5.15it/s]
 76%|███████▋  | 275/360 [00:57<00:16,  5.15it/s]
 77%|███████▋  | 276/360 [00:57<00:16,  5.13it/s]
 77%|███████▋  | 277/360 [00:57<00:16,  5.15it/s]
 77%|███████▋  | 278/360 [00:57<00:15,  5.17it/s]
 78%|███████▊  | 279/360 [00:57<00:16,  5.02it/s]
 78%|███████▊  | 280/360 [00:58<00:15,  5.07it/s]
 78%|███████▊  | 281/360 [00:58<00:15,  5.11it/s]
 78%|███████▊  | 282/360 [00:58<00:15,  5.14it/s]
 79%|███████▊  | 283/360 [00:58<00:14,  5.16it/s]
 79%|███████▉  | 284/360 [00:58<00:14,  5.16it/s]
 79%|███████▉  | 285/360 [00:59<00:14,  5.16it/s]
 79%|███████▉  | 286/360 [00:59<00:14,  5.17it/s]
 80%|███████▉  | 287/360 [00:59<00:14,  5.17it/s]
 80%|████████  | 288/360 [00:59<00:13,  5.49it/s]


== Status ==
Current time: 2024-03-07 21:38:28 (running for 00:13:17.88)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (4 PENDING, 1 RUNNING, 10 TERMINATED)
+------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc              |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                  |                 |                    |                ch_size |                |             |
|------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00010 | RUNNING    | 172.19.0.1:10434 |     1.0763e-0

[36m(_objective pid=10434)[0m 
                                                 
 80%|████████  | 288/360 [01:00<00:13,  5.49it/s]
100%|██████████| 5/5 [00:01<00:00,  4.45it/s][A
                                             [A
 80%|████████  | 289/360 [01:01<00:41,  1.72it/s]
 81%|████████  | 290/360 [01:01<00:32,  2.15it/s]
 81%|████████  | 291/360 [01:01<00:26,  2.61it/s]
 81%|████████  | 292/360 [01:01<00:22,  3.07it/s]
 81%|████████▏ | 293/360 [01:01<00:19,  3.49it/s]
 82%|████████▏ | 294/360 [01:02<00:17,  3.88it/s]
 82%|████████▏ | 295/360 [01:02<00:15,  4.20it/s]
 82%|████████▏ | 296/360 [01:02<00:14,  4.44it/s]
 82%|████████▎ | 297/360 [01:02<00:13,  4.64it/s]
 83%|████████▎ | 298/360 [01:02<00:12,  4.78it/s]
 83%|████████▎ | 299/360 [01:03<00:12,  4.88it/s]
 83%|████████▎ | 300/360 [01:03<00:12,  4.97it/s]
 84%|████████▎ | 301/360 [01:03<00:11,  5.03it/s]
 84%|████████▍ | 302/360 [01:03<00:11,  5.07it/s]
 84%|████████▍ | 303/360 [01:03<00:11,  5.07it/s]
 84%|████████▍ | 30

== Status ==
Current time: 2024-03-07 21:38:33 (running for 00:13:22.93)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (4 PENDING, 1 RUNNING, 10 TERMINATED)
+------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc              |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                  |                 |                    |                ch_size |                |             |
|------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00010 | RUNNING    | 172.19.0.1:10434 |     1.0763e-0

 87%|████████▋ | 314/360 [01:06<00:08,  5.14it/s]
 88%|████████▊ | 315/360 [01:06<00:08,  5.14it/s]
 88%|████████▊ | 316/360 [01:06<00:08,  5.15it/s]
 88%|████████▊ | 317/360 [01:06<00:08,  5.16it/s]
 88%|████████▊ | 318/360 [01:06<00:08,  5.16it/s]
 89%|████████▊ | 319/360 [01:06<00:07,  5.14it/s]
 89%|████████▉ | 320/360 [01:07<00:07,  5.15it/s]
 89%|████████▉ | 321/360 [01:07<00:07,  5.17it/s]
 89%|████████▉ | 322/360 [01:07<00:07,  5.18it/s]
 90%|████████▉ | 323/360 [01:07<00:07,  5.19it/s]
 90%|█████████ | 324/360 [01:07<00:06,  5.18it/s]
 90%|█████████ | 325/360 [01:08<00:06,  5.17it/s]
 91%|█████████ | 326/360 [01:08<00:06,  5.18it/s]
 91%|█████████ | 327/360 [01:08<00:06,  5.18it/s]
 91%|█████████ | 328/360 [01:08<00:06,  5.17it/s]
 91%|█████████▏| 329/360 [01:08<00:06,  5.16it/s]
 92%|█████████▏| 330/360 [01:09<00:05,  5.17it/s]
 92%|█████████▏| 331/360 [01:09<00:05,  5.16it/s]
 92%|█████████▏| 332/360 [01:09<00:05,  5.16it/s]
 92%|█████████▎| 333/360 [01:09<00:05,  5.17it/s]


== Status ==
Current time: 2024-03-07 21:38:38 (running for 00:13:27.96)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (4 PENDING, 1 RUNNING, 10 TERMINATED)
+------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc              |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                  |                 |                    |                ch_size |                |             |
|------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00010 | RUNNING    | 172.19.0.1:10434 |     1.0763e-0

 94%|█████████▍| 340/360 [01:11<00:03,  5.18it/s]
 95%|█████████▍| 341/360 [01:11<00:03,  5.19it/s]
 95%|█████████▌| 342/360 [01:11<00:03,  5.19it/s]
 95%|█████████▌| 343/360 [01:11<00:03,  5.17it/s]
 96%|█████████▌| 344/360 [01:11<00:03,  5.16it/s]
 96%|█████████▌| 345/360 [01:12<00:02,  5.16it/s]
 96%|█████████▌| 346/360 [01:12<00:02,  5.16it/s]
 96%|█████████▋| 347/360 [01:12<00:02,  5.17it/s]
 97%|█████████▋| 348/360 [01:12<00:02,  5.18it/s]
 97%|█████████▋| 349/360 [01:12<00:02,  5.17it/s]
 97%|█████████▋| 350/360 [01:12<00:01,  5.17it/s]
 98%|█████████▊| 351/360 [01:13<00:01,  5.18it/s]
 98%|█████████▊| 352/360 [01:13<00:01,  5.19it/s]
 98%|█████████▊| 353/360 [01:13<00:01,  5.20it/s]
 98%|█████████▊| 354/360 [01:13<00:01,  5.20it/s]
 99%|█████████▊| 355/360 [01:13<00:00,  5.17it/s]
 99%|█████████▉| 356/360 [01:14<00:00,  5.18it/s]
 99%|█████████▉| 357/360 [01:14<00:00,  5.18it/s]
 99%|█████████▉| 358/360 [01:14<00:00,  5.18it/s]
100%|█████████▉| 359/360 [01:14<00:00,  5.17it/s]


== Status ==
Current time: 2024-03-07 21:38:43 (running for 00:13:33.00)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (4 PENDING, 1 RUNNING, 10 TERMINATED)
+------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc              |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                  |                 |                    |                ch_size |                |             |
|------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00010 | RUNNING    | 172.19.0.1:10434 |     1.0763e-0

[36m(_objective pid=10434)[0m 
                                                 
100%|██████████| 360/360 [01:16<00:00,  5.47it/s]
100%|██████████| 5/5 [00:01<00:00,  4.47it/s][A
                                             [A
100%|██████████| 360/360 [01:16<00:00,  4.73it/s]


== Status ==
Current time: 2024-03-07 21:38:48 (running for 00:13:38.01)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (3 PENDING, 1 RUNNING, 11 TERMINATED)
+------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc              |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                  |                 |                    |                ch_size |                |             |
|------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00011 | RUNNING    | 172.19.0.1:10685 |     1.65956e-

[36m(_objective pid=10685)[0m 2024-03-07 21:38:49.769764: E external/local_xla/xla/stream_executor/cuda/cuda_dnn.cc:9261] Unable to register cuDNN factory: Attempting to register factory for plugin cuDNN when one has already been registered
[36m(_objective pid=10685)[0m 2024-03-07 21:38:49.769820: E external/local_xla/xla/stream_executor/cuda/cuda_fft.cc:607] Unable to register cuFFT factory: Attempting to register factory for plugin cuFFT when one has already been registered
[36m(_objective pid=10685)[0m 2024-03-07 21:38:49.771151: E external/local_xla/xla/stream_executor/cuda/cuda_blas.cc:1515] Unable to register cuBLAS factory: Attempting to register factory for plugin cuBLAS when one has already been registered
[36m(_objective pid=10685)[0m Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weig

== Status ==
Current time: 2024-03-07 21:38:53 (running for 00:13:43.06)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (3 PENDING, 1 RUNNING, 11 TERMINATED)
+------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc              |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                  |                 |                    |                ch_size |                |             |
|------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00011 | RUNNING    | 172.19.0.1:10685 |     1.65956e-

  1%|          | 2/180 [00:00<01:17,  2.31it/s]
  2%|▏         | 3/180 [00:01<01:10,  2.52it/s]
  2%|▏         | 4/180 [00:01<01:06,  2.63it/s]
  3%|▎         | 5/180 [00:01<01:05,  2.67it/s]
  3%|▎         | 6/180 [00:02<01:03,  2.72it/s]
  4%|▍         | 7/180 [00:02<01:03,  2.74it/s]
  4%|▍         | 8/180 [00:03<01:02,  2.77it/s]
  5%|▌         | 9/180 [00:03<01:01,  2.78it/s]
  6%|▌         | 10/180 [00:03<01:00,  2.79it/s]
  6%|▌         | 11/180 [00:04<01:00,  2.80it/s]
  7%|▋         | 12/180 [00:04<00:59,  2.80it/s]
  7%|▋         | 13/180 [00:04<00:59,  2.80it/s]
  8%|▊         | 14/180 [00:05<00:59,  2.80it/s]
  8%|▊         | 15/180 [00:05<00:58,  2.80it/s]


== Status ==
Current time: 2024-03-07 21:38:59 (running for 00:13:48.10)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (3 PENDING, 1 RUNNING, 11 TERMINATED)
+------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc              |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                  |                 |                    |                ch_size |                |             |
|------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00011 | RUNNING    | 172.19.0.1:10685 |     1.65956e-

  9%|▉         | 16/180 [00:05<00:58,  2.80it/s]
  9%|▉         | 17/180 [00:06<00:58,  2.81it/s]
 10%|█         | 18/180 [00:06<00:57,  2.80it/s]
 11%|█         | 19/180 [00:06<00:57,  2.80it/s]
 11%|█         | 20/180 [00:07<00:56,  2.81it/s]
 12%|█▏        | 21/180 [00:07<00:56,  2.80it/s]
 12%|█▏        | 22/180 [00:08<00:56,  2.81it/s]
 13%|█▎        | 23/180 [00:08<00:55,  2.81it/s]
 13%|█▎        | 24/180 [00:08<00:55,  2.80it/s]
 14%|█▍        | 25/180 [00:09<00:55,  2.81it/s]
 14%|█▍        | 26/180 [00:09<00:54,  2.80it/s]
 15%|█▌        | 27/180 [00:09<00:54,  2.81it/s]
 16%|█▌        | 28/180 [00:10<00:54,  2.81it/s]
 16%|█▌        | 29/180 [00:10<00:53,  2.80it/s]


== Status ==
Current time: 2024-03-07 21:39:04 (running for 00:13:53.14)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (3 PENDING, 1 RUNNING, 11 TERMINATED)
+------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc              |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                  |                 |                    |                ch_size |                |             |
|------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00011 | RUNNING    | 172.19.0.1:10685 |     1.65956e-

 17%|█▋        | 30/180 [00:10<00:53,  2.80it/s]
 17%|█▋        | 31/180 [00:11<00:53,  2.80it/s]
 18%|█▊        | 32/180 [00:11<00:52,  2.80it/s]
 18%|█▊        | 33/180 [00:11<00:52,  2.81it/s]
 19%|█▉        | 34/180 [00:12<00:51,  2.81it/s]
 19%|█▉        | 35/180 [00:12<00:51,  2.80it/s]
 20%|██        | 36/180 [00:12<00:49,  2.90it/s]
[36m(_objective pid=10685)[0m 
  0%|          | 0/5 [00:00<?, ?it/s][A
[36m(_objective pid=10685)[0m 
 40%|████      | 2/5 [00:00<00:00,  7.57it/s][A
[36m(_objective pid=10685)[0m 
 60%|██████    | 3/5 [00:00<00:00,  5.32it/s][A
[36m(_objective pid=10685)[0m 
 80%|████████  | 4/5 [00:00<00:00,  4.65it/s][A
[36m(_objective pid=10685)[0m 
                                                
 20%|██        | 36/180 [00:14<00:49,  2.90it/s]
100%|██████████| 5/5 [00:01<00:00,  4.47it/s][A
                                             [A


[36m(_objective pid=10685)[0m {'eval_loss': 0.6909559369087219, 'eval_accuracy': 0.5949367088607594, 'eval_runtime': 1.2981, 'eval_samples_per_second': 60.858, 'eval_steps_per_second': 3.852, 'epoch': 1.0}


 21%|██        | 37/180 [00:14<01:46,  1.34it/s]
 21%|██        | 38/180 [00:15<01:29,  1.59it/s]
 22%|██▏       | 39/180 [00:15<01:17,  1.83it/s]
 22%|██▏       | 40/180 [00:15<01:08,  2.03it/s]


== Status ==
Current time: 2024-03-07 21:39:09 (running for 00:13:58.24)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (3 PENDING, 1 RUNNING, 11 TERMINATED)
+------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc              |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                  |                 |                    |                ch_size |                |             |
|------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00011 | RUNNING    | 172.19.0.1:10685 |     1.65956e-

 23%|██▎       | 41/180 [00:16<01:02,  2.21it/s]
 23%|██▎       | 42/180 [00:16<00:58,  2.36it/s]
 24%|██▍       | 43/180 [00:16<00:55,  2.48it/s]
 24%|██▍       | 44/180 [00:17<00:52,  2.57it/s]
 25%|██▌       | 45/180 [00:17<00:51,  2.63it/s]
 26%|██▌       | 46/180 [00:17<00:49,  2.68it/s]
 26%|██▌       | 47/180 [00:18<00:48,  2.72it/s]
 27%|██▋       | 48/180 [00:18<00:48,  2.74it/s]
 27%|██▋       | 49/180 [00:18<00:47,  2.76it/s]
 28%|██▊       | 50/180 [00:19<00:46,  2.78it/s]
 28%|██▊       | 51/180 [00:19<00:46,  2.78it/s]
 29%|██▉       | 52/180 [00:20<00:45,  2.79it/s]
 29%|██▉       | 53/180 [00:20<00:45,  2.79it/s]
 30%|███       | 54/180 [00:20<00:45,  2.79it/s]


== Status ==
Current time: 2024-03-07 21:39:14 (running for 00:14:03.28)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (3 PENDING, 1 RUNNING, 11 TERMINATED)
+------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc              |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                  |                 |                    |                ch_size |                |             |
|------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00011 | RUNNING    | 172.19.0.1:10685 |     1.65956e-

 31%|███       | 55/180 [00:21<00:44,  2.79it/s]
 31%|███       | 56/180 [00:21<00:44,  2.80it/s]
 32%|███▏      | 57/180 [00:21<00:43,  2.80it/s]
 32%|███▏      | 58/180 [00:22<00:43,  2.80it/s]
 33%|███▎      | 59/180 [00:22<00:43,  2.80it/s]
 33%|███▎      | 60/180 [00:22<00:42,  2.80it/s]
 34%|███▍      | 61/180 [00:23<00:42,  2.81it/s]
 34%|███▍      | 62/180 [00:23<00:42,  2.80it/s]
 35%|███▌      | 63/180 [00:23<00:41,  2.80it/s]
 36%|███▌      | 64/180 [00:24<00:41,  2.80it/s]
 36%|███▌      | 65/180 [00:24<00:41,  2.80it/s]
 37%|███▋      | 66/180 [00:25<00:40,  2.80it/s]
 37%|███▋      | 67/180 [00:25<00:40,  2.80it/s]
 38%|███▊      | 68/180 [00:25<00:40,  2.80it/s]


== Status ==
Current time: 2024-03-07 21:39:19 (running for 00:14:08.31)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (3 PENDING, 1 RUNNING, 11 TERMINATED)
+------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc              |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                  |                 |                    |                ch_size |                |             |
|------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00011 | RUNNING    | 172.19.0.1:10685 |     1.65956e-

 38%|███▊      | 69/180 [00:26<00:39,  2.80it/s]
 39%|███▉      | 70/180 [00:26<00:39,  2.80it/s]
 39%|███▉      | 71/180 [00:26<00:38,  2.80it/s]
 40%|████      | 72/180 [00:27<00:37,  2.90it/s]
[36m(_objective pid=10685)[0m 
  0%|          | 0/5 [00:00<?, ?it/s][A
[36m(_objective pid=10685)[0m 
 40%|████      | 2/5 [00:00<00:00,  7.45it/s][A
[36m(_objective pid=10685)[0m 
 60%|██████    | 3/5 [00:00<00:00,  5.35it/s][A
[36m(_objective pid=10685)[0m 
 80%|████████  | 4/5 [00:00<00:00,  4.67it/s][A
[36m(_objective pid=10685)[0m 
                                                
 40%|████      | 72/180 [00:28<00:37,  2.90it/s]
100%|██████████| 5/5 [00:01<00:00,  4.48it/s][A
                                             [A


[36m(_objective pid=10685)[0m {'eval_loss': 0.6571863889694214, 'eval_accuracy': 0.6075949367088608, 'eval_runtime': 1.2972, 'eval_samples_per_second': 60.899, 'eval_steps_per_second': 3.854, 'epoch': 2.0}


 41%|████      | 73/180 [00:28<01:19,  1.35it/s]
 41%|████      | 74/180 [00:29<01:06,  1.60it/s]
 42%|████▏     | 75/180 [00:29<00:57,  1.84it/s]
 42%|████▏     | 76/180 [00:29<00:50,  2.05it/s]
 43%|████▎     | 77/180 [00:30<00:46,  2.23it/s]
 43%|████▎     | 78/180 [00:30<00:42,  2.37it/s]
 44%|████▍     | 79/180 [00:30<00:40,  2.50it/s]


== Status ==
Current time: 2024-03-07 21:39:24 (running for 00:14:13.37)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (3 PENDING, 1 RUNNING, 11 TERMINATED)
+------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc              |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                  |                 |                    |                ch_size |                |             |
|------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00011 | RUNNING    | 172.19.0.1:10685 |     1.65956e-

 44%|████▍     | 80/180 [00:31<00:38,  2.58it/s]
 45%|████▌     | 81/180 [00:31<00:37,  2.64it/s]
 46%|████▌     | 82/180 [00:31<00:36,  2.69it/s]
 46%|████▌     | 83/180 [00:32<00:35,  2.72it/s]
 47%|████▋     | 84/180 [00:32<00:35,  2.74it/s]
 47%|████▋     | 85/180 [00:33<00:34,  2.76it/s]
 48%|████▊     | 86/180 [00:33<00:33,  2.77it/s]
 48%|████▊     | 87/180 [00:33<00:33,  2.78it/s]
 49%|████▉     | 88/180 [00:34<00:33,  2.79it/s]
 49%|████▉     | 89/180 [00:34<00:32,  2.79it/s]
 50%|█████     | 90/180 [00:34<00:32,  2.79it/s]
 51%|█████     | 91/180 [00:35<00:31,  2.79it/s]
 51%|█████     | 92/180 [00:35<00:31,  2.80it/s]
 52%|█████▏    | 93/180 [00:35<00:31,  2.80it/s]


== Status ==
Current time: 2024-03-07 21:39:29 (running for 00:14:18.41)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (3 PENDING, 1 RUNNING, 11 TERMINATED)
+------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc              |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                  |                 |                    |                ch_size |                |             |
|------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00011 | RUNNING    | 172.19.0.1:10685 |     1.65956e-

 52%|█████▏    | 94/180 [00:36<00:30,  2.80it/s]
 53%|█████▎    | 95/180 [00:36<00:30,  2.79it/s]
 53%|█████▎    | 96/180 [00:37<00:30,  2.79it/s]
 54%|█████▍    | 97/180 [00:37<00:29,  2.80it/s]
 54%|█████▍    | 98/180 [00:37<00:29,  2.80it/s]
 55%|█████▌    | 99/180 [00:38<00:28,  2.80it/s]
 56%|█████▌    | 100/180 [00:38<00:28,  2.80it/s]
 56%|█████▌    | 101/180 [00:38<00:28,  2.80it/s]
 57%|█████▋    | 102/180 [00:39<00:27,  2.80it/s]
 57%|█████▋    | 103/180 [00:39<00:27,  2.79it/s]
 58%|█████▊    | 104/180 [00:39<00:27,  2.80it/s]
 58%|█████▊    | 105/180 [00:40<00:26,  2.80it/s]
 59%|█████▉    | 106/180 [00:40<00:26,  2.79it/s]
 59%|█████▉    | 107/180 [00:40<00:26,  2.80it/s]


== Status ==
Current time: 2024-03-07 21:39:34 (running for 00:14:23.45)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (3 PENDING, 1 RUNNING, 11 TERMINATED)
+------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc              |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                  |                 |                    |                ch_size |                |             |
|------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00011 | RUNNING    | 172.19.0.1:10685 |     1.65956e-

 60%|██████    | 108/180 [00:41<00:24,  2.91it/s]
[36m(_objective pid=10685)[0m 
  0%|          | 0/5 [00:00<?, ?it/s][A
[36m(_objective pid=10685)[0m 
 40%|████      | 2/5 [00:00<00:00,  7.62it/s][A
[36m(_objective pid=10685)[0m 
 60%|██████    | 3/5 [00:00<00:00,  5.37it/s][A
[36m(_objective pid=10685)[0m 
 80%|████████  | 4/5 [00:00<00:00,  4.68it/s][A
[36m(_objective pid=10685)[0m 
                                                 
 60%|██████    | 108/180 [00:42<00:24,  2.91it/s]
100%|██████████| 5/5 [00:01<00:00,  4.47it/s][A
                                             [A


[36m(_objective pid=10685)[0m {'eval_loss': 0.6626661419868469, 'eval_accuracy': 0.569620253164557, 'eval_runtime': 1.2995, 'eval_samples_per_second': 60.791, 'eval_steps_per_second': 3.848, 'epoch': 3.0}


 61%|██████    | 109/180 [00:42<00:52,  1.35it/s]
 61%|██████    | 110/180 [00:43<00:43,  1.60it/s]
 62%|██████▏   | 111/180 [00:43<00:37,  1.83it/s]
 62%|██████▏   | 112/180 [00:43<00:33,  2.05it/s]
 63%|██████▎   | 113/180 [00:44<00:30,  2.23it/s]
 63%|██████▎   | 114/180 [00:44<00:27,  2.37it/s]
 64%|██████▍   | 115/180 [00:45<00:26,  2.48it/s]
 64%|██████▍   | 116/180 [00:45<00:24,  2.57it/s]
 65%|██████▌   | 117/180 [00:45<00:23,  2.64it/s]
 66%|██████▌   | 118/180 [00:46<00:23,  2.69it/s]


== Status ==
Current time: 2024-03-07 21:39:39 (running for 00:14:28.50)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (3 PENDING, 1 RUNNING, 11 TERMINATED)
+------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc              |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                  |                 |                    |                ch_size |                |             |
|------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00011 | RUNNING    | 172.19.0.1:10685 |     1.65956e-

 66%|██████▌   | 119/180 [00:46<00:22,  2.72it/s]
 67%|██████▋   | 120/180 [00:46<00:21,  2.75it/s]
 67%|██████▋   | 121/180 [00:47<00:21,  2.76it/s]
 68%|██████▊   | 122/180 [00:47<00:20,  2.77it/s]
 68%|██████▊   | 123/180 [00:47<00:20,  2.78it/s]
 69%|██████▉   | 124/180 [00:48<00:20,  2.79it/s]
 69%|██████▉   | 125/180 [00:48<00:19,  2.79it/s]
 70%|███████   | 126/180 [00:48<00:19,  2.80it/s]
 71%|███████   | 127/180 [00:49<00:18,  2.80it/s]
 71%|███████   | 128/180 [00:49<00:18,  2.80it/s]
 72%|███████▏  | 129/180 [00:50<00:18,  2.80it/s]
 72%|███████▏  | 130/180 [00:50<00:17,  2.80it/s]
 73%|███████▎  | 131/180 [00:50<00:17,  2.80it/s]
 73%|███████▎  | 132/180 [00:51<00:17,  2.80it/s]


== Status ==
Current time: 2024-03-07 21:39:44 (running for 00:14:33.54)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (3 PENDING, 1 RUNNING, 11 TERMINATED)
+------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc              |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                  |                 |                    |                ch_size |                |             |
|------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00011 | RUNNING    | 172.19.0.1:10685 |     1.65956e-

 74%|███████▍  | 133/180 [00:51<00:16,  2.80it/s]
 74%|███████▍  | 134/180 [00:51<00:16,  2.80it/s]
 75%|███████▌  | 135/180 [00:52<00:16,  2.80it/s]
 76%|███████▌  | 136/180 [00:52<00:15,  2.80it/s]
 76%|███████▌  | 137/180 [00:52<00:15,  2.79it/s]
 77%|███████▋  | 138/180 [00:53<00:14,  2.80it/s]
 77%|███████▋  | 139/180 [00:53<00:14,  2.79it/s]
 78%|███████▊  | 140/180 [00:53<00:14,  2.80it/s]
 78%|███████▊  | 141/180 [00:54<00:13,  2.80it/s]
 79%|███████▉  | 142/180 [00:54<00:13,  2.79it/s]
 79%|███████▉  | 143/180 [00:55<00:13,  2.81it/s]
 80%|████████  | 144/180 [00:55<00:12,  2.90it/s]
[36m(_objective pid=10685)[0m 
  0%|          | 0/5 [00:00<?, ?it/s][A
[36m(_objective pid=10685)[0m 
 40%|████      | 2/5 [00:00<00:00,  7.61it/s][A
[36m(_objective pid=10685)[0m 
 60%|██████    | 3/5 [00:00<00:00,  5.34it/s][A


== Status ==
Current time: 2024-03-07 21:39:49 (running for 00:14:38.57)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (3 PENDING, 1 RUNNING, 11 TERMINATED)
+------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc              |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                  |                 |                    |                ch_size |                |             |
|------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00011 | RUNNING    | 172.19.0.1:10685 |     1.65956e-

[36m(_objective pid=10685)[0m 
 80%|████████  | 4/5 [00:00<00:00,  4.65it/s][A
[36m(_objective pid=10685)[0m 
                                                 
 80%|████████  | 144/180 [00:56<00:12,  2.90it/s]
100%|██████████| 5/5 [00:01<00:00,  4.48it/s][A
                                             [A


[36m(_objective pid=10685)[0m {'eval_loss': 0.6580783724784851, 'eval_accuracy': 0.5949367088607594, 'eval_runtime': 1.2997, 'eval_samples_per_second': 60.783, 'eval_steps_per_second': 3.847, 'epoch': 4.0}


 81%|████████  | 145/180 [00:57<00:25,  1.35it/s]
 81%|████████  | 146/180 [00:57<00:21,  1.60it/s]
 82%|████████▏ | 147/180 [00:57<00:17,  1.84it/s]
 82%|████████▏ | 148/180 [00:58<00:15,  2.05it/s]
 83%|████████▎ | 149/180 [00:58<00:13,  2.23it/s]
 83%|████████▎ | 150/180 [00:58<00:12,  2.37it/s]
 84%|████████▍ | 151/180 [00:59<00:11,  2.49it/s]
 84%|████████▍ | 152/180 [00:59<00:10,  2.57it/s]
 85%|████████▌ | 153/180 [00:59<00:10,  2.63it/s]
 86%|████████▌ | 154/180 [01:00<00:09,  2.69it/s]
 86%|████████▌ | 155/180 [01:00<00:09,  2.71it/s]
 87%|████████▋ | 156/180 [01:00<00:08,  2.74it/s]
 87%|████████▋ | 157/180 [01:01<00:08,  2.76it/s]


== Status ==
Current time: 2024-03-07 21:39:54 (running for 00:14:43.63)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (3 PENDING, 1 RUNNING, 11 TERMINATED)
+------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc              |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                  |                 |                    |                ch_size |                |             |
|------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00011 | RUNNING    | 172.19.0.1:10685 |     1.65956e-

 88%|████████▊ | 158/180 [01:01<00:07,  2.78it/s]
 88%|████████▊ | 159/180 [01:02<00:07,  2.76it/s]
 89%|████████▉ | 160/180 [01:02<00:07,  2.78it/s]
 89%|████████▉ | 161/180 [01:02<00:06,  2.78it/s]
 90%|█████████ | 162/180 [01:03<00:06,  2.78it/s]
 91%|█████████ | 163/180 [01:03<00:06,  2.79it/s]
 91%|█████████ | 164/180 [01:03<00:05,  2.79it/s]
 92%|█████████▏| 165/180 [01:04<00:05,  2.80it/s]
 92%|█████████▏| 166/180 [01:04<00:05,  2.79it/s]
 93%|█████████▎| 167/180 [01:04<00:04,  2.80it/s]
 93%|█████████▎| 168/180 [01:05<00:04,  2.80it/s]
 94%|█████████▍| 169/180 [01:05<00:03,  2.79it/s]
 94%|█████████▍| 170/180 [01:05<00:03,  2.80it/s]
 95%|█████████▌| 171/180 [01:06<00:03,  2.80it/s]


== Status ==
Current time: 2024-03-07 21:39:59 (running for 00:14:48.66)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (3 PENDING, 1 RUNNING, 11 TERMINATED)
+------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc              |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                  |                 |                    |                ch_size |                |             |
|------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00011 | RUNNING    | 172.19.0.1:10685 |     1.65956e-

 96%|█████████▌| 172/180 [01:06<00:02,  2.80it/s]
 96%|█████████▌| 173/180 [01:07<00:02,  2.80it/s]
 97%|█████████▋| 174/180 [01:07<00:02,  2.81it/s]
 97%|█████████▋| 175/180 [01:07<00:01,  2.80it/s]
 98%|█████████▊| 176/180 [01:08<00:01,  2.79it/s]
 98%|█████████▊| 177/180 [01:08<00:01,  2.80it/s]
 99%|█████████▉| 178/180 [01:08<00:00,  2.80it/s]
 99%|█████████▉| 179/180 [01:09<00:00,  2.80it/s]
100%|██████████| 180/180 [01:09<00:00,  2.89it/s]
[36m(_objective pid=10685)[0m 
  0%|          | 0/5 [00:00<?, ?it/s][A
[36m(_objective pid=10685)[0m 
 40%|████      | 2/5 [00:00<00:00,  7.62it/s][A
[36m(_objective pid=10685)[0m 
 60%|██████    | 3/5 [00:00<00:00,  5.36it/s][A
[36m(_objective pid=10685)[0m 
 80%|████████  | 4/5 [00:00<00:00,  4.66it/s][A
[36m(_objective pid=10685)[0m 
                                                 
100%|██████████| 180/180 [01:10<00:00,  2.89it/s]
100%|██████████| 5/5 [00:01<00:00,  4.50it/s][A
                                             [A

[36m(_objective pid=10685)[0m {'eval_loss': 0.6461213231086731, 'eval_accuracy': 0.620253164556962, 'eval_runtime': 1.294, 'eval_samples_per_second': 61.053, 'eval_steps_per_second': 3.864, 'epoch': 5.0}


100%|██████████| 180/180 [01:10<00:00,  2.54it/s]


[36m(_objective pid=10685)[0m {'train_runtime': 70.8123, 'train_samples_per_second': 20.265, 'train_steps_per_second': 2.542, 'train_loss': 0.5998219807942708, 'epoch': 5.0}
== Status ==
Current time: 2024-03-07 21:40:04 (running for 00:14:53.75)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (3 PENDING, 12 TERMINATED)
+------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc              |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                  |                 |                    |                ch_size |                |             |
|------------------------+------------+------------------+---

[36m(_objective pid=10928)[0m 2024-03-07 21:40:09.634500: E external/local_xla/xla/stream_executor/cuda/cuda_dnn.cc:9261] Unable to register cuDNN factory: Attempting to register factory for plugin cuDNN when one has already been registered
[36m(_objective pid=10928)[0m 2024-03-07 21:40:09.634553: E external/local_xla/xla/stream_executor/cuda/cuda_fft.cc:607] Unable to register cuFFT factory: Attempting to register factory for plugin cuFFT when one has already been registered
[36m(_objective pid=10928)[0m 2024-03-07 21:40:09.635877: E external/local_xla/xla/stream_executor/cuda/cuda_blas.cc:1515] Unable to register cuBLAS factory: Attempting to register factory for plugin cuBLAS when one has already been registered


== Status ==
Current time: 2024-03-07 21:40:09 (running for 00:14:58.81)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (2 PENDING, 1 RUNNING, 12 TERMINATED)
+------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc              |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                  |                 |                    |                ch_size |                |             |
|------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00012 | RUNNING    | 172.19.0.1:10928 |     3.29276e-

[36m(_objective pid=10928)[0m Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']
[36m(_objective pid=10928)[0m You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.
  0%|          | 0/216 [00:00<?, ?it/s]
  0%|          | 1/216 [00:00<01:24,  2.54it/s]
  1%|          | 2/216 [00:00<00:56,  3.76it/s]
  1%|▏         | 3/216 [00:00<00:49,  4.30it/s]
  2%|▏         | 4/216 [00:00<00:46,  4.61it/s]
  2%|▏         | 5/216 [00:01<00:43,  4.81it/s]
  3%|▎         | 6/216 [00:01<00:42,  4.93it/s]
  3%|▎         | 7/216 [00:01<00:41,  5.00it/s]
  4%|▎         | 8/216 [00:01<00:41,  5.06it/s]


== Status ==
Current time: 2024-03-07 21:40:14 (running for 00:15:03.86)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (2 PENDING, 1 RUNNING, 12 TERMINATED)
+------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc              |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                  |                 |                    |                ch_size |                |             |
|------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00012 | RUNNING    | 172.19.0.1:10928 |     3.29276e-

  4%|▍         | 9/216 [00:01<00:40,  5.07it/s]
  5%|▍         | 10/216 [00:02<00:40,  5.11it/s]
  5%|▌         | 11/216 [00:02<00:39,  5.14it/s]
  6%|▌         | 12/216 [00:02<00:39,  5.16it/s]
  6%|▌         | 13/216 [00:02<00:39,  5.19it/s]
  6%|▋         | 14/216 [00:02<00:39,  5.17it/s]
  7%|▋         | 15/216 [00:03<00:38,  5.17it/s]
  7%|▋         | 16/216 [00:03<00:38,  5.18it/s]
  8%|▊         | 17/216 [00:03<00:38,  5.19it/s]
  8%|▊         | 18/216 [00:03<00:38,  5.20it/s]
  9%|▉         | 19/216 [00:03<00:38,  5.18it/s]
  9%|▉         | 20/216 [00:04<00:37,  5.18it/s]
 10%|▉         | 21/216 [00:04<00:37,  5.17it/s]
 10%|█         | 22/216 [00:04<00:37,  5.18it/s]
 11%|█         | 23/216 [00:04<00:37,  5.18it/s]
 11%|█         | 24/216 [00:04<00:37,  5.16it/s]
 12%|█▏        | 25/216 [00:05<00:36,  5.18it/s]
 12%|█▏        | 26/216 [00:05<00:36,  5.19it/s]
 12%|█▎        | 27/216 [00:05<00:36,  5.19it/s]
 13%|█▎        | 28/216 [00:05<00:36,  5.19it/s]
 13%|█▎        | 29/2

== Status ==
Current time: 2024-03-07 21:40:19 (running for 00:15:08.90)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (2 PENDING, 1 RUNNING, 12 TERMINATED)
+------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc              |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                  |                 |                    |                ch_size |                |             |
|------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00012 | RUNNING    | 172.19.0.1:10928 |     3.29276e-

 17%|█▋        | 36/216 [00:07<00:34,  5.17it/s]
 17%|█▋        | 37/216 [00:07<00:34,  5.17it/s]
 18%|█▊        | 38/216 [00:07<00:34,  5.17it/s]
 18%|█▊        | 39/216 [00:07<00:34,  5.16it/s]
 19%|█▊        | 40/216 [00:07<00:34,  5.15it/s]
 19%|█▉        | 41/216 [00:08<00:33,  5.17it/s]
 19%|█▉        | 42/216 [00:08<00:33,  5.19it/s]
 20%|█▉        | 43/216 [00:08<00:33,  5.19it/s]
 20%|██        | 44/216 [00:08<00:33,  5.20it/s]
 21%|██        | 45/216 [00:08<00:33,  5.18it/s]
 21%|██▏       | 46/216 [00:09<00:32,  5.19it/s]
 22%|██▏       | 47/216 [00:09<00:32,  5.20it/s]
 22%|██▏       | 48/216 [00:09<00:32,  5.19it/s]
 23%|██▎       | 49/216 [00:09<00:32,  5.20it/s]
 23%|██▎       | 50/216 [00:09<00:32,  5.17it/s]
 24%|██▎       | 51/216 [00:10<00:31,  5.17it/s]
 24%|██▍       | 52/216 [00:10<00:31,  5.17it/s]
 25%|██▍       | 53/216 [00:10<00:31,  5.18it/s]
 25%|██▌       | 54/216 [00:10<00:31,  5.19it/s]
 25%|██▌       | 55/216 [00:10<00:31,  5.18it/s]
 26%|██▌       | 56/

== Status ==
Current time: 2024-03-07 21:40:24 (running for 00:15:13.93)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (2 PENDING, 1 RUNNING, 12 TERMINATED)
+------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc              |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                  |                 |                    |                ch_size |                |             |
|------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00012 | RUNNING    | 172.19.0.1:10928 |     3.29276e-

 28%|██▊       | 61/216 [00:11<00:29,  5.21it/s]
 29%|██▊       | 62/216 [00:12<00:29,  5.20it/s]
 29%|██▉       | 63/216 [00:12<00:29,  5.18it/s]
 30%|██▉       | 64/216 [00:12<00:29,  5.18it/s]
 30%|███       | 65/216 [00:12<00:29,  5.18it/s]
 31%|███       | 66/216 [00:12<00:29,  5.17it/s]
 31%|███       | 67/216 [00:13<00:28,  5.17it/s]
 31%|███▏      | 68/216 [00:13<00:28,  5.18it/s]
 32%|███▏      | 69/216 [00:13<00:28,  5.18it/s]
 32%|███▏      | 70/216 [00:13<00:28,  5.19it/s]
 33%|███▎      | 71/216 [00:13<00:27,  5.18it/s]
 33%|███▎      | 72/216 [00:14<00:26,  5.51it/s]
[36m(_objective pid=10928)[0m 
  0%|          | 0/5 [00:00<?, ?it/s][A
[36m(_objective pid=10928)[0m 
 40%|████      | 2/5 [00:00<00:00,  7.59it/s][A
[36m(_objective pid=10928)[0m 
 60%|██████    | 3/5 [00:00<00:00,  5.34it/s][A
[36m(_objective pid=10928)[0m 
 80%|████████  | 4/5 [00:00<00:00,  4.67it/s][A
[36m(_objective pid=10928)[0m 
                                                
 33%|███▎ 

[36m(_objective pid=10928)[0m {'eval_loss': 0.6905173659324646, 'eval_accuracy': 0.5569620253164557, 'eval_runtime': 1.2964, 'eval_samples_per_second': 60.937, 'eval_steps_per_second': 3.857, 'epoch': 1.0}


 34%|███▍      | 73/216 [00:15<01:22,  1.73it/s]
 34%|███▍      | 74/216 [00:15<01:05,  2.16it/s]
 35%|███▍      | 75/216 [00:15<00:53,  2.62it/s]
 35%|███▌      | 76/216 [00:16<00:45,  3.07it/s]
 36%|███▌      | 77/216 [00:16<00:39,  3.50it/s]
 36%|███▌      | 78/216 [00:16<00:35,  3.87it/s]
 37%|███▋      | 79/216 [00:16<00:32,  4.17it/s]
 37%|███▋      | 80/216 [00:16<00:30,  4.40it/s]


== Status ==
Current time: 2024-03-07 21:40:29 (running for 00:15:18.96)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (2 PENDING, 1 RUNNING, 12 TERMINATED)
+------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc              |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                  |                 |                    |                ch_size |                |             |
|------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00012 | RUNNING    | 172.19.0.1:10928 |     3.29276e-

 38%|███▊      | 81/216 [00:17<00:29,  4.61it/s]
 38%|███▊      | 82/216 [00:17<00:28,  4.77it/s]
 38%|███▊      | 83/216 [00:17<00:27,  4.90it/s]
 39%|███▉      | 84/216 [00:17<00:26,  4.98it/s]
 39%|███▉      | 85/216 [00:17<00:26,  5.02it/s]
 40%|███▉      | 86/216 [00:18<00:25,  5.08it/s]
 40%|████      | 87/216 [00:18<00:25,  5.12it/s]
 41%|████      | 88/216 [00:18<00:24,  5.13it/s]
 41%|████      | 89/216 [00:18<00:24,  5.15it/s]
 42%|████▏     | 90/216 [00:18<00:24,  5.13it/s]
 42%|████▏     | 91/216 [00:19<00:24,  5.13it/s]
 43%|████▎     | 92/216 [00:19<00:24,  5.14it/s]
 43%|████▎     | 93/216 [00:19<00:23,  5.15it/s]
 44%|████▎     | 94/216 [00:19<00:23,  5.16it/s]
 44%|████▍     | 95/216 [00:19<00:23,  5.15it/s]
 44%|████▍     | 96/216 [00:19<00:23,  5.17it/s]
 45%|████▍     | 97/216 [00:20<00:23,  5.17it/s]
 45%|████▌     | 98/216 [00:20<00:22,  5.19it/s]
 46%|████▌     | 99/216 [00:20<00:22,  5.20it/s]
 46%|████▋     | 100/216 [00:20<00:22,  5.19it/s]
 47%|████▋     | 10

== Status ==
Current time: 2024-03-07 21:40:34 (running for 00:15:24.01)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (2 PENDING, 1 RUNNING, 12 TERMINATED)
+------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc              |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                  |                 |                    |                ch_size |                |             |
|------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00012 | RUNNING    | 172.19.0.1:10928 |     3.29276e-

 50%|████▉     | 107/216 [00:22<00:21,  5.16it/s]
 50%|█████     | 108/216 [00:22<00:20,  5.17it/s]
 50%|█████     | 109/216 [00:22<00:20,  5.18it/s]
 51%|█████     | 110/216 [00:22<00:20,  5.19it/s]
 51%|█████▏    | 111/216 [00:22<00:20,  5.18it/s]
 52%|█████▏    | 112/216 [00:23<00:20,  5.18it/s]
 52%|█████▏    | 113/216 [00:23<00:19,  5.20it/s]
 53%|█████▎    | 114/216 [00:23<00:19,  5.20it/s]
 53%|█████▎    | 115/216 [00:23<00:19,  5.19it/s]
 54%|█████▎    | 116/216 [00:23<00:19,  5.17it/s]
 54%|█████▍    | 117/216 [00:24<00:19,  5.17it/s]
 55%|█████▍    | 118/216 [00:24<00:18,  5.17it/s]
 55%|█████▌    | 119/216 [00:24<00:18,  5.17it/s]
 56%|█████▌    | 120/216 [00:24<00:18,  5.17it/s]
 56%|█████▌    | 121/216 [00:24<00:18,  5.14it/s]
 56%|█████▋    | 122/216 [00:25<00:18,  5.15it/s]
 57%|█████▋    | 123/216 [00:25<00:18,  5.16it/s]
 57%|█████▋    | 124/216 [00:25<00:17,  5.17it/s]
 58%|█████▊    | 125/216 [00:25<00:17,  5.18it/s]
 58%|█████▊    | 126/216 [00:25<00:17,  5.17it/s]


== Status ==
Current time: 2024-03-07 21:40:39 (running for 00:15:29.05)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (2 PENDING, 1 RUNNING, 12 TERMINATED)
+------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc              |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                  |                 |                    |                ch_size |                |             |
|------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00012 | RUNNING    | 172.19.0.1:10928 |     3.29276e-

 62%|██████▏   | 133/216 [00:27<00:16,  5.16it/s]
 62%|██████▏   | 134/216 [00:27<00:15,  5.17it/s]
 62%|██████▎   | 135/216 [00:27<00:15,  5.17it/s]
 63%|██████▎   | 136/216 [00:27<00:15,  5.17it/s]
 63%|██████▎   | 137/216 [00:27<00:15,  5.16it/s]
 64%|██████▍   | 138/216 [00:28<00:15,  5.16it/s]
 64%|██████▍   | 139/216 [00:28<00:14,  5.16it/s]
 65%|██████▍   | 140/216 [00:28<00:14,  5.18it/s]
 65%|██████▌   | 141/216 [00:28<00:14,  5.18it/s]
 66%|██████▌   | 142/216 [00:28<00:14,  5.17it/s]
 66%|██████▌   | 143/216 [00:29<00:14,  5.19it/s]
 67%|██████▋   | 144/216 [00:29<00:13,  5.52it/s]
[36m(_objective pid=10928)[0m 
  0%|          | 0/5 [00:00<?, ?it/s][A
[36m(_objective pid=10928)[0m 
 40%|████      | 2/5 [00:00<00:00,  7.68it/s][A
[36m(_objective pid=10928)[0m 
 60%|██████    | 3/5 [00:00<00:00,  5.36it/s][A
[36m(_objective pid=10928)[0m 
 80%|████████  | 4/5 [00:00<00:00,  4.69it/s][A
[36m(_objective pid=10928)[0m 
                                               

[36m(_objective pid=10928)[0m {'eval_loss': 0.6914498805999756, 'eval_accuracy': 0.5443037974683544, 'eval_runtime': 1.296, 'eval_samples_per_second': 60.958, 'eval_steps_per_second': 3.858, 'epoch': 2.0}


 67%|██████▋   | 145/216 [00:30<00:40,  1.74it/s]
 68%|██████▊   | 146/216 [00:30<00:32,  2.16it/s]
 68%|██████▊   | 147/216 [00:31<00:26,  2.62it/s]
 69%|██████▊   | 148/216 [00:31<00:22,  3.08it/s]
 69%|██████▉   | 149/216 [00:31<00:19,  3.52it/s]
 69%|██████▉   | 150/216 [00:31<00:16,  3.89it/s]
 70%|██████▉   | 151/216 [00:31<00:15,  4.19it/s]


== Status ==
Current time: 2024-03-07 21:40:44 (running for 00:15:34.05)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (2 PENDING, 1 RUNNING, 12 TERMINATED)
+------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc              |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                  |                 |                    |                ch_size |                |             |
|------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00012 | RUNNING    | 172.19.0.1:10928 |     3.29276e-

 70%|███████   | 152/216 [00:32<00:14,  4.45it/s]
 71%|███████   | 153/216 [00:32<00:13,  4.65it/s]
 71%|███████▏  | 154/216 [00:32<00:12,  4.81it/s]
 72%|███████▏  | 155/216 [00:32<00:12,  4.92it/s]
 72%|███████▏  | 156/216 [00:32<00:12,  4.96it/s]
 73%|███████▎  | 157/216 [00:33<00:11,  5.03it/s]
 73%|███████▎  | 158/216 [00:33<00:11,  5.06it/s]
 74%|███████▎  | 159/216 [00:33<00:11,  5.09it/s]
 74%|███████▍  | 160/216 [00:33<00:10,  5.12it/s]
 75%|███████▍  | 161/216 [00:33<00:10,  5.12it/s]
 75%|███████▌  | 162/216 [00:34<00:10,  5.13it/s]
 75%|███████▌  | 163/216 [00:34<00:10,  5.15it/s]
 76%|███████▌  | 164/216 [00:34<00:10,  5.17it/s]
 76%|███████▋  | 165/216 [00:34<00:09,  5.19it/s]
 77%|███████▋  | 166/216 [00:34<00:09,  5.18it/s]
 77%|███████▋  | 167/216 [00:34<00:09,  5.18it/s]
 78%|███████▊  | 168/216 [00:35<00:09,  5.18it/s]
 78%|███████▊  | 169/216 [00:35<00:09,  5.18it/s]
 79%|███████▊  | 170/216 [00:35<00:08,  5.19it/s]
 79%|███████▉  | 171/216 [00:35<00:08,  5.18it/s]


== Status ==
Current time: 2024-03-07 21:40:50 (running for 00:15:39.09)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (2 PENDING, 1 RUNNING, 12 TERMINATED)
+------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc              |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                  |                 |                    |                ch_size |                |             |
|------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00012 | RUNNING    | 172.19.0.1:10928 |     3.29276e-

 83%|████████▎ | 179/216 [00:37<00:07,  5.19it/s]
 83%|████████▎ | 180/216 [00:37<00:06,  5.18it/s]
 84%|████████▍ | 181/216 [00:37<00:06,  5.19it/s]
 84%|████████▍ | 182/216 [00:37<00:06,  5.18it/s]
 85%|████████▍ | 183/216 [00:38<00:06,  5.19it/s]
 85%|████████▌ | 184/216 [00:38<00:06,  5.20it/s]
 86%|████████▌ | 185/216 [00:38<00:05,  5.20it/s]
 86%|████████▌ | 186/216 [00:38<00:05,  5.19it/s]
 87%|████████▋ | 187/216 [00:38<00:05,  5.15it/s]
 87%|████████▋ | 188/216 [00:39<00:05,  5.16it/s]
 88%|████████▊ | 189/216 [00:39<00:05,  5.17it/s]
 88%|████████▊ | 190/216 [00:39<00:05,  5.17it/s]
 88%|████████▊ | 191/216 [00:39<00:04,  5.17it/s]
 89%|████████▉ | 192/216 [00:39<00:04,  5.16it/s]
 89%|████████▉ | 193/216 [00:40<00:04,  5.18it/s]
 90%|████████▉ | 194/216 [00:40<00:04,  5.19it/s]
 90%|█████████ | 195/216 [00:40<00:04,  5.20it/s]
 91%|█████████ | 196/216 [00:40<00:03,  5.20it/s]
 91%|█████████ | 197/216 [00:40<00:03,  5.20it/s]
 92%|█████████▏| 198/216 [00:40<00:03,  5.18it/s]


== Status ==
Current time: 2024-03-07 21:40:55 (running for 00:15:44.14)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (2 PENDING, 1 RUNNING, 12 TERMINATED)
+------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc              |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                  |                 |                    |                ch_size |                |             |
|------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00012 | RUNNING    | 172.19.0.1:10928 |     3.29276e-

 95%|█████████▌| 206/216 [00:42<00:01,  5.13it/s]
 96%|█████████▌| 207/216 [00:42<00:01,  5.15it/s]
 96%|█████████▋| 208/216 [00:42<00:01,  5.15it/s]
 97%|█████████▋| 209/216 [00:43<00:01,  5.17it/s]
 97%|█████████▋| 210/216 [00:43<00:01,  5.17it/s]
 98%|█████████▊| 211/216 [00:43<00:00,  5.18it/s]
 98%|█████████▊| 212/216 [00:43<00:00,  5.19it/s]
 99%|█████████▊| 213/216 [00:43<00:00,  5.18it/s]
 99%|█████████▉| 214/216 [00:44<00:00,  5.19it/s]
100%|█████████▉| 215/216 [00:44<00:00,  5.20it/s]
100%|██████████| 216/216 [00:44<00:00,  5.50it/s]
[36m(_objective pid=10928)[0m 
  0%|          | 0/5 [00:00<?, ?it/s][A
[36m(_objective pid=10928)[0m 
 40%|████      | 2/5 [00:00<00:00,  7.46it/s][A
[36m(_objective pid=10928)[0m 
 60%|██████    | 3/5 [00:00<00:00,  5.34it/s][A
[36m(_objective pid=10928)[0m 
 80%|████████  | 4/5 [00:00<00:00,  4.65it/s][A
[36m(_objective pid=10928)[0m 
                                                 
100%|██████████| 216/216 [00:45<00:00,  5.50it/

[36m(_objective pid=10928)[0m {'eval_loss': 0.6876307129859924, 'eval_accuracy': 0.5949367088607594, 'eval_runtime': 1.3003, 'eval_samples_per_second': 60.756, 'eval_steps_per_second': 3.845, 'epoch': 3.0}
[36m(_objective pid=10928)[0m {'train_runtime': 45.7266, 'train_samples_per_second': 18.829, 'train_steps_per_second': 4.724, 'train_loss': 0.6871809782805266, 'epoch': 3.0}
== Status ==
Current time: 2024-03-07 21:41:00 (running for 00:15:49.15)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (2 PENDING, 13 TERMINATED)
+------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc              |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|      

[36m(_objective pid=11103)[0m 2024-03-07 21:41:04.700186: E external/local_xla/xla/stream_executor/cuda/cuda_dnn.cc:9261] Unable to register cuDNN factory: Attempting to register factory for plugin cuDNN when one has already been registered
[36m(_objective pid=11103)[0m 2024-03-07 21:41:04.700239: E external/local_xla/xla/stream_executor/cuda/cuda_fft.cc:607] Unable to register cuFFT factory: Attempting to register factory for plugin cuFFT when one has already been registered
[36m(_objective pid=11103)[0m 2024-03-07 21:41:04.701475: E external/local_xla/xla/stream_executor/cuda/cuda_blas.cc:1515] Unable to register cuBLAS factory: Attempting to register factory for plugin cuBLAS when one has already been registered


== Status ==
Current time: 2024-03-07 21:41:05 (running for 00:15:54.25)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (1 PENDING, 1 RUNNING, 13 TERMINATED)
+------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc              |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                  |                 |                    |                ch_size |                |             |
|------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00013 | RUNNING    | 172.19.0.1:11103 |     1.24e-05 

[36m(_objective pid=11103)[0m Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']
[36m(_objective pid=11103)[0m You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.
  0%|          | 0/72 [00:00<?, ?it/s]
  1%|▏         | 1/72 [00:00<00:28,  2.46it/s]
  3%|▎         | 2/72 [00:00<00:19,  3.67it/s]
  4%|▍         | 3/72 [00:00<00:16,  4.23it/s]
  6%|▌         | 4/72 [00:00<00:14,  4.57it/s]
  7%|▋         | 5/72 [00:01<00:13,  4.79it/s]
  8%|▊         | 6/72 [00:01<00:13,  4.90it/s]
 10%|▉         | 7/72 [00:01<00:12,  5.01it/s]
 11%|█         | 8/72 [00:01<00:12,  5.03it/s]
 12%|█▎        | 9/72 [00:01<00:12,  5.08it/s]
 14%|█▍        | 10/72 [00:02<00:12,  5.11it/s]


== Status ==
Current time: 2024-03-07 21:41:10 (running for 00:15:59.28)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (1 PENDING, 1 RUNNING, 13 TERMINATED)
+------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc              |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                  |                 |                    |                ch_size |                |             |
|------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00013 | RUNNING    | 172.19.0.1:11103 |     1.24e-05 

 15%|█▌        | 11/72 [00:02<00:11,  5.14it/s]
 17%|█▋        | 12/72 [00:02<00:11,  5.16it/s]
 18%|█▊        | 13/72 [00:02<00:11,  5.16it/s]
 19%|█▉        | 14/72 [00:02<00:11,  5.17it/s]
 21%|██        | 15/72 [00:03<00:10,  5.18it/s]
 22%|██▏       | 16/72 [00:03<00:10,  5.19it/s]
 24%|██▎       | 17/72 [00:03<00:10,  5.20it/s]
 25%|██▌       | 18/72 [00:03<00:10,  5.20it/s]
 26%|██▋       | 19/72 [00:03<00:10,  5.19it/s]
 28%|██▊       | 20/72 [00:04<00:10,  5.17it/s]
 29%|██▉       | 21/72 [00:04<00:09,  5.17it/s]
 31%|███       | 22/72 [00:04<00:09,  5.17it/s]
 32%|███▏      | 23/72 [00:04<00:09,  5.17it/s]
 33%|███▎      | 24/72 [00:04<00:09,  5.17it/s]
 35%|███▍      | 25/72 [00:05<00:09,  5.17it/s]
 36%|███▌      | 26/72 [00:05<00:08,  5.15it/s]
 38%|███▊      | 27/72 [00:05<00:08,  5.17it/s]
 39%|███▉      | 28/72 [00:05<00:08,  5.18it/s]
 40%|████      | 29/72 [00:05<00:08,  5.17it/s]
 42%|████▏     | 30/72 [00:05<00:08,  5.18it/s]
 43%|████▎     | 31/72 [00:06<00:07,  5.

== Status ==
Current time: 2024-03-07 21:41:15 (running for 00:16:04.32)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (1 PENDING, 1 RUNNING, 13 TERMINATED)
+------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc              |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                  |                 |                    |                ch_size |                |             |
|------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00013 | RUNNING    | 172.19.0.1:11103 |     1.24e-05 

 51%|█████▏    | 37/72 [00:07<00:06,  5.17it/s]
 53%|█████▎    | 38/72 [00:07<00:06,  5.16it/s]
 54%|█████▍    | 39/72 [00:07<00:06,  5.14it/s]
 56%|█████▌    | 40/72 [00:07<00:06,  5.15it/s]
 57%|█████▋    | 41/72 [00:08<00:05,  5.17it/s]
 58%|█████▊    | 42/72 [00:08<00:05,  5.18it/s]
 60%|█████▉    | 43/72 [00:08<00:05,  5.20it/s]
 61%|██████    | 44/72 [00:08<00:05,  5.18it/s]
 62%|██████▎   | 45/72 [00:08<00:05,  5.19it/s]
 64%|██████▍   | 46/72 [00:09<00:05,  5.19it/s]
 65%|██████▌   | 47/72 [00:09<00:04,  5.20it/s]
 67%|██████▋   | 48/72 [00:09<00:04,  5.21it/s]
 68%|██████▊   | 49/72 [00:09<00:04,  5.20it/s]
 69%|██████▉   | 50/72 [00:09<00:04,  5.17it/s]
 71%|███████   | 51/72 [00:10<00:04,  5.17it/s]
 72%|███████▏  | 52/72 [00:10<00:03,  5.18it/s]
 74%|███████▎  | 53/72 [00:10<00:03,  5.18it/s]
 75%|███████▌  | 54/72 [00:10<00:03,  5.18it/s]
 76%|███████▋  | 55/72 [00:10<00:03,  5.17it/s]
 78%|███████▊  | 56/72 [00:11<00:03,  5.15it/s]
 79%|███████▉  | 57/72 [00:11<00:02,  5.

== Status ==
Current time: 2024-03-07 21:41:20 (running for 00:16:09.35)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (1 PENDING, 1 RUNNING, 13 TERMINATED)
+------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc              |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                  |                 |                    |                ch_size |                |             |
|------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00013 | RUNNING    | 172.19.0.1:11103 |     1.24e-05 

 88%|████████▊ | 63/72 [00:12<00:01,  5.19it/s]
 89%|████████▉ | 64/72 [00:12<00:01,  5.19it/s]
 90%|█████████ | 65/72 [00:12<00:01,  5.17it/s]
 92%|█████████▏| 66/72 [00:12<00:01,  5.18it/s]
 93%|█████████▎| 67/72 [00:13<00:00,  5.17it/s]
 94%|█████████▍| 68/72 [00:13<00:00,  5.16it/s]
 96%|█████████▌| 69/72 [00:13<00:00,  5.17it/s]
 97%|█████████▋| 70/72 [00:13<00:00,  5.17it/s]
 99%|█████████▊| 71/72 [00:13<00:00,  5.19it/s]
100%|██████████| 72/72 [00:14<00:00,  5.52it/s]
[36m(_objective pid=11103)[0m 
  0%|          | 0/5 [00:00<?, ?it/s][A
[36m(_objective pid=11103)[0m 
 40%|████      | 2/5 [00:00<00:00,  7.57it/s][A
[36m(_objective pid=11103)[0m 
 60%|██████    | 3/5 [00:00<00:00,  5.33it/s][A
[36m(_objective pid=11103)[0m 
 80%|████████  | 4/5 [00:00<00:00,  4.65it/s][A
[36m(_objective pid=11103)[0m 
                                               A
100%|██████████| 72/72 [00:15<00:00,  5.52it/s]
100%|██████████| 5/5 [00:01<00:00,  4.48it/s][A
100%|██████████| 72/7

[36m(_objective pid=11103)[0m {'eval_loss': 0.6880991458892822, 'eval_accuracy': 0.6075949367088608, 'eval_runtime': 1.2975, 'eval_samples_per_second': 60.886, 'eval_steps_per_second': 3.854, 'epoch': 1.0}
[36m(_objective pid=11103)[0m {'train_runtime': 15.376, 'train_samples_per_second': 18.665, 'train_steps_per_second': 4.683, 'train_loss': 0.6963202688429091, 'epoch': 1.0}
== Status ==
Current time: 2024-03-07 21:41:25 (running for 00:16:14.41)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (1 PENDING, 14 TERMINATED)
+------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc              |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|       

[36m(_objective pid=11212)[0m 2024-03-07 21:41:28.692800: E external/local_xla/xla/stream_executor/cuda/cuda_dnn.cc:9261] Unable to register cuDNN factory: Attempting to register factory for plugin cuDNN when one has already been registered
[36m(_objective pid=11212)[0m 2024-03-07 21:41:28.692854: E external/local_xla/xla/stream_executor/cuda/cuda_fft.cc:607] Unable to register cuFFT factory: Attempting to register factory for plugin cuFFT when one has already been registered
[36m(_objective pid=11212)[0m 2024-03-07 21:41:28.694181: E external/local_xla/xla/stream_executor/cuda/cuda_blas.cc:1515] Unable to register cuBLAS factory: Attempting to register factory for plugin cuBLAS when one has already been registered


== Status ==
Current time: 2024-03-07 21:41:30 (running for 00:16:19.47)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (1 RUNNING, 14 TERMINATED)
+------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc              |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                  |                 |                    |                ch_size |                |             |
|------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00014 | RUNNING    | 172.19.0.1:11212 |     3.5503e-05  |       

[36m(_objective pid=11212)[0m Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']
[36m(_objective pid=11212)[0m You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.
  0%|          | 0/216 [00:00<?, ?it/s]
  0%|          | 1/216 [00:00<01:22,  2.60it/s]
  1%|          | 2/216 [00:00<00:56,  3.81it/s]
  1%|▏         | 3/216 [00:00<00:49,  4.31it/s]
  2%|▏         | 4/216 [00:00<00:45,  4.62it/s]
  2%|▏         | 5/216 [00:01<00:43,  4.81it/s]
  3%|▎         | 6/216 [00:01<00:42,  4.93it/s]
  3%|▎         | 7/216 [00:01<00:41,  5.02it/s]
  4%|▎         | 8/216 [00:01<00:41,  5.07it/s]
  4%|▍         | 9/216 [00:01<00:40,  5.09it/s]
  5%|▍         | 10/216 [00:02<00:40,  5.12it/s]
  5%|▌         | 11/216 [00:02<00:39,  5.14it/s]
  6%|▌       

== Status ==
Current time: 2024-03-07 21:41:35 (running for 00:16:24.50)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (1 RUNNING, 14 TERMINATED)
+------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc              |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                  |                 |                    |                ch_size |                |             |
|------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00014 | RUNNING    | 172.19.0.1:11212 |     3.5503e-05  |       

  8%|▊         | 18/216 [00:03<00:38,  5.19it/s]
  9%|▉         | 19/216 [00:03<00:37,  5.19it/s]
  9%|▉         | 20/216 [00:04<00:37,  5.20it/s]
 10%|▉         | 21/216 [00:04<00:37,  5.19it/s]
 10%|█         | 22/216 [00:04<00:37,  5.20it/s]
 11%|█         | 23/216 [00:04<00:37,  5.19it/s]
 11%|█         | 24/216 [00:04<00:37,  5.16it/s]
 12%|█▏        | 25/216 [00:05<00:36,  5.17it/s]
 12%|█▏        | 26/216 [00:05<00:36,  5.17it/s]
 12%|█▎        | 27/216 [00:05<00:36,  5.17it/s]
 13%|█▎        | 28/216 [00:05<00:36,  5.17it/s]
 13%|█▎        | 29/216 [00:05<00:36,  5.17it/s]
 14%|█▍        | 30/216 [00:05<00:35,  5.18it/s]
 14%|█▍        | 31/216 [00:06<00:35,  5.20it/s]
 15%|█▍        | 32/216 [00:06<00:35,  5.20it/s]
 15%|█▌        | 33/216 [00:06<00:35,  5.19it/s]
 16%|█▌        | 34/216 [00:06<00:35,  5.18it/s]
 16%|█▌        | 35/216 [00:06<00:34,  5.19it/s]
 17%|█▋        | 36/216 [00:07<00:34,  5.19it/s]
 17%|█▋        | 37/216 [00:07<00:34,  5.19it/s]
 18%|█▊        | 38/

== Status ==
Current time: 2024-03-07 21:41:40 (running for 00:16:29.53)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (1 RUNNING, 14 TERMINATED)
+------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc              |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                  |                 |                    |                ch_size |                |             |
|------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00014 | RUNNING    | 172.19.0.1:11212 |     3.5503e-05  |       

 21%|██        | 45/216 [00:08<00:33,  5.17it/s]
 21%|██▏       | 46/216 [00:09<00:32,  5.18it/s]
 22%|██▏       | 47/216 [00:09<00:32,  5.19it/s]
 22%|██▏       | 48/216 [00:09<00:32,  5.20it/s]
 23%|██▎       | 49/216 [00:09<00:32,  5.20it/s]
 23%|██▎       | 50/216 [00:09<00:32,  5.18it/s]
 24%|██▎       | 51/216 [00:10<00:31,  5.18it/s]
 24%|██▍       | 52/216 [00:10<00:31,  5.19it/s]
 25%|██▍       | 53/216 [00:10<00:31,  5.19it/s]
 25%|██▌       | 54/216 [00:10<00:31,  5.19it/s]
 25%|██▌       | 55/216 [00:10<00:31,  5.17it/s]
 26%|██▌       | 56/216 [00:10<00:30,  5.17it/s]
 26%|██▋       | 57/216 [00:11<00:30,  5.18it/s]
 27%|██▋       | 58/216 [00:11<00:30,  5.19it/s]
 27%|██▋       | 59/216 [00:11<00:30,  5.20it/s]
 28%|██▊       | 60/216 [00:11<00:30,  5.18it/s]
 28%|██▊       | 61/216 [00:11<00:29,  5.19it/s]
 29%|██▊       | 62/216 [00:12<00:29,  5.18it/s]
 29%|██▉       | 63/216 [00:12<00:29,  5.19it/s]
 30%|██▉       | 64/216 [00:12<00:29,  5.20it/s]
 30%|███       | 65/

== Status ==
Current time: 2024-03-07 21:41:45 (running for 00:16:34.56)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (1 RUNNING, 14 TERMINATED)
+------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc              |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                  |                 |                    |                ch_size |                |             |
|------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00014 | RUNNING    | 172.19.0.1:11212 |     3.5503e-05  |       

 32%|███▏      | 70/216 [00:13<00:28,  5.18it/s]
 33%|███▎      | 71/216 [00:13<00:28,  5.17it/s]
 33%|███▎      | 72/216 [00:14<00:26,  5.50it/s]
[36m(_objective pid=11212)[0m 
  0%|          | 0/5 [00:00<?, ?it/s][A
[36m(_objective pid=11212)[0m 
 40%|████      | 2/5 [00:00<00:00,  7.49it/s][A
[36m(_objective pid=11212)[0m 
 60%|██████    | 3/5 [00:00<00:00,  5.34it/s][A
[36m(_objective pid=11212)[0m 
 80%|████████  | 4/5 [00:00<00:00,  4.67it/s][A


[36m(_objective pid=11212)[0m {'eval_loss': 0.6530306935310364, 'eval_accuracy': 0.6075949367088608, 'eval_runtime': 1.2979, 'eval_samples_per_second': 60.866, 'eval_steps_per_second': 3.852, 'epoch': 1.0}


[36m(_objective pid=11212)[0m 
                                                
 33%|███▎      | 72/216 [00:15<00:26,  5.50it/s]
100%|██████████| 5/5 [00:01<00:00,  4.49it/s][A
                                             [A
 34%|███▍      | 73/216 [00:15<01:22,  1.73it/s]
 34%|███▍      | 74/216 [00:15<01:06,  2.15it/s]
 35%|███▍      | 75/216 [00:15<00:54,  2.61it/s]
 35%|███▌      | 76/216 [00:16<00:45,  3.07it/s]
 36%|███▌      | 77/216 [00:16<00:39,  3.50it/s]
 36%|███▌      | 78/216 [00:16<00:35,  3.86it/s]
 37%|███▋      | 79/216 [00:16<00:33,  4.14it/s]
 37%|███▋      | 80/216 [00:16<00:30,  4.39it/s]
 38%|███▊      | 81/216 [00:17<00:29,  4.59it/s]
 38%|███▊      | 82/216 [00:17<00:28,  4.76it/s]
 38%|███▊      | 83/216 [00:17<00:27,  4.88it/s]
 39%|███▉      | 84/216 [00:17<00:26,  4.96it/s]
 39%|███▉      | 85/216 [00:17<00:26,  5.01it/s]
 40%|███▉      | 86/216 [00:18<00:25,  5.07it/s]
 40%|████      | 87/216 [00:18<00:25,  5.11it/s]
 41%|████      | 88/216 [00:18<00:24

== Status ==
Current time: 2024-03-07 21:41:50 (running for 00:16:39.61)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (1 RUNNING, 14 TERMINATED)
+------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc              |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                  |                 |                    |                ch_size |                |             |
|------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00014 | RUNNING    | 172.19.0.1:11212 |     3.5503e-05  |       

 41%|████      | 89/216 [00:18<00:24,  5.17it/s]
 42%|████▏     | 90/216 [00:18<00:24,  5.16it/s]
 42%|████▏     | 91/216 [00:19<00:24,  5.17it/s]
 43%|████▎     | 92/216 [00:19<00:23,  5.18it/s]
 43%|████▎     | 93/216 [00:19<00:23,  5.17it/s]
 44%|████▎     | 94/216 [00:19<00:23,  5.17it/s]
 44%|████▍     | 95/216 [00:19<00:23,  5.15it/s]
 44%|████▍     | 96/216 [00:19<00:23,  5.16it/s]
 45%|████▍     | 97/216 [00:20<00:22,  5.17it/s]
 45%|████▌     | 98/216 [00:20<00:22,  5.18it/s]
 46%|████▌     | 99/216 [00:20<00:22,  5.19it/s]
 46%|████▋     | 100/216 [00:20<00:22,  5.18it/s]
 47%|████▋     | 101/216 [00:20<00:22,  5.19it/s]
 47%|████▋     | 102/216 [00:21<00:21,  5.20it/s]
 48%|████▊     | 103/216 [00:21<00:21,  5.19it/s]
 48%|████▊     | 104/216 [00:21<00:21,  5.20it/s]
 49%|████▊     | 105/216 [00:21<00:21,  5.20it/s]
 49%|████▉     | 106/216 [00:21<00:21,  5.17it/s]
 50%|████▉     | 107/216 [00:22<00:21,  5.18it/s]
 50%|█████     | 108/216 [00:22<00:20,  5.17it/s]
 50%|█████ 

== Status ==
Current time: 2024-03-07 21:41:55 (running for 00:16:44.65)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (1 RUNNING, 14 TERMINATED)
+------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc              |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                  |                 |                    |                ch_size |                |             |
|------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00014 | RUNNING    | 172.19.0.1:11212 |     3.5503e-05  |       

 53%|█████▎    | 115/216 [00:23<00:19,  5.16it/s]
 54%|█████▎    | 116/216 [00:23<00:19,  5.15it/s]
 54%|█████▍    | 117/216 [00:24<00:19,  5.18it/s]
 55%|█████▍    | 118/216 [00:24<00:19,  5.13it/s]
 55%|█████▌    | 119/216 [00:24<00:18,  5.15it/s]
 56%|█████▌    | 120/216 [00:24<00:18,  5.17it/s]
 56%|█████▌    | 121/216 [00:24<00:18,  5.16it/s]
 56%|█████▋    | 122/216 [00:25<00:18,  5.17it/s]
 57%|█████▋    | 123/216 [00:25<00:17,  5.17it/s]
 57%|█████▋    | 124/216 [00:25<00:17,  5.17it/s]
 58%|█████▊    | 125/216 [00:25<00:17,  5.17it/s]
 58%|█████▊    | 126/216 [00:25<00:17,  5.15it/s]
 59%|█████▉    | 127/216 [00:25<00:17,  5.17it/s]
 59%|█████▉    | 128/216 [00:26<00:16,  5.19it/s]
 60%|█████▉    | 129/216 [00:26<00:16,  5.20it/s]
 60%|██████    | 130/216 [00:26<00:16,  5.20it/s]
 61%|██████    | 131/216 [00:26<00:16,  5.19it/s]
 61%|██████    | 132/216 [00:26<00:16,  5.18it/s]
 62%|██████▏   | 133/216 [00:27<00:15,  5.19it/s]
 62%|██████▏   | 134/216 [00:27<00:15,  5.19it/s]


== Status ==
Current time: 2024-03-07 21:42:00 (running for 00:16:49.68)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (1 RUNNING, 14 TERMINATED)
+------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc              |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                  |                 |                    |                ch_size |                |             |
|------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00014 | RUNNING    | 172.19.0.1:11212 |     3.5503e-05  |       

 65%|██████▌   | 141/216 [00:28<00:14,  5.18it/s]
 66%|██████▌   | 142/216 [00:28<00:14,  5.17it/s]
 66%|██████▌   | 143/216 [00:29<00:14,  5.19it/s]
 67%|██████▋   | 144/216 [00:29<00:13,  5.51it/s]
[36m(_objective pid=11212)[0m 
  0%|          | 0/5 [00:00<?, ?it/s][A
[36m(_objective pid=11212)[0m 
 40%|████      | 2/5 [00:00<00:00,  7.47it/s][A
[36m(_objective pid=11212)[0m 
 60%|██████    | 3/5 [00:00<00:00,  5.35it/s][A
[36m(_objective pid=11212)[0m 
 80%|████████  | 4/5 [00:00<00:00,  4.67it/s][A


[36m(_objective pid=11212)[0m {'eval_loss': 0.7429614663124084, 'eval_accuracy': 0.5063291139240507, 'eval_runtime': 1.2968, 'eval_samples_per_second': 60.921, 'eval_steps_per_second': 3.856, 'epoch': 2.0}


[36m(_objective pid=11212)[0m 
                                                 
 67%|██████▋   | 144/216 [00:30<00:13,  5.51it/s]
100%|██████████| 5/5 [00:01<00:00,  4.49it/s][A
                                             [A
 67%|██████▋   | 145/216 [00:30<00:40,  1.73it/s]
 68%|██████▊   | 146/216 [00:30<00:32,  2.16it/s]
 68%|██████▊   | 147/216 [00:31<00:26,  2.61it/s]
 69%|██████▊   | 148/216 [00:31<00:22,  3.07it/s]
 69%|██████▉   | 149/216 [00:31<00:19,  3.49it/s]
 69%|██████▉   | 150/216 [00:31<00:17,  3.86it/s]
 70%|██████▉   | 151/216 [00:31<00:15,  4.17it/s]
 70%|███████   | 152/216 [00:32<00:14,  4.43it/s]
 71%|███████   | 153/216 [00:32<00:13,  4.63it/s]
 71%|███████▏  | 154/216 [00:32<00:12,  4.79it/s]
 72%|███████▏  | 155/216 [00:32<00:12,  4.90it/s]
 72%|███████▏  | 156/216 [00:32<00:12,  4.97it/s]
 73%|███████▎  | 157/216 [00:33<00:11,  5.05it/s]
 73%|███████▎  | 158/216 [00:33<00:11,  5.10it/s]
 74%|███████▎  | 159/216 [00:33<00:11,  5.13it/s]
 74%|███████▍  | 16

== Status ==
Current time: 2024-03-07 21:42:05 (running for 00:16:54.70)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (1 RUNNING, 14 TERMINATED)
+------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc              |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                  |                 |                    |                ch_size |                |             |
|------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00014 | RUNNING    | 172.19.0.1:11212 |     3.5503e-05  |       

 75%|███████▍  | 161/216 [00:33<00:10,  5.13it/s]
 75%|███████▌  | 162/216 [00:34<00:10,  5.15it/s]
 75%|███████▌  | 163/216 [00:34<00:10,  5.15it/s]
 76%|███████▌  | 164/216 [00:34<00:10,  5.16it/s]
 76%|███████▋  | 165/216 [00:34<00:09,  5.16it/s]
 77%|███████▋  | 166/216 [00:34<00:09,  5.14it/s]
 77%|███████▋  | 167/216 [00:34<00:09,  5.15it/s]
 78%|███████▊  | 168/216 [00:35<00:09,  5.16it/s]
 78%|███████▊  | 169/216 [00:35<00:09,  5.18it/s]
 79%|███████▊  | 170/216 [00:35<00:08,  5.19it/s]
 79%|███████▉  | 171/216 [00:35<00:08,  5.18it/s]
 80%|███████▉  | 172/216 [00:35<00:08,  5.19it/s]
 80%|████████  | 173/216 [00:36<00:08,  5.19it/s]
 81%|████████  | 174/216 [00:36<00:08,  5.20it/s]
 81%|████████  | 175/216 [00:36<00:07,  5.20it/s]
 81%|████████▏ | 176/216 [00:36<00:07,  5.19it/s]
 82%|████████▏ | 177/216 [00:36<00:07,  5.17it/s]
 82%|████████▏ | 178/216 [00:37<00:07,  5.17it/s]
 83%|████████▎ | 179/216 [00:37<00:07,  5.16it/s]
 83%|████████▎ | 180/216 [00:37<00:06,  5.17it/s]


== Status ==
Current time: 2024-03-07 21:42:10 (running for 00:16:59.73)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (1 RUNNING, 14 TERMINATED)
+------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc              |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                  |                 |                    |                ch_size |                |             |
|------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00014 | RUNNING    | 172.19.0.1:11212 |     3.5503e-05  |       

 87%|████████▋ | 188/216 [00:39<00:05,  5.19it/s]
 88%|████████▊ | 189/216 [00:39<00:05,  5.20it/s]
 88%|████████▊ | 190/216 [00:39<00:05,  5.19it/s]
 88%|████████▊ | 191/216 [00:39<00:04,  5.17it/s]
 89%|████████▉ | 192/216 [00:39<00:04,  5.14it/s]
 89%|████████▉ | 193/216 [00:40<00:04,  5.15it/s]
 90%|████████▉ | 194/216 [00:40<00:04,  5.17it/s]
 90%|█████████ | 195/216 [00:40<00:04,  5.17it/s]
 91%|█████████ | 196/216 [00:40<00:03,  5.17it/s]
 91%|█████████ | 197/216 [00:40<00:03,  5.14it/s]
 92%|█████████▏| 198/216 [00:40<00:03,  5.16it/s]
 92%|█████████▏| 199/216 [00:41<00:03,  5.18it/s]
 93%|█████████▎| 200/216 [00:41<00:03,  5.19it/s]
 93%|█████████▎| 201/216 [00:41<00:02,  5.13it/s]
 94%|█████████▎| 202/216 [00:41<00:02,  5.13it/s]
 94%|█████████▍| 203/216 [00:41<00:02,  5.14it/s]
 94%|█████████▍| 204/216 [00:42<00:02,  5.16it/s]
 95%|█████████▍| 205/216 [00:42<00:02,  5.18it/s]
 95%|█████████▌| 206/216 [00:42<00:01,  5.18it/s]
 96%|█████████▌| 207/216 [00:42<00:01,  5.18it/s]


== Status ==
Current time: 2024-03-07 21:42:15 (running for 00:17:04.77)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (1 RUNNING, 14 TERMINATED)
+------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc              |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                  |                 |                    |                ch_size |                |             |
|------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00014 | RUNNING    | 172.19.0.1:11212 |     3.5503e-05  |       

 99%|█████████▉| 214/216 [00:44<00:00,  5.17it/s]
100%|█████████▉| 215/216 [00:44<00:00,  5.18it/s]
100%|██████████| 216/216 [00:44<00:00,  5.50it/s]
[36m(_objective pid=11212)[0m 
  0%|          | 0/5 [00:00<?, ?it/s][A
[36m(_objective pid=11212)[0m 
 40%|████      | 2/5 [00:00<00:00,  7.58it/s][A
[36m(_objective pid=11212)[0m 
 60%|██████    | 3/5 [00:00<00:00,  5.39it/s][A
[36m(_objective pid=11212)[0m 
 80%|████████  | 4/5 [00:00<00:00,  4.69it/s][A
2024-03-07 21:42:17,618	INFO tune.py:1042 -- Total run time: 1026.73 seconds (1026.69 seconds for the tuning loop).


== Status ==
Current time: 2024-03-07 21:42:17 (running for 00:17:06.69)
Using FIFO scheduling algorithm.
Logical resource usage: 1.0/12 CPUs, 1.0/1 GPUs (0.0/1.0 accelerator_type:G)
Result logdir: /home/ai/ray_results/_objective_2024-03-07_21-25-10
Number of trials: 15/15 (15 TERMINATED)
+------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------+
| Trial name             | status     | loc              |   learning_rate |   num_train_epochs |   per_device_train_bat |   weight_decay |   objective |
|                        |            |                  |                 |                    |                ch_size |                |             |
|------------------------+------------+------------------+-----------------+--------------------+------------------------+----------------+-------------|
| _objective_d78da_00000 | TERMINATED | 172.19.0.1:7911  |     5.61152e-06 |                  

In [15]:
best_trial

BestRun(run_id='d78da_00001', objective=0.6582278481012658, hyperparameters={'learning_rate': 1.5751320499779757e-05, 'per_device_train_batch_size': 8, 'num_train_epochs': 3, 'weight_decay': 0.00029375384576328336}, run_summary=<ray.tune.analysis.experiment_analysis.ExperimentAnalysis object at 0x74c6d2530690>)

In [10]:

train_dataset = tokenized_datasets["train"]
eval_dataset = tokenized_datasets["test"]
val_dataset = tokenized_datasets["validation"]
trainer = Trainer(
model=model,
args=training_args,
train_dataset=train_dataset,
eval_dataset=eval_dataset,
compute_metrics=lambda p: {"accuracy": accuracy_score(p.label_ids,
np.argmax(p.predictions,
axis=1))}
)

In [17]:
for n, v in best_trial.hyperparameters.items():
    setattr(trainer.args, n, v)



In [18]:
trainer.args

TrainingArguments(
_n_gpu=1,
accelerator_config={'split_batches': False, 'dispatch_batches': None, 'even_batches': True, 'use_seedable_sampler': True},
adafactor=False,
adam_beta1=0.9,
adam_beta2=0.999,
adam_epsilon=1e-08,
auto_find_batch_size=False,
bf16=False,
bf16_full_eval=False,
data_seed=None,
dataloader_drop_last=False,
dataloader_num_workers=0,
dataloader_persistent_workers=False,
dataloader_pin_memory=True,
dataloader_prefetch_factor=None,
ddp_backend=None,
ddp_broadcast_buffers=None,
ddp_bucket_cap_mb=None,
ddp_find_unused_parameters=None,
ddp_timeout=1800,
debug=[],
deepspeed=None,
disable_tqdm=False,
dispatch_batches=None,
do_eval=True,
do_predict=False,
do_train=False,
eval_accumulation_steps=None,
eval_delay=0,
eval_steps=None,
evaluation_strategy=IntervalStrategy.EPOCH,
fp16=False,
fp16_backend=auto,
fp16_full_eval=False,
fp16_opt_level=O1,
fsdp=[],
fsdp_config={'min_num_params': 0, 'xla': False, 'xla_fsdp_v2': False, 'xla_fsdp_grad_ckpt': False},
fsdp_min_num_params=0,


In [12]:
trainer.train()

Epoch,Training Loss,Validation Loss,Accuracy
1,No log,0.741511,0.552296
2,0.642800,0.634758,0.668367
3,0.463000,0.678941,0.668367


TrainOutput(global_step=1074, training_loss=0.5406307739030494, metrics={'train_runtime': 896.7936, 'train_samples_per_second': 9.574, 'train_steps_per_second': 1.198, 'total_flos': 205189101711360.0, 'train_loss': 0.5406307739030494, 'epoch': 3.0})

In [13]:
trainer.save_model('/home/ai/Downloads/results/last-albert-tweet')

In [14]:
predictions = trainer.evaluate(train_dataset)
print(predictions)

{'eval_loss': 0.2967953383922577, 'eval_accuracy': 0.8881900768693222, 'eval_runtime': 110.7946, 'eval_samples_per_second': 25.832, 'eval_steps_per_second': 1.616, 'epoch': 3.0}


In [15]:
predictions = trainer.evaluate(eval_dataset)
print(predictions)

{'eval_loss': 0.6789411306381226, 'eval_accuracy': 0.6683673469387755, 'eval_runtime': 30.2487, 'eval_samples_per_second': 25.918, 'eval_steps_per_second': 1.62, 'epoch': 3.0}


In [16]:
predictions = trainer.evaluate(val_dataset)
print(predictions)

{'eval_loss': 0.6768719553947449, 'eval_accuracy': 0.6827225130890052, 'eval_runtime': 36.7328, 'eval_samples_per_second': 25.999, 'eval_steps_per_second': 1.633, 'epoch': 3.0}


In [17]:
predictions = trainer.predict(val_dataset)

In [18]:
predictions.predictions

array([[ 1.2853796 , -0.9122284 ],
       [-0.9372214 ,  1.2442471 ],
       [-1.245657  ,  0.97064465],
       ...,
       [-0.94831693,  1.3448441 ],
       [-0.6246013 ,  0.45075762],
       [ 1.3422035 , -1.140004  ]], dtype=float32)

In [19]:
import torch 
predictions.predictions
pre = torch.argmax(torch.tensor(predictions.predictions), dim=1)

In [20]:
true_labels = val_dataset['label']
true_labels

[1,
 0,
 1,
 1,
 1,
 0,
 0,
 0,
 0,
 0,
 0,
 0,
 0,
 1,
 0,
 1,
 0,
 0,
 1,
 0,
 0,
 1,
 1,
 1,
 0,
 0,
 1,
 0,
 0,
 0,
 0,
 0,
 0,
 0,
 1,
 0,
 1,
 1,
 0,
 0,
 0,
 1,
 1,
 1,
 1,
 1,
 0,
 0,
 1,
 0,
 1,
 1,
 0,
 1,
 1,
 1,
 1,
 1,
 0,
 0,
 0,
 1,
 1,
 0,
 1,
 0,
 1,
 1,
 0,
 1,
 1,
 1,
 1,
 0,
 1,
 1,
 0,
 0,
 1,
 0,
 0,
 1,
 1,
 1,
 1,
 0,
 1,
 0,
 0,
 1,
 0,
 1,
 1,
 0,
 1,
 0,
 0,
 0,
 0,
 0,
 0,
 1,
 1,
 0,
 1,
 1,
 1,
 1,
 1,
 0,
 0,
 1,
 1,
 1,
 0,
 0,
 0,
 1,
 1,
 1,
 1,
 1,
 1,
 0,
 0,
 1,
 0,
 1,
 1,
 1,
 1,
 1,
 0,
 1,
 0,
 0,
 1,
 0,
 1,
 0,
 0,
 0,
 1,
 1,
 0,
 1,
 1,
 0,
 1,
 0,
 0,
 1,
 1,
 1,
 1,
 1,
 1,
 0,
 1,
 0,
 0,
 1,
 1,
 1,
 0,
 0,
 0,
 0,
 0,
 1,
 1,
 1,
 0,
 0,
 1,
 0,
 0,
 0,
 1,
 1,
 1,
 0,
 0,
 1,
 1,
 1,
 1,
 1,
 1,
 0,
 1,
 1,
 1,
 0,
 0,
 1,
 1,
 1,
 0,
 0,
 1,
 0,
 1,
 0,
 0,
 0,
 1,
 0,
 1,
 1,
 0,
 1,
 0,
 1,
 0,
 0,
 1,
 1,
 0,
 1,
 1,
 0,
 0,
 0,
 0,
 1,
 0,
 1,
 0,
 0,
 1,
 0,
 0,
 1,
 0,
 1,
 0,
 0,
 0,
 0,
 0,
 0,
 1,
 1,
 1,
 0,
 1,
 0,
 0,
 1,


In [21]:

from sklearn.metrics import confusion_matrix
# Generate predictions, then create and print the confusion matrix
confusion_mat = confusion_matrix(true_labels, pre)
print(confusion_mat)

[[352 147]
 [156 300]]


In [22]:
predictions = trainer.predict(train_dataset)

In [23]:
predictions.predictions

array([[-2.3708892 ,  2.2129304 ],
       [ 0.8304143 , -0.8120435 ],
       [-0.16447178,  0.35819685],
       ...,
       [ 1.3283876 , -0.7837455 ],
       [ 1.7066714 , -1.2829821 ],
       [-0.61844623,  0.29359883]], dtype=float32)

In [24]:
import torch 
predictions.predictions
pre = torch.argmax(torch.tensor(predictions.predictions), dim=1)
pre

tensor([1, 0, 1,  ..., 0, 0, 1])

In [25]:
true_labels = train_dataset['label']
true_labels

[1,
 0,
 1,
 1,
 1,
 1,
 0,
 1,
 1,
 1,
 0,
 0,
 1,
 1,
 0,
 0,
 1,
 0,
 1,
 0,
 0,
 0,
 0,
 1,
 0,
 1,
 1,
 1,
 1,
 1,
 0,
 1,
 1,
 1,
 1,
 0,
 1,
 0,
 1,
 0,
 0,
 1,
 0,
 0,
 1,
 0,
 1,
 0,
 0,
 1,
 1,
 1,
 0,
 0,
 0,
 0,
 1,
 0,
 0,
 0,
 0,
 1,
 0,
 0,
 1,
 1,
 0,
 0,
 0,
 0,
 1,
 1,
 0,
 0,
 0,
 1,
 1,
 1,
 0,
 0,
 1,
 1,
 1,
 0,
 1,
 1,
 1,
 0,
 0,
 0,
 0,
 1,
 0,
 1,
 0,
 1,
 0,
 0,
 0,
 1,
 0,
 1,
 0,
 1,
 1,
 1,
 1,
 0,
 0,
 0,
 0,
 1,
 0,
 1,
 0,
 1,
 1,
 1,
 1,
 1,
 0,
 1,
 1,
 0,
 1,
 1,
 0,
 0,
 0,
 1,
 1,
 1,
 1,
 0,
 0,
 0,
 1,
 0,
 0,
 0,
 0,
 1,
 1,
 1,
 0,
 0,
 0,
 1,
 0,
 0,
 0,
 0,
 1,
 1,
 1,
 1,
 1,
 1,
 1,
 1,
 0,
 0,
 1,
 0,
 1,
 1,
 1,
 1,
 1,
 0,
 1,
 1,
 1,
 1,
 0,
 1,
 0,
 0,
 1,
 1,
 0,
 0,
 1,
 1,
 1,
 0,
 1,
 1,
 1,
 1,
 1,
 0,
 0,
 0,
 0,
 0,
 0,
 1,
 0,
 1,
 0,
 1,
 0,
 0,
 0,
 0,
 1,
 0,
 1,
 1,
 0,
 0,
 0,
 0,
 0,
 0,
 1,
 0,
 0,
 0,
 1,
 0,
 0,
 0,
 0,
 0,
 0,
 0,
 1,
 1,
 0,
 0,
 0,
 1,
 1,
 1,
 0,
 0,
 1,
 1,
 1,
 0,
 1,
 1,
 1,
 0,
 1,
 0,
 0,
 0,


In [26]:

from sklearn.metrics import confusion_matrix
# Generate predictions, then create and print the confusion matrix
confusion_mat = confusion_matrix(true_labels, pre)
print(confusion_mat)

[[1281  136]
 [ 184 1261]]


In [20]:
import random
import torch
num_examples = 10
picks = []
lable = []
input = []
prediction = [] 
for i in range(num_examples):
        pick = random.randint(0, len(dataset['validation'])-1)
        while pick in picks:
            pick = random.randint(0, len(dataset)-1)
        picks.append(pick)
        input.append(dataset['validation'][picks[i]]['text'])
        #input_token = tokenizer(dataset['validation'][picks[i]]['text'])
        lable.append(dataset['validation'][picks[i]]['label'])
        encoded_input = tokenizer(dataset['validation'][pick]['text'],return_tensors='pt').to(model.device)
        prediction.append(torch.argmax(trainer.model.forward(**encoded_input).logits, dim=1)[0].cpu().item())
    
    
    


In [21]:
print(input)
print(lable,"lable")
print(prediction,"prediction")



["I bet I'm the first to use that one", 'Chenua Achebe - when things fall apart', '@user @user the upper deck definitely seemed like Philly South.', '@user COD AW SERVERS #OFFLINE', 'My year is ending perfectly😂', "I don't know why it's so fun, but it is. cx I could probably think and find out, but yeah. No. xD", 'Thanks for the AWESOME support on our #instagram page. Much appreciated. #women #motivation #rolemode', 'Now i officially look single. Ha the', 'Porygon2 #are  found in the www.monstermmorpg. com #wild. bulbiest follow @user #working', '@user @user @user @user the Jets have pick 6 in the 2015 draft the irony blows my mind!  #NFLDraft']
[1, 0, 0, 0, 1, 0, 0, 1, 0, 1] lable
[0, 0, 1, 1, 1, 1, 1, 1, 0, 1] prediction
