In [1]:
from ray import tune

In [2]:
from pathlib import Path
from mltrainer import ReportTypes


def train_rnn_with_attention_ray(config):
    import sys
    sys.path.append("/home/azureuser/machinelearning-melissa/networks")
    
    import torch
    from torch import optim
    from ray import tune
    from RNN import RecurrentNeuralNetworkWithAttention, ModelConfig
    from mltrainer import Trainer, TrainerSettings
    from mads_datasets import DatasetFactoryProvider, DatasetType
    from mltrainer.preprocessors import PaddedPreprocessor
    from mltrainer.metrics import Accuracy

    accuracy = Accuracy()
    loss_fn = torch.nn.CrossEntropyLoss()

    # Data
    factory = DatasetFactoryProvider.create_factory(DatasetType.GESTURES)
    preprocessor = PaddedPreprocessor()
    streamers = factory.create_datastreamer(batchsize=32, preprocessor=preprocessor)
    train = streamers["train"]
    valid = streamers["valid"]

    trainstreamer = train.stream()
    validstreamer = valid.stream()

    # Model
    model_config = ModelConfig(
        input_size=3,
        hidden_size=config["hidden_size"],
        num_layers=config["num_layers"],
        output_size=20,
        dropout=config["dropout"]
    )

    model = RecurrentNeuralNetworkWithAttention(model_config)

    settings = TrainerSettings(
        epochs=10, 
        metrics=[accuracy],
        train_steps=len(train),
        logdir=Path("ray_logs"),
        valid_steps=len(valid),
        reporttypes=[ReportTypes.TOML, ReportTypes.TENSORBOARD],
        earlystop_kwargs = {
            "save": False, # save every best model, and restore the best one
            "verbose": True,
            "patience": 5, # number of epochs with no improvement after which training will be stopped
        }
    )

    trainer = Trainer(
        model=model,
        settings=settings,
        loss_fn=loss_fn,
        optimizer=optim.Adam,
        traindataloader=trainstreamer,
        validdataloader=validstreamer,
        scheduler=optim.lr_scheduler.ReduceLROnPlateau,
    )

    trainer.loop()
    metrics, test_loss = trainer.evalbatches()
    print("!!!!!!!!!!!!!! DEBUG metrics dict:", metrics)
    tune.report(metrics=metrics)

In [3]:
search_space = {
    "hidden_size": tune.choice([64, 128, 256, 512]),
    "num_layers": tune.choice([1, 2, 3,4, 5]),
    "dropout": tune.uniform(0.0, 0.5),
    "lr": tune.loguniform(1e-4, 1e-2),
}

In [4]:
from ray.tune import CLIReporter
from ray.tune.schedulers import ASHAScheduler

scheduler = ASHAScheduler(
    metric="Accuracy",  # of "accuracy" als je dat logt
    mode="max",  # of "max" als je accuracy logt
    max_t=10,
    grace_period=1,
    reduction_factor=2
)

reporter = CLIReporter(
    metric_columns=["loss", "accuracy", "training_iteration"]
)

result = tune.run(
    train_rnn_with_attention_ray,
    config=search_space,
    num_samples=10,  # aantal combinaties om te testen
    scheduler=scheduler,
    progress_reporter=reporter,
    resources_per_trial={"cpu": 1, "gpu": 0}  # of {"gpu": 1} als je GPU gebruikt
)


2025-06-04 20:04:35,311	INFO worker.py:1888 -- Started a local Ray instance.
2025-06-04 20:04:36,482	INFO tune.py:253 -- Initializing Ray automatically. For cluster usage or custom Ray initialization, call `ray.init(...)` before `tune.run(...)`.
2025-06-04 20:04:36,486	INFO tune.py:616 -- [output] This uses the legacy output and progress reporter, as Jupyter notebooks are not supported by the new engine, yet. For more information, please see https://github.com/ray-project/ray/issues/36949


== Status ==
Current time: 2025-06-04 20:04:36 (running for 00:00:00.24)
Using AsyncHyperBand: num_stopped=0
Bracket: Iter 8.000: None | Iter 4.000: None | Iter 2.000: None | Iter 1.000: None
Logical resource usage: 0/4 CPUs, 0/0 GPUs
Result logdir: /tmp/ray/session_2025-06-04_20-04-33_195499_39160/artifacts/2025-06-04_20-04-36/train_rnn_with_attention_ray_2025-06-04_20-04-36/driver_artifacts
Number of trials: 10/10 (10 PENDING)
+------------------------------------------+----------+-------+-----------+---------------+-------------+--------------+
| Trial name                               | status   | loc   |   dropout |   hidden_size |          lr |   num_layers |
|------------------------------------------+----------+-------+-----------+---------------+-------------+--------------|
| train_rnn_with_attention_ray_23c00_00000 | PENDING  |       | 0.222107  |           512 | 0.00298953  |            2 |
| train_rnn_with_attention_ray_23c00_00001 | PENDING  |       | 0.465705  |        

[36m(train_rnn_with_attention_ray pid=39511)[0m 2025-06-04 20:04:45.236 | INFO     | mads_datasets.base:download_data:121 - Folder already exists at /home/azureuser/.cache/mads_datasets/gestures
  0%|[38;2;30;71;6m          [0m| 0/2600 [00:00<?, ?it/s]
  8%|[38;2;30;71;6m▊         [0m| 201/2600 [00:00<00:01, 2003.81it/s]
 16%|[38;2;30;71;6m█▌        [0m| 406/2600 [00:00<00:01, 2025.35it/s]
  7%|[38;2;30;71;6m▋         [0m| 190/2600 [00:00<00:01, 1897.55it/s]
  8%|[38;2;30;71;6m▊         [0m| 198/2600 [00:00<00:01, 1971.72it/s]
  7%|[38;2;30;71;6m▋         [0m| 193/2600 [00:00<00:01, 1924.98it/s]
 24%|[38;2;30;71;6m██▎       [0m| 611/2600 [00:00<00:00, 2034.14it/s]
 23%|[38;2;30;71;6m██▎       [0m| 596/2600 [00:00<00:01, 1955.19it/s]
 15%|[38;2;30;71;6m█▌        [0m| 396/2600 [00:00<00:01, 1972.65it/s]
 15%|[38;2;30;71;6m█▌        [0m| 391/2600 [00:00<00:01, 1956.56it/s]
 31%|[38;2;30;71;6m███▏      [0m| 815/2600 [00:00<00:00, 2010.43it/s]
 30%|[38;2;30;71;6m███

== Status ==
Current time: 2025-06-04 20:04:46 (running for 00:00:10.29)
Using AsyncHyperBand: num_stopped=0
Bracket: Iter 8.000: None | Iter 4.000: None | Iter 2.000: None | Iter 1.000: None
Logical resource usage: 4.0/4 CPUs, 0/0 GPUs
Result logdir: /tmp/ray/session_2025-06-04_20-04-33_195499_39160/artifacts/2025-06-04_20-04-36/train_rnn_with_attention_ray_2025-06-04_20-04-36/driver_artifacts
Number of trials: 10/10 (6 PENDING, 4 RUNNING)
+------------------------------------------+----------+-----------------+-----------+---------------+-------------+--------------+
| Trial name                               | status   | loc             |   dropout |   hidden_size |          lr |   num_layers |
|------------------------------------------+----------+-----------------+-----------+---------------+-------------+--------------|
| train_rnn_with_attention_ray_23c00_00000 | RUNNING  | 10.0.0.13:39510 | 0.222107  |           512 | 0.00298953  |            2 |
| train_rnn_with_attention_ray_

100%|[38;2;30;71;6m██████████[0m| 2600/2600 [00:01<00:00, 1964.16it/s]
 91%|[38;2;30;71;6m█████████ [0m| 2363/2600 [00:01<00:00, 1944.98it/s]
 91%|[38;2;30;71;6m█████████ [0m| 2363/2600 [00:01<00:00, 1884.69it/s]
 92%|[38;2;30;71;6m█████████▏[0m| 2387/2600 [00:01<00:00, 1936.48it/s]
 29%|[38;2;30;71;6m██▉       [0m| 191/651 [00:00<00:00, 1901.22it/s]
100%|[38;2;30;71;6m██████████[0m| 2600/2600 [00:01<00:00, 1936.60it/s]
 98%|[38;2;30;71;6m█████████▊[0m| 2552/2600 [00:01<00:00, 1883.40it/s]
100%|[38;2;30;71;6m██████████[0m| 2600/2600 [00:01<00:00, 1964.85it/s]
100%|[38;2;30;71;6m██████████[0m| 2600/2600 [00:01<00:00, 1927.18it/s]
 59%|[38;2;30;71;6m█████▊    [0m| 382/651 [00:00<00:00, 1879.15it/s]
 30%|[38;2;30;71;6m██▉       [0m| 195/651 [00:00<00:00, 1943.16it/s]
 29%|[38;2;30;71;6m██▉       [0m| 190/651 [00:00<00:00, 1896.32it/s]
 31%|[38;2;30;71;6m███       [0m| 199/651 [00:00<00:00, 1981.34it/s]
 88%|[38;2;30;71;6m████████▊ [0m| 575/651 [00:00<00:00, 190

== Status ==
Current time: 2025-06-04 20:04:51 (running for 00:00:15.34)
Using AsyncHyperBand: num_stopped=0
Bracket: Iter 8.000: None | Iter 4.000: None | Iter 2.000: None | Iter 1.000: None
Logical resource usage: 4.0/4 CPUs, 0/0 GPUs
Result logdir: /tmp/ray/session_2025-06-04_20-04-33_195499_39160/artifacts/2025-06-04_20-04-36/train_rnn_with_attention_ray_2025-06-04_20-04-36/driver_artifacts
Number of trials: 10/10 (6 PENDING, 4 RUNNING)
+------------------------------------------+----------+-----------------+-----------+---------------+-------------+--------------+
| Trial name                               | status   | loc             |   dropout |   hidden_size |          lr |   num_layers |
|------------------------------------------+----------+-----------------+-----------+---------------+-------------+--------------|
| train_rnn_with_attention_ray_23c00_00000 | RUNNING  | 10.0.0.13:39510 | 0.222107  |           512 | 0.00298953  |            2 |
| train_rnn_with_attention_ray_

[36m(train_rnn_with_attention_ray pid=39511)[0m 
 63%|[38;2;30;71;6m██████▎   [0m| 51/81 [00:02<00:01, 16.78it/s][A
[36m(train_rnn_with_attention_ray pid=39512)[0m 
  4%|[38;2;30;71;6m▎         [0m| 3/81 [00:00<00:02, 28.27it/s][A
[36m(train_rnn_with_attention_ray pid=39510)[0m 
 21%|[38;2;30;71;6m██        [0m| 17/81 [00:02<00:09,  6.65it/s][A
[36m(train_rnn_with_attention_ray pid=39511)[0m 
 65%|[38;2;30;71;6m██████▌   [0m| 53/81 [00:03<00:01, 16.96it/s][A
[36m(train_rnn_with_attention_ray pid=39512)[0m 
  9%|[38;2;30;71;6m▊         [0m| 7/81 [00:00<00:02, 32.84it/s][A
[36m(train_rnn_with_attention_ray pid=39513)[0m 
 25%|[38;2;30;71;6m██▍       [0m| 20/81 [00:02<00:07,  7.63it/s][A
[36m(train_rnn_with_attention_ray pid=39511)[0m 
 68%|[38;2;30;71;6m██████▊   [0m| 55/81 [00:03<00:01, 17.57it/s][A
[36m(train_rnn_with_attention_ray pid=39512)[0m 
 14%|[38;2;30;71;6m█▎        [0m| 11/81 [00:00<00:02, 33.36it/s][A
[36m(train_rnn_with_attention_ray

== Status ==
Current time: 2025-06-04 20:04:56 (running for 00:00:20.41)
Using AsyncHyperBand: num_stopped=0
Bracket: Iter 8.000: None | Iter 4.000: None | Iter 2.000: None | Iter 1.000: None
Logical resource usage: 4.0/4 CPUs, 0/0 GPUs
Result logdir: /tmp/ray/session_2025-06-04_20-04-33_195499_39160/artifacts/2025-06-04_20-04-36/train_rnn_with_attention_ray_2025-06-04_20-04-36/driver_artifacts
Number of trials: 10/10 (6 PENDING, 4 RUNNING)
+------------------------------------------+----------+-----------------+-----------+---------------+-------------+--------------+
| Trial name                               | status   | loc             |   dropout |   hidden_size |          lr |   num_layers |
|------------------------------------------+----------+-----------------+-----------+---------------+-------------+--------------|
| train_rnn_with_attention_ray_23c00_00000 | RUNNING  | 10.0.0.13:39510 | 0.222107  |           512 | 0.00298953  |            2 |
| train_rnn_with_attention_ray_

[36m(train_rnn_with_attention_ray pid=39511)[0m 
 63%|[38;2;30;71;6m██████▎   [0m| 51/81 [00:02<00:01, 17.01it/s][A
[36m(train_rnn_with_attention_ray pid=39512)[0m 2025-06-04 20:04:54.482 | INFO     | mltrainer.trainer:report:209 - Epoch 1 train 1.2039 test 0.8995 metric ['0.7312'][32m [repeated 2x across cluster][0m
[36m(train_rnn_with_attention_ray pid=39512)[0m 
100%|[38;2;30;71;6m██████████[0m| 81/81 [00:02<00:00, 33.94it/s][A
[36m(train_rnn_with_attention_ray pid=39513)[0m 
 68%|[38;2;30;71;6m██████▊   [0m| 55/81 [00:07<00:03,  7.72it/s][A
[36m(train_rnn_with_attention_ray pid=39511)[0m 
 65%|[38;2;30;71;6m██████▌   [0m| 53/81 [00:03<00:01, 17.32it/s][A
[36m(train_rnn_with_attention_ray pid=39510)[0m 
 63%|[38;2;30;71;6m██████▎   [0m| 51/81 [00:07<00:04,  6.77it/s][A
[36m(train_rnn_with_attention_ray pid=39513)[0m 
 69%|[38;2;30;71;6m██████▉   [0m| 56/81 [00:07<00:03,  7.68it/s][A
 30%|[38;2;30;71;6m███       [0m| 3/10 [00:07<00:18,  2.63s/it]


== Status ==
Current time: 2025-06-04 20:05:01 (running for 00:00:25.46)
Using AsyncHyperBand: num_stopped=0
Bracket: Iter 8.000: None | Iter 4.000: None | Iter 2.000: None | Iter 1.000: None
Logical resource usage: 4.0/4 CPUs, 0/0 GPUs
Result logdir: /tmp/ray/session_2025-06-04_20-04-33_195499_39160/artifacts/2025-06-04_20-04-36/train_rnn_with_attention_ray_2025-06-04_20-04-36/driver_artifacts
Number of trials: 10/10 (6 PENDING, 4 RUNNING)
+------------------------------------------+----------+-----------------+-----------+---------------+-------------+--------------+
| Trial name                               | status   | loc             |   dropout |   hidden_size |          lr |   num_layers |
|------------------------------------------+----------+-----------------+-----------+---------------+-------------+--------------|
| train_rnn_with_attention_ray_23c00_00000 | RUNNING  | 10.0.0.13:39510 | 0.222107  |           512 | 0.00298953  |            2 |
| train_rnn_with_attention_ray_

[36m(train_rnn_with_attention_ray pid=39511)[0m 
 69%|[38;2;30;71;6m██████▉   [0m| 56/81 [00:03<00:01, 18.40it/s][A
[36m(train_rnn_with_attention_ray pid=39513)[0m 2025-06-04 20:05:01.393 | INFO     | mltrainer.trainer:report:209 - Epoch 0 train 2.2522 test 1.6588 metric ['0.3797'][32m [repeated 4x across cluster][0m
[36m(train_rnn_with_attention_ray pid=39512)[0m 
 89%|[38;2;30;71;6m████████▉ [0m| 72/81 [00:02<00:00, 33.28it/s][A
[36m(train_rnn_with_attention_ray pid=39513)[0m 
  5%|[38;2;30;71;6m▍         [0m| 4/81 [00:00<00:11,  6.80it/s][A
[36m(train_rnn_with_attention_ray pid=39511)[0m 
 72%|[38;2;30;71;6m███████▏  [0m| 58/81 [00:03<00:01, 18.61it/s][A
[36m(train_rnn_with_attention_ray pid=39512)[0m 
 94%|[38;2;30;71;6m█████████▍[0m| 76/81 [00:02<00:00, 33.09it/s][A
[36m(train_rnn_with_attention_ray pid=39511)[0m 
 74%|[38;2;30;71;6m███████▍  [0m| 60/81 [00:03<00:01, 18.80it/s][A
[36m(train_rnn_with_attention_ray pid=39512)[0m 
 99%|[38;2;30;71

== Status ==
Current time: 2025-06-04 20:05:07 (running for 00:00:30.52)
Using AsyncHyperBand: num_stopped=0
Bracket: Iter 8.000: None | Iter 4.000: None | Iter 2.000: None | Iter 1.000: None
Logical resource usage: 4.0/4 CPUs, 0/0 GPUs
Result logdir: /tmp/ray/session_2025-06-04_20-04-33_195499_39160/artifacts/2025-06-04_20-04-36/train_rnn_with_attention_ray_2025-06-04_20-04-36/driver_artifacts
Number of trials: 10/10 (6 PENDING, 4 RUNNING)
+------------------------------------------+----------+-----------------+-----------+---------------+-------------+--------------+
| Trial name                               | status   | loc             |   dropout |   hidden_size |          lr |   num_layers |
|------------------------------------------+----------+-----------------+-----------+---------------+-------------+--------------|
| train_rnn_with_attention_ray_23c00_00000 | RUNNING  | 10.0.0.13:39510 | 0.222107  |           512 | 0.00298953  |            2 |
| train_rnn_with_attention_ray_

[36m(train_rnn_with_attention_ray pid=39511)[0m 
 77%|[38;2;30;71;6m███████▋  [0m| 62/81 [00:03<00:01, 18.70it/s][A
[36m(train_rnn_with_attention_ray pid=39512)[0m 
 72%|[38;2;30;71;6m███████▏  [0m| 58/81 [00:01<00:00, 29.74it/s][A
[36m(train_rnn_with_attention_ray pid=39511)[0m 
 79%|[38;2;30;71;6m███████▉  [0m| 64/81 [00:03<00:00, 17.19it/s][A
[36m(train_rnn_with_attention_ray pid=39512)[0m 
 77%|[38;2;30;71;6m███████▋  [0m| 62/81 [00:02<00:00, 31.20it/s][A
[36m(train_rnn_with_attention_ray pid=39510)[0m 
 41%|[38;2;30;71;6m████      [0m| 33/81 [00:05<00:07,  6.53it/s][A
[36m(train_rnn_with_attention_ray pid=39513)[0m 
 51%|[38;2;30;71;6m█████     [0m| 41/81 [00:05<00:05,  7.23it/s][A
[36m(train_rnn_with_attention_ray pid=39512)[0m 
 81%|[38;2;30;71;6m████████▏ [0m| 66/81 [00:02<00:00, 31.74it/s][A
[36m(train_rnn_with_attention_ray pid=39510)[0m 
 42%|[38;2;30;71;6m████▏     [0m| 34/81 [00:05<00:06,  7.01it/s][A
[36m(train_rnn_with_attention_r

== Status ==
Current time: 2025-06-04 20:05:12 (running for 00:00:35.58)
Using AsyncHyperBand: num_stopped=0
Bracket: Iter 8.000: None | Iter 4.000: None | Iter 2.000: None | Iter 1.000: None
Logical resource usage: 4.0/4 CPUs, 0/0 GPUs
Result logdir: /tmp/ray/session_2025-06-04_20-04-33_195499_39160/artifacts/2025-06-04_20-04-36/train_rnn_with_attention_ray_2025-06-04_20-04-36/driver_artifacts
Number of trials: 10/10 (6 PENDING, 4 RUNNING)
+------------------------------------------+----------+-----------------+-----------+---------------+-------------+--------------+
| Trial name                               | status   | loc             |   dropout |   hidden_size |          lr |   num_layers |
|------------------------------------------+----------+-----------------+-----------+---------------+-------------+--------------|
| train_rnn_with_attention_ray_23c00_00000 | RUNNING  | 10.0.0.13:39510 | 0.222107  |           512 | 0.00298953  |            2 |
| train_rnn_with_attention_ray_

[36m(train_rnn_with_attention_ray pid=39511)[0m 
 80%|[38;2;30;71;6m████████  [0m| 65/81 [00:03<00:00, 18.59it/s][A
[36m(train_rnn_with_attention_ray pid=39512)[0m 
 64%|[38;2;30;71;6m██████▍   [0m| 52/81 [00:01<00:00, 32.75it/s][A
[36m(train_rnn_with_attention_ray pid=39510)[0m 
 79%|[38;2;30;71;6m███████▉  [0m| 64/81 [00:09<00:02,  5.74it/s][A
[36m(train_rnn_with_attention_ray pid=39513)[0m 
 94%|[38;2;30;71;6m█████████▍[0m| 76/81 [00:10<00:00,  7.71it/s][A
[36m(train_rnn_with_attention_ray pid=39511)[0m 
 83%|[38;2;30;71;6m████████▎ [0m| 67/81 [00:03<00:00, 18.77it/s][A
[36m(train_rnn_with_attention_ray pid=39512)[0m 
 69%|[38;2;30;71;6m██████▉   [0m| 56/81 [00:01<00:00, 32.62it/s][A
[36m(train_rnn_with_attention_ray pid=39511)[0m 
 85%|[38;2;30;71;6m████████▌ [0m| 69/81 [00:03<00:00, 18.57it/s][A
[36m(train_rnn_with_attention_ray pid=39512)[0m 
 74%|[38;2;30;71;6m███████▍  [0m| 60/81 [00:01<00:00, 33.05it/s][A
[36m(train_rnn_with_attention_r

Trial name,Accuracy
train_rnn_with_attention_ray_23c00_00000,0.892188
train_rnn_with_attention_ray_23c00_00001,0.804688
train_rnn_with_attention_ray_23c00_00002,0.964063
train_rnn_with_attention_ray_23c00_00003,0.96875
train_rnn_with_attention_ray_23c00_00004,0.91875
train_rnn_with_attention_ray_23c00_00005,0.828125
train_rnn_with_attention_ray_23c00_00006,0.928125
train_rnn_with_attention_ray_23c00_00007,0.939063
train_rnn_with_attention_ray_23c00_00008,0.934375
train_rnn_with_attention_ray_23c00_00009,0.920312


[36m(train_rnn_with_attention_ray pid=39512)[0m !!!!!!!!!!!!!! DEBUG metrics dict: {'Accuracy': 0.9640625}


[36m(train_rnn_with_attention_ray pid=39511)[0m 
 54%|[38;2;30;71;6m█████▍    [0m| 44/81 [00:02<00:02, 17.83it/s][A
[36m(train_rnn_with_attention_ray pid=39510)[0m 
  2%|[38;2;30;71;6m▏         [0m| 2/81 [00:00<00:11,  7.04it/s][A
[36m(train_rnn_with_attention_ray pid=39511)[0m 
 58%|[38;2;30;71;6m█████▊    [0m| 47/81 [00:02<00:01, 18.67it/s][A
[36m(train_rnn_with_attention_ray pid=39510)[0m 
  4%|[38;2;30;71;6m▎         [0m| 3/81 [00:00<00:11,  6.61it/s][A
[36m(train_rnn_with_attention_ray pid=39513)[0m 
 20%|[38;2;30;71;6m█▉        [0m| 16/81 [00:02<00:09,  6.64it/s][A
[36m(train_rnn_with_attention_ray pid=39511)[0m 
 62%|[38;2;30;71;6m██████▏   [0m| 50/81 [00:02<00:01, 20.76it/s][A
[36m(train_rnn_with_attention_ray pid=39513)[0m 
 21%|[38;2;30;71;6m██        [0m| 17/81 [00:02<00:09,  6.80it/s][A
[36m(train_rnn_with_attention_ray pid=39510)[0m 
  6%|[38;2;30;71;6m▌         [0m| 5/81 [00:00<00:08,  8.69it/s][A
[36m(train_rnn_with_attention_ray 

== Status ==
Current time: 2025-06-04 20:05:17 (running for 00:00:40.66)
Using AsyncHyperBand: num_stopped=0
Bracket: Iter 8.000: None | Iter 4.000: None | Iter 2.000: None | Iter 1.000: 0.9640625
Logical resource usage: 3.0/4 CPUs, 0/0 GPUs
Result logdir: /tmp/ray/session_2025-06-04_20-04-33_195499_39160/artifacts/2025-06-04_20-04-36/train_rnn_with_attention_ray_2025-06-04_20-04-36/driver_artifacts
Number of trials: 10/10 (6 PENDING, 3 RUNNING, 1 TERMINATED)
+------------------------------------------+------------+-----------------+-----------+---------------+-------------+--------------+----------------------+
| Trial name                               | status     | loc             |   dropout |   hidden_size |          lr |   num_layers |   training_iteration |
|------------------------------------------+------------+-----------------+-----------+---------------+-------------+--------------+----------------------|
| train_rnn_with_attention_ray_23c00_00000 | RUNNING    | 10.0.0.13:

[36m(train_rnn_with_attention_ray pid=39511)[0m 
 77%|[38;2;30;71;6m███████▋  [0m| 62/81 [00:03<00:01, 10.07it/s][A
[36m(train_rnn_with_attention_ray pid=39512)[0m 2025-06-04 20:05:15.729 | INFO     | mltrainer.trainer:report:209 - Epoch 9 train 0.1248 test 0.1782 metric ['0.9594'][32m [repeated 5x across cluster][0m
[36m(train_rnn_with_attention_ray pid=39510)[0m 
 10%|[38;2;30;71;6m▉         [0m| 8/81 [00:01<00:21,  3.32it/s][A
[36m(train_rnn_with_attention_ray pid=39511)[0m 
 79%|[38;2;30;71;6m███████▉  [0m| 64/81 [00:04<00:01, 10.27it/s][A
[36m(train_rnn_with_attention_ray pid=39511)[0m 
 81%|[38;2;30;71;6m████████▏ [0m| 66/81 [00:04<00:01, 11.35it/s][A
[36m(train_rnn_with_attention_ray pid=39510)[0m 
 11%|[38;2;30;71;6m█         [0m| 9/81 [00:01<00:18,  3.80it/s][A
[36m(train_rnn_with_attention_ray pid=39513)[0m 
 28%|[38;2;30;71;6m██▊       [0m| 23/81 [00:03<00:16,  3.57it/s][A
[36m(train_rnn_with_attention_ray pid=39511)[0m 
 84%|[38;2;30;71;

== Status ==
Current time: 2025-06-04 20:05:22 (running for 00:00:45.72)
Using AsyncHyperBand: num_stopped=0
Bracket: Iter 8.000: None | Iter 4.000: None | Iter 2.000: None | Iter 1.000: 0.9640625
Logical resource usage: 4.0/4 CPUs, 0/0 GPUs
Result logdir: /tmp/ray/session_2025-06-04_20-04-33_195499_39160/artifacts/2025-06-04_20-04-36/train_rnn_with_attention_ray_2025-06-04_20-04-36/driver_artifacts
Number of trials: 10/10 (6 PENDING, 3 RUNNING, 1 TERMINATED)
+------------------------------------------+------------+-----------------+-----------+---------------+-------------+--------------+----------------------+
| Trial name                               | status     | loc             |   dropout |   hidden_size |          lr |   num_layers |   training_iteration |
|------------------------------------------+------------+-----------------+-----------+---------------+-------------+--------------+----------------------|
| train_rnn_with_attention_ray_23c00_00000 | RUNNING    | 10.0.0.13:

[36m(train_rnn_with_attention_ray pid=39511)[0m 
 83%|[38;2;30;71;6m████████▎ [0m| 67/81 [00:03<00:00, 17.36it/s][A
[36m(train_rnn_with_attention_ray pid=39510)[0m 
 46%|[38;2;30;71;6m████▌     [0m| 37/81 [00:06<00:06,  6.60it/s][A
[36m(train_rnn_with_attention_ray pid=39513)[0m 
 65%|[38;2;30;71;6m██████▌   [0m| 53/81 [00:08<00:03,  7.03it/s][A
[36m(train_rnn_with_attention_ray pid=39511)[0m 
 85%|[38;2;30;71;6m████████▌ [0m| 69/81 [00:03<00:00, 17.07it/s][A
[36m(train_rnn_with_attention_ray pid=39510)[0m 
 47%|[38;2;30;71;6m████▋     [0m| 38/81 [00:06<00:06,  7.11it/s][A
[36m(train_rnn_with_attention_ray pid=39513)[0m 
 67%|[38;2;30;71;6m██████▋   [0m| 54/81 [00:08<00:03,  7.24it/s][A
[36m(train_rnn_with_attention_ray pid=39511)[0m 
 88%|[38;2;30;71;6m████████▊ [0m| 71/81 [00:04<00:00, 16.38it/s][A
[36m(train_rnn_with_attention_ray pid=39510)[0m 
 48%|[38;2;30;71;6m████▊     [0m| 39/81 [00:07<00:06,  6.49it/s][A
[36m(train_rnn_with_attention_r

== Status ==
Current time: 2025-06-04 20:05:27 (running for 00:00:50.79)
Using AsyncHyperBand: num_stopped=0
Bracket: Iter 8.000: None | Iter 4.000: None | Iter 2.000: None | Iter 1.000: 0.9640625
Logical resource usage: 4.0/4 CPUs, 0/0 GPUs
Result logdir: /tmp/ray/session_2025-06-04_20-04-33_195499_39160/artifacts/2025-06-04_20-04-36/train_rnn_with_attention_ray_2025-06-04_20-04-36/driver_artifacts
Number of trials: 10/10 (6 PENDING, 3 RUNNING, 1 TERMINATED)
+------------------------------------------+------------+-----------------+-----------+---------------+-------------+--------------+----------------------+
| Trial name                               | status     | loc             |   dropout |   hidden_size |          lr |   num_layers |   training_iteration |
|------------------------------------------+------------+-----------------+-----------+---------------+-------------+--------------+----------------------|
| train_rnn_with_attention_ray_23c00_00000 | RUNNING    | 10.0.0.13:

[36m(train_rnn_with_attention_ray pid=39511)[0m 
 75%|[38;2;30;71;6m███████▌  [0m| 61/81 [00:03<00:01, 10.77it/s][A
[36m(train_rnn_with_attention_ray pid=39510)[0m 
 80%|[38;2;30;71;6m████████  [0m| 65/81 [00:11<00:03,  4.43it/s][A
[36m(train_rnn_with_attention_ray pid=39511)[0m 
 78%|[38;2;30;71;6m███████▊  [0m| 63/81 [00:03<00:01, 12.18it/s][A
[36m(train_rnn_with_attention_ray pid=39511)[0m 
 80%|[38;2;30;71;6m████████  [0m| 65/81 [00:04<00:01, 13.02it/s][A
[36m(train_rnn_with_attention_ray pid=39510)[0m 
 81%|[38;2;30;71;6m████████▏ [0m| 66/81 [00:11<00:03,  4.95it/s][A
[36m(train_rnn_with_attention_ray pid=39510)[0m 
 83%|[38;2;30;71;6m████████▎ [0m| 67/81 [00:12<00:02,  5.36it/s][A
[36m(train_rnn_with_attention_ray pid=39511)[0m 
 83%|[38;2;30;71;6m████████▎ [0m| 67/81 [00:04<00:01, 13.87it/s][A
 30%|[38;2;30;71;6m███       [0m| 3/10 [00:38<01:31, 13.09s/it]
  0%|[38;2;30;71;6m          [0m| 0/81 [00:00<?, ?it/s][A
[36m(train_rnn_with_atten

== Status ==
Current time: 2025-06-04 20:05:32 (running for 00:00:55.84)
Using AsyncHyperBand: num_stopped=0
Bracket: Iter 8.000: None | Iter 4.000: None | Iter 2.000: None | Iter 1.000: 0.9640625
Logical resource usage: 4.0/4 CPUs, 0/0 GPUs
Result logdir: /tmp/ray/session_2025-06-04_20-04-33_195499_39160/artifacts/2025-06-04_20-04-36/train_rnn_with_attention_ray_2025-06-04_20-04-36/driver_artifacts
Number of trials: 10/10 (5 PENDING, 4 RUNNING, 1 TERMINATED)
+------------------------------------------+------------+-----------------+-----------+---------------+-------------+--------------+----------------------+
| Trial name                               | status     | loc             |   dropout |   hidden_size |          lr |   num_layers |   training_iteration |
|------------------------------------------+------------+-----------------+-----------+---------------+-------------+--------------+----------------------|
| train_rnn_with_attention_ray_23c00_00000 | RUNNING    | 10.0.0.13:

[36m(train_rnn_with_attention_ray pid=39511)[0m 
 80%|[38;2;30;71;6m████████  [0m| 65/81 [00:03<00:00, 17.82it/s][A
[36m(train_rnn_with_attention_ray pid=39513)[0m 
 43%|[38;2;30;71;6m████▎     [0m| 35/81 [00:04<00:05,  7.80it/s][A
[36m(train_rnn_with_attention_ray pid=39511)[0m 
 83%|[38;2;30;71;6m████████▎ [0m| 67/81 [00:03<00:00, 17.88it/s][A
[36m(train_rnn_with_attention_ray pid=39510)[0m 
 16%|[38;2;30;71;6m█▌        [0m| 13/81 [00:01<00:09,  6.83it/s][A
[36m(train_rnn_with_attention_ray pid=39510)[0m 
 17%|[38;2;30;71;6m█▋        [0m| 14/81 [00:02<00:09,  7.04it/s][A
[36m(train_rnn_with_attention_ray pid=39513)[0m 
 44%|[38;2;30;71;6m████▍     [0m| 36/81 [00:04<00:05,  7.71it/s][A
[36m(train_rnn_with_attention_ray pid=39511)[0m 
 86%|[38;2;30;71;6m████████▋ [0m| 70/81 [00:03<00:00, 17.72it/s][A
[36m(train_rnn_with_attention_ray pid=39513)[0m 
 46%|[38;2;30;71;6m████▌     [0m| 37/81 [00:04<00:05,  7.83it/s][A
[36m(train_rnn_with_attention_r

== Status ==
Current time: 2025-06-04 20:05:37 (running for 00:01:00.90)
Using AsyncHyperBand: num_stopped=0
Bracket: Iter 8.000: None | Iter 4.000: None | Iter 2.000: None | Iter 1.000: 0.9640625
Logical resource usage: 4.0/4 CPUs, 0/0 GPUs
Result logdir: /tmp/ray/session_2025-06-04_20-04-33_195499_39160/artifacts/2025-06-04_20-04-36/train_rnn_with_attention_ray_2025-06-04_20-04-36/driver_artifacts
Number of trials: 10/10 (5 PENDING, 4 RUNNING, 1 TERMINATED)
+------------------------------------------+------------+-----------------+-----------+---------------+-------------+--------------+----------------------+
| Trial name                               | status     | loc             |   dropout |   hidden_size |          lr |   num_layers |   training_iteration |
|------------------------------------------+------------+-----------------+-----------+---------------+-------------+--------------+----------------------|
| train_rnn_with_attention_ray_23c00_00000 | RUNNING    | 10.0.0.13:

[36m(train_rnn_with_attention_ray pid=39511)[0m 
 84%|[38;2;30;71;6m████████▍ [0m| 68/81 [00:03<00:00, 16.47it/s][A
[36m(train_rnn_with_attention_ray pid=39510)[0m 
 59%|[38;2;30;71;6m█████▉    [0m| 48/81 [00:07<00:04,  7.01it/s][A
[36m(train_rnn_with_attention_ray pid=39723)[0m 
 68%|[38;2;30;71;6m██████▊   [0m| 55/81 [00:00<00:00, 55.59it/s][A
[36m(train_rnn_with_attention_ray pid=39511)[0m 
 86%|[38;2;30;71;6m████████▋ [0m| 70/81 [00:04<00:00, 16.68it/s][A
[36m(train_rnn_with_attention_ray pid=39513)[0m 
 90%|[38;2;30;71;6m█████████ [0m| 73/81 [00:09<00:01,  6.93it/s][A
[36m(train_rnn_with_attention_ray pid=39723)[0m 
 77%|[38;2;30;71;6m███████▋  [0m| 62/81 [00:01<00:00, 57.53it/s][A
[36m(train_rnn_with_attention_ray pid=39510)[0m 
 60%|[38;2;30;71;6m██████    [0m| 49/81 [00:07<00:04,  6.69it/s][A
[36m(train_rnn_with_attention_ray pid=39513)[0m 
 91%|[38;2;30;71;6m█████████▏[0m| 74/81 [00:09<00:01,  6.73it/s][A
[36m(train_rnn_with_attention_r

[36m(train_rnn_with_attention_ray pid=39511)[0m !!!!!!!!!!!!!! DEBUG metrics dict: {'Accuracy': 0.8046875}


[36m(train_rnn_with_attention_ray pid=39510)[0m 
 69%|[38;2;30;71;6m██████▉   [0m| 56/81 [00:08<00:03,  6.90it/s][A
[36m(train_rnn_with_attention_ray pid=39513)[0m 
100%|[38;2;30;71;6m██████████[0m| 81/81 [00:10<00:00,  7.40it/s][A
[36m(train_rnn_with_attention_ray pid=39723)[0m 
 52%|[38;2;30;71;6m█████▏    [0m| 42/81 [00:00<00:00, 56.18it/s][A
[36m(train_rnn_with_attention_ray pid=39510)[0m 
 70%|[38;2;30;71;6m███████   [0m| 57/81 [00:08<00:03,  7.13it/s][A
[36m(train_rnn_with_attention_ray pid=39511)[0m 2025-06-04 20:05:38.420 | INFO     | mltrainer.trainer:report:209 - Epoch 9 train 0.5226 test 0.5198 metric ['0.8047'][32m [repeated 4x across cluster][0m
[36m(train_rnn_with_attention_ray pid=39723)[0m 
 59%|[38;2;30;71;6m█████▉    [0m| 48/81 [00:00<00:00, 55.09it/s][A
[36m(train_rnn_with_attention_ray pid=39510)[0m 
 72%|[38;2;30;71;6m███████▏  [0m| 58/81 [00:08<00:03,  6.82it/s][A
[36m(train_rnn_with_attention_ray pid=39723)[0m 
 72%|[38;2;30;7

== Status ==
Current time: 2025-06-04 20:05:42 (running for 00:01:05.91)
Using AsyncHyperBand: num_stopped=1
Bracket: Iter 8.000: None | Iter 4.000: None | Iter 2.000: None | Iter 1.000: 0.884375
Logical resource usage: 4.0/4 CPUs, 0/0 GPUs
Result logdir: /tmp/ray/session_2025-06-04_20-04-33_195499_39160/artifacts/2025-06-04_20-04-36/train_rnn_with_attention_ray_2025-06-04_20-04-36/driver_artifacts
Number of trials: 10/10 (5 PENDING, 3 RUNNING, 2 TERMINATED)
+------------------------------------------+------------+-----------------+-----------+---------------+-------------+--------------+----------------------+
| Trial name                               | status     | loc             |   dropout |   hidden_size |          lr |   num_layers |   training_iteration |
|------------------------------------------+------------+-----------------+-----------+---------------+-------------+--------------+----------------------|
| train_rnn_with_attention_ray_23c00_00000 | RUNNING    | 10.0.0.13:3

[36m(train_rnn_with_attention_ray pid=39513)[0m 
 28%|[38;2;30;71;6m██▊       [0m| 23/81 [00:03<00:07,  7.30it/s][A
[36m(train_rnn_with_attention_ray pid=39723)[0m 
 28%|[38;2;30;71;6m██▊       [0m| 23/81 [00:00<00:01, 53.11it/s][A
[36m(train_rnn_with_attention_ray pid=39513)[0m 
 30%|[38;2;30;71;6m██▉       [0m| 24/81 [00:03<00:07,  7.78it/s][A
[36m(train_rnn_with_attention_ray pid=39723)[0m 
 36%|[38;2;30;71;6m███▌      [0m| 29/81 [00:00<00:00, 54.38it/s][A
[36m(train_rnn_with_attention_ray pid=39513)[0m 
 31%|[38;2;30;71;6m███       [0m| 25/81 [00:03<00:07,  7.66it/s][A
[36m(train_rnn_with_attention_ray pid=39723)[0m 
 44%|[38;2;30;71;6m████▍     [0m| 36/81 [00:00<00:00, 57.20it/s][A
[36m(train_rnn_with_attention_ray pid=39723)[0m 
 52%|[38;2;30;71;6m█████▏    [0m| 42/81 [00:00<00:00, 57.06it/s][A
  0%|[38;2;30;71;6m          [0m| 0/81 [00:00<?, ?it/s][A[32m [repeated 5x across cluster][0m
[36m(train_rnn_with_attention_ray pid=39513)[0m 
 32

== Status ==
Current time: 2025-06-04 20:05:47 (running for 00:01:10.97)
Using AsyncHyperBand: num_stopped=1
Bracket: Iter 8.000: None | Iter 4.000: None | Iter 2.000: None | Iter 1.000: 0.884375
Logical resource usage: 4.0/4 CPUs, 0/0 GPUs
Result logdir: /tmp/ray/session_2025-06-04_20-04-33_195499_39160/artifacts/2025-06-04_20-04-36/train_rnn_with_attention_ray_2025-06-04_20-04-36/driver_artifacts
Number of trials: 10/10 (5 PENDING, 3 RUNNING, 2 TERMINATED)
+------------------------------------------+------------+-----------------+-----------+---------------+-------------+--------------+----------------------+
| Trial name                               | status     | loc             |   dropout |   hidden_size |          lr |   num_layers |   training_iteration |
|------------------------------------------+------------+-----------------+-----------+---------------+-------------+--------------+----------------------|
| train_rnn_with_attention_ray_23c00_00000 | RUNNING    | 10.0.0.13:3

[36m(train_rnn_with_attention_ray pid=39510)[0m 
 38%|[38;2;30;71;6m███▊      [0m| 31/81 [00:04<00:06,  8.08it/s][A
[36m(train_rnn_with_attention_ray pid=39513)[0m 
 74%|[38;2;30;71;6m███████▍  [0m| 60/81 [00:08<00:02,  7.42it/s][A
[36m(train_rnn_with_attention_ray pid=39723)[0m 
 53%|[38;2;30;71;6m█████▎    [0m| 43/81 [00:00<00:00, 53.67it/s][A
[36m(train_rnn_with_attention_ray pid=39513)[0m 
 75%|[38;2;30;71;6m███████▌  [0m| 61/81 [00:08<00:02,  7.96it/s][A
[36m(train_rnn_with_attention_ray pid=39723)[0m 
 60%|[38;2;30;71;6m██████    [0m| 49/81 [00:00<00:00, 54.63it/s][A
[36m(train_rnn_with_attention_ray pid=39510)[0m 
 40%|[38;2;30;71;6m███▉      [0m| 32/81 [00:04<00:06,  7.44it/s][A
[36m(train_rnn_with_attention_ray pid=39513)[0m 
 77%|[38;2;30;71;6m███████▋  [0m| 62/81 [00:08<00:02,  7.87it/s][A
[36m(train_rnn_with_attention_ray pid=39723)[0m 
 68%|[38;2;30;71;6m██████▊   [0m| 55/81 [00:01<00:00, 55.66it/s][A
[36m(train_rnn_with_attention_r

[36m(train_rnn_with_attention_ray pid=39723)[0m !!!!!!!!!!!!!! DEBUG metrics dict: {'Accuracy': 0.91875}


[36m(train_rnn_with_attention_ray pid=39510)[0m 
 48%|[38;2;30;71;6m████▊     [0m| 39/81 [00:05<00:05,  8.17it/s][A
[36m(train_rnn_with_attention_ray pid=39513)[0m 
 84%|[38;2;30;71;6m████████▍ [0m| 68/81 [00:09<00:01,  7.33it/s][A
[36m(train_rnn_with_attention_ray pid=39510)[0m 
 49%|[38;2;30;71;6m████▉     [0m| 40/81 [00:05<00:04,  8.49it/s][A
[36m(train_rnn_with_attention_ray pid=39513)[0m 
 85%|[38;2;30;71;6m████████▌ [0m| 69/81 [00:09<00:01,  7.63it/s][A
[36m(train_rnn_with_attention_ray pid=39510)[0m 
 51%|[38;2;30;71;6m█████     [0m| 41/81 [00:05<00:04,  8.72it/s][A
[36m(train_rnn_with_attention_ray pid=39723)[0m 2025-06-04 20:05:48.388 | INFO     | mltrainer.trainer:report:209 - Epoch 9 train 0.2552 test 0.2812 metric ['0.9203'][32m [repeated 3x across cluster][0m
[36m(train_rnn_with_attention_ray pid=39510)[0m 
 52%|[38;2;30;71;6m█████▏    [0m| 42/81 [00:05<00:04,  8.02it/s][A
[36m(train_rnn_with_attention_ray pid=39513)[0m 
 88%|[38;2;30;7

== Status ==
Current time: 2025-06-04 20:05:52 (running for 00:01:16.00)
Using AsyncHyperBand: num_stopped=1
Bracket: Iter 8.000: None | Iter 4.000: None | Iter 2.000: None | Iter 1.000: 0.91875
Logical resource usage: 4.0/4 CPUs, 0/0 GPUs
Result logdir: /tmp/ray/session_2025-06-04_20-04-33_195499_39160/artifacts/2025-06-04_20-04-36/train_rnn_with_attention_ray_2025-06-04_20-04-36/driver_artifacts
Number of trials: 10/10 (4 PENDING, 3 RUNNING, 3 TERMINATED)
+------------------------------------------+------------+-----------------+-----------+---------------+-------------+--------------+----------------------+
| Trial name                               | status     | loc             |   dropout |   hidden_size |          lr |   num_layers |   training_iteration |
|------------------------------------------+------------+-----------------+-----------+---------------+-------------+--------------+----------------------|
| train_rnn_with_attention_ray_23c00_00000 | RUNNING    | 10.0.0.13:39

[36m(train_rnn_with_attention_ray pid=39510)[0m 
 81%|[38;2;30;71;6m████████▏ [0m| 66/81 [00:09<00:02,  7.39it/s][A
[36m(train_rnn_with_attention_ray pid=39513)[0m 
  9%|[38;2;30;71;6m▊         [0m| 7/81 [00:01<00:12,  5.72it/s][A
 34%|[38;2;30;71;6m███▎      [0m| 875/2600 [00:00<00:01, 1364.03it/s]
[36m(train_rnn_with_attention_ray pid=39513)[0m 
 10%|[38;2;30;71;6m▉         [0m| 8/81 [00:01<00:11,  6.20it/s][A
 40%|[38;2;30;71;6m███▉      [0m| 1039/2600 [00:00<00:01, 1446.94it/s]
[36m(train_rnn_with_attention_ray pid=39510)[0m 
 83%|[38;2;30;71;6m████████▎ [0m| 67/81 [00:09<00:01,  7.26it/s][A
[36m(train_rnn_with_attention_ray pid=39513)[0m 
 11%|[38;2;30;71;6m█         [0m| 9/81 [00:01<00:10,  6.70it/s][A
 46%|[38;2;30;71;6m████▌     [0m| 1199/2600 [00:00<00:00, 1491.18it/s]
[36m(train_rnn_with_attention_ray pid=39510)[0m 
 84%|[38;2;30;71;6m████████▍ [0m| 68/81 [00:09<00:01,  7.38it/s][A
[36m(train_rnn_with_attention_ray pid=39513)[0m 
 12%|[3

== Status ==
Current time: 2025-06-04 20:05:57 (running for 00:01:21.07)
Using AsyncHyperBand: num_stopped=1
Bracket: Iter 8.000: None | Iter 4.000: None | Iter 2.000: None | Iter 1.000: 0.91875
Logical resource usage: 4.0/4 CPUs, 0/0 GPUs
Result logdir: /tmp/ray/session_2025-06-04_20-04-33_195499_39160/artifacts/2025-06-04_20-04-36/train_rnn_with_attention_ray_2025-06-04_20-04-36/driver_artifacts
Number of trials: 10/10 (4 PENDING, 3 RUNNING, 3 TERMINATED)
+------------------------------------------+------------+-----------------+-----------+---------------+-------------+--------------+----------------------+
| Trial name                               | status     | loc             |   dropout |   hidden_size |          lr |   num_layers |   training_iteration |
|------------------------------------------+------------+-----------------+-----------+---------------+-------------+--------------+----------------------|
| train_rnn_with_attention_ray_23c00_00000 | RUNNING    | 10.0.0.13:39

[36m(train_rnn_with_attention_ray pid=39798)[0m 
  9%|[38;2;30;71;6m▊         [0m| 7/81 [00:00<00:01, 66.63it/s][A
[36m(train_rnn_with_attention_ray pid=39510)[0m 
 19%|[38;2;30;71;6m█▊        [0m| 15/81 [00:02<00:09,  6.94it/s][A
[36m(train_rnn_with_attention_ray pid=39513)[0m 
 56%|[38;2;30;71;6m█████▌    [0m| 45/81 [00:06<00:04,  7.83it/s][A
[36m(train_rnn_with_attention_ray pid=39510)[0m 
 20%|[38;2;30;71;6m█▉        [0m| 16/81 [00:02<00:09,  7.01it/s][A
[36m(train_rnn_with_attention_ray pid=39513)[0m 
 57%|[38;2;30;71;6m█████▋    [0m| 46/81 [00:06<00:04,  7.97it/s][A
[36m(train_rnn_with_attention_ray pid=39798)[0m 
 19%|[38;2;30;71;6m█▊        [0m| 15/81 [00:00<00:00, 69.16it/s][A
[36m(train_rnn_with_attention_ray pid=39513)[0m 
 58%|[38;2;30;71;6m█████▊    [0m| 47/81 [00:06<00:04,  7.89it/s][A
[36m(train_rnn_with_attention_ray pid=39798)[0m 
 28%|[38;2;30;71;6m██▊       [0m| 23/81 [00:00<00:00, 69.93it/s][A
[36m(train_rnn_with_attention_ra

== Status ==
Current time: 2025-06-04 20:06:02 (running for 00:01:26.17)
Using AsyncHyperBand: num_stopped=1
Bracket: Iter 8.000: None | Iter 4.000: None | Iter 2.000: None | Iter 1.000: 0.91875
Logical resource usage: 4.0/4 CPUs, 0/0 GPUs
Result logdir: /tmp/ray/session_2025-06-04_20-04-33_195499_39160/artifacts/2025-06-04_20-04-36/train_rnn_with_attention_ray_2025-06-04_20-04-36/driver_artifacts
Number of trials: 10/10 (3 PENDING, 4 RUNNING, 3 TERMINATED)
+------------------------------------------+------------+-----------------+-----------+---------------+-------------+--------------+----------------------+
| Trial name                               | status     | loc             |   dropout |   hidden_size |          lr |   num_layers |   training_iteration |
|------------------------------------------+------------+-----------------+-----------+---------------+-------------+--------------+----------------------|
| train_rnn_with_attention_ray_23c00_00000 | RUNNING    | 10.0.0.13:39

[36m(train_rnn_with_attention_ray pid=39513)[0m 
100%|[38;2;30;71;6m██████████[0m| 81/81 [00:11<00:00,  7.20it/s][A
[36m(train_rnn_with_attention_ray pid=39798)[0m 
 69%|[38;2;30;71;6m██████▉   [0m| 56/81 [00:00<00:00, 73.02it/s][A
 89%|[38;2;30;71;6m████████▉ [0m| 2312/2600 [00:01<00:00, 1505.54it/s]
[36m(train_rnn_with_attention_ray pid=39510)[0m 
 62%|[38;2;30;71;6m██████▏   [0m| 50/81 [00:07<00:04,  7.61it/s][A
[36m(train_rnn_with_attention_ray pid=39798)[0m 
 79%|[38;2;30;71;6m███████▉  [0m| 64/81 [00:00<00:00, 71.82it/s][A
 95%|[38;2;30;71;6m█████████▌[0m| 2475/2600 [00:01<00:00, 1540.63it/s]
[36m(train_rnn_with_attention_ray pid=39510)[0m 
 63%|[38;2;30;71;6m██████▎   [0m| 51/81 [00:07<00:04,  7.47it/s][A
[36m(train_rnn_with_attention_ray pid=39798)[0m 
 89%|[38;2;30;71;6m████████▉ [0m| 72/81 [00:00<00:00, 74.10it/s][A
100%|[38;2;30;71;6m██████████[0m| 2600/2600 [00:01<00:00, 1523.66it/s]
  0%|[38;2;30;71;6m          [0m| 0/651 [00:00<?, ?it

[36m(train_rnn_with_attention_ray pid=39798)[0m !!!!!!!!!!!!!! DEBUG metrics dict: {'Accuracy': 0.828125}


[36m(train_rnn_with_attention_ray pid=39867)[0m 
 89%|[38;2;30;71;6m████████▉ [0m| 72/81 [00:02<00:00, 38.37it/s][A
[36m(train_rnn_with_attention_ray pid=39513)[0m 
 40%|[38;2;30;71;6m███▉      [0m| 32/81 [00:04<00:07,  6.67it/s][A
[36m(train_rnn_with_attention_ray pid=39867)[0m 
 94%|[38;2;30;71;6m█████████▍[0m| 76/81 [00:02<00:00, 37.20it/s][A


== Status ==
Current time: 2025-06-04 20:06:07 (running for 00:01:31.23)
Using AsyncHyperBand: num_stopped=2
Bracket: Iter 8.000: None | Iter 4.000: None | Iter 2.000: None | Iter 1.000: 0.8734375
Logical resource usage: 3.0/4 CPUs, 0/0 GPUs
Result logdir: /tmp/ray/session_2025-06-04_20-04-33_195499_39160/artifacts/2025-06-04_20-04-36/train_rnn_with_attention_ray_2025-06-04_20-04-36/driver_artifacts
Number of trials: 10/10 (3 PENDING, 3 RUNNING, 4 TERMINATED)
+------------------------------------------+------------+-----------------+-----------+---------------+-------------+--------------+----------------------+
| Trial name                               | status     | loc             |   dropout |   hidden_size |          lr |   num_layers |   training_iteration |
|------------------------------------------+------------+-----------------+-----------+---------------+-------------+--------------+----------------------|
| train_rnn_with_attention_ray_23c00_00000 | RUNNING    | 10.0.0.13:

[36m(train_rnn_with_attention_ray pid=39513)[0m 
 41%|[38;2;30;71;6m████      [0m| 33/81 [00:04<00:06,  6.88it/s][A
[36m(train_rnn_with_attention_ray pid=39867)[0m 
 99%|[38;2;30;71;6m█████████▉[0m| 80/81 [00:02<00:00, 36.90it/s][A
[36m(train_rnn_with_attention_ray pid=39513)[0m 
 42%|[38;2;30;71;6m████▏     [0m| 34/81 [00:04<00:06,  7.03it/s][A
100%|[38;2;30;71;6m██████████[0m| 81/81 [00:02<00:00, 35.71it/s]
 60%|[38;2;30;71;6m██████    [0m| 6/10 [01:18<00:51, 12.88s/it]
 10%|[38;2;30;71;6m█         [0m| 1/10 [00:02<00:21,  2.42s/it]
[36m(train_rnn_with_attention_ray pid=39510)[0m 
  1%|[38;2;30;71;6m          [0m| 1/81 [00:00<00:16,  4.79it/s][A
[36m(train_rnn_with_attention_ray pid=39513)[0m 
 43%|[38;2;30;71;6m████▎     [0m| 35/81 [00:04<00:07,  5.76it/s][A
[36m(train_rnn_with_attention_ray pid=39867)[0m 
  4%|[38;2;30;71;6m▎         [0m| 3/81 [00:00<00:04, 16.61it/s][A
[36m(train_rnn_with_attention_ray pid=39510)[0m 
  2%|[38;2;30;71;6m▏     

== Status ==
Current time: 2025-06-04 20:06:12 (running for 00:01:36.28)
Using AsyncHyperBand: num_stopped=2
Bracket: Iter 8.000: None | Iter 4.000: None | Iter 2.000: None | Iter 1.000: 0.8734375
Logical resource usage: 4.0/4 CPUs, 0/0 GPUs
Result logdir: /tmp/ray/session_2025-06-04_20-04-33_195499_39160/artifacts/2025-06-04_20-04-36/train_rnn_with_attention_ray_2025-06-04_20-04-36/driver_artifacts
Number of trials: 10/10 (3 PENDING, 3 RUNNING, 4 TERMINATED)
+------------------------------------------+------------+-----------------+-----------+---------------+-------------+--------------+----------------------+
| Trial name                               | status     | loc             |   dropout |   hidden_size |          lr |   num_layers |   training_iteration |
|------------------------------------------+------------+-----------------+-----------+---------------+-------------+--------------+----------------------|
| train_rnn_with_attention_ray_23c00_00000 | RUNNING    | 10.0.0.13:

[36m(train_rnn_with_attention_ray pid=39510)[0m 
 38%|[38;2;30;71;6m███▊      [0m| 31/81 [00:04<00:06,  7.26it/s][A
[36m(train_rnn_with_attention_ray pid=39513)[0m 
 80%|[38;2;30;71;6m████████  [0m| 65/81 [00:09<00:02,  7.40it/s][A
[36m(train_rnn_with_attention_ray pid=39867)[0m 
 40%|[38;2;30;71;6m███▉      [0m| 32/81 [00:01<00:01, 31.28it/s][A
[36m(train_rnn_with_attention_ray pid=39510)[0m 
 40%|[38;2;30;71;6m███▉      [0m| 32/81 [00:04<00:06,  7.26it/s][A
[36m(train_rnn_with_attention_ray pid=39867)[0m 
 44%|[38;2;30;71;6m████▍     [0m| 36/81 [00:01<00:01, 31.70it/s][A
[36m(train_rnn_with_attention_ray pid=39513)[0m 
 81%|[38;2;30;71;6m████████▏ [0m| 66/81 [00:09<00:02,  7.22it/s][A
[36m(train_rnn_with_attention_ray pid=39867)[0m 
 49%|[38;2;30;71;6m████▉     [0m| 40/81 [00:01<00:01, 31.47it/s][A
[36m(train_rnn_with_attention_ray pid=39510)[0m 
 41%|[38;2;30;71;6m████      [0m| 33/81 [00:05<00:06,  7.37it/s][A
[36m(train_rnn_with_attention_r

== Status ==
Current time: 2025-06-04 20:06:17 (running for 00:01:41.34)
Using AsyncHyperBand: num_stopped=2
Bracket: Iter 8.000: None | Iter 4.000: None | Iter 2.000: None | Iter 1.000: 0.8734375
Logical resource usage: 4.0/4 CPUs, 0/0 GPUs
Result logdir: /tmp/ray/session_2025-06-04_20-04-33_195499_39160/artifacts/2025-06-04_20-04-36/train_rnn_with_attention_ray_2025-06-04_20-04-36/driver_artifacts
Number of trials: 10/10 (3 PENDING, 3 RUNNING, 4 TERMINATED)
+------------------------------------------+------------+-----------------+-----------+---------------+-------------+--------------+----------------------+
| Trial name                               | status     | loc             |   dropout |   hidden_size |          lr |   num_layers |   training_iteration |
|------------------------------------------+------------+-----------------+-----------+---------------+-------------+--------------+----------------------|
| train_rnn_with_attention_ray_23c00_00000 | RUNNING    | 10.0.0.13:

[36m(train_rnn_with_attention_ray pid=39510)[0m 
 83%|[38;2;30;71;6m████████▎ [0m| 67/81 [00:09<00:01,  7.58it/s][A
[36m(train_rnn_with_attention_ray pid=39513)[0m 
 17%|[38;2;30;71;6m█▋        [0m| 14/81 [00:02<00:09,  7.09it/s][A
[36m(train_rnn_with_attention_ray pid=39867)[0m 
 28%|[38;2;30;71;6m██▊       [0m| 23/81 [00:00<00:01, 33.29it/s][A
[36m(train_rnn_with_attention_ray pid=39510)[0m 
 84%|[38;2;30;71;6m████████▍ [0m| 68/81 [00:10<00:01,  7.51it/s][A
[36m(train_rnn_with_attention_ray pid=39513)[0m 
 19%|[38;2;30;71;6m█▊        [0m| 15/81 [00:02<00:08,  7.38it/s][A
[36m(train_rnn_with_attention_ray pid=39867)[0m 
 33%|[38;2;30;71;6m███▎      [0m| 27/81 [00:00<00:01, 32.22it/s][A
[36m(train_rnn_with_attention_ray pid=39510)[0m 
 85%|[38;2;30;71;6m████████▌ [0m| 69/81 [00:10<00:01,  7.53it/s][A
[36m(train_rnn_with_attention_ray pid=39513)[0m 
 20%|[38;2;30;71;6m█▉        [0m| 16/81 [00:02<00:08,  7.42it/s][A
[36m(train_rnn_with_attention_r

== Status ==
Current time: 2025-06-04 20:06:22 (running for 00:01:46.36)
Using AsyncHyperBand: num_stopped=2
Bracket: Iter 8.000: None | Iter 4.000: None | Iter 2.000: None | Iter 1.000: 0.8734375
Logical resource usage: 4.0/4 CPUs, 0/0 GPUs
Result logdir: /tmp/ray/session_2025-06-04_20-04-33_195499_39160/artifacts/2025-06-04_20-04-36/train_rnn_with_attention_ray_2025-06-04_20-04-36/driver_artifacts
Number of trials: 10/10 (2 PENDING, 4 RUNNING, 4 TERMINATED)
+------------------------------------------+------------+-----------------+-----------+---------------+-------------+--------------+----------------------+
| Trial name                               | status     | loc             |   dropout |   hidden_size |          lr |   num_layers |   training_iteration |
|------------------------------------------+------------+-----------------+-----------+---------------+-------------+--------------+----------------------|
| train_rnn_with_attention_ray_23c00_00000 | RUNNING    | 10.0.0.13:

[36m(train_rnn_with_attention_ray pid=39510)[0m 
 15%|[38;2;30;71;6m█▍        [0m| 12/81 [00:01<00:11,  6.26it/s][A
[36m(train_rnn_with_attention_ray pid=39513)[0m 
 59%|[38;2;30;71;6m█████▉    [0m| 48/81 [00:06<00:04,  6.70it/s][A
[36m(train_rnn_with_attention_ray pid=39867)[0m 
 15%|[38;2;30;71;6m█▍        [0m| 12/81 [00:00<00:01, 35.74it/s][A
[36m(train_rnn_with_attention_ray pid=39510)[0m 
 16%|[38;2;30;71;6m█▌        [0m| 13/81 [00:02<00:10,  6.38it/s][A
[36m(train_rnn_with_attention_ray pid=39513)[0m 
 60%|[38;2;30;71;6m██████    [0m| 49/81 [00:07<00:05,  6.38it/s][A
[36m(train_rnn_with_attention_ray pid=39867)[0m 
 20%|[38;2;30;71;6m█▉        [0m| 16/81 [00:00<00:01, 35.08it/s][A
[36m(train_rnn_with_attention_ray pid=39867)[0m 
 26%|[38;2;30;71;6m██▌       [0m| 21/81 [00:00<00:01, 36.64it/s][A
[36m(train_rnn_with_attention_ray pid=39510)[0m 
 17%|[38;2;30;71;6m█▋        [0m| 14/81 [00:02<00:10,  6.22it/s][A
[36m(train_rnn_with_attention_r

== Status ==
Current time: 2025-06-04 20:06:27 (running for 00:01:51.42)
Using AsyncHyperBand: num_stopped=2
Bracket: Iter 8.000: None | Iter 4.000: None | Iter 2.000: None | Iter 1.000: 0.8734375
Logical resource usage: 4.0/4 CPUs, 0/0 GPUs
Result logdir: /tmp/ray/session_2025-06-04_20-04-33_195499_39160/artifacts/2025-06-04_20-04-36/train_rnn_with_attention_ray_2025-06-04_20-04-36/driver_artifacts
Number of trials: 10/10 (2 PENDING, 4 RUNNING, 4 TERMINATED)
+------------------------------------------+------------+-----------------+-----------+---------------+-------------+--------------+----------------------+
| Trial name                               | status     | loc             |   dropout |   hidden_size |          lr |   num_layers |   training_iteration |
|------------------------------------------+------------+-----------------+-----------+---------------+-------------+--------------+----------------------|
| train_rnn_with_attention_ray_23c00_00000 | RUNNING    | 10.0.0.13:

[36m(train_rnn_with_attention_ray pid=39510)[0m 
 54%|[38;2;30;71;6m█████▍    [0m| 44/81 [00:07<00:05,  6.26it/s][A
[36m(train_rnn_with_attention_ray pid=39513)[0m 
100%|[38;2;30;71;6m██████████[0m| 81/81 [00:11<00:00,  6.75it/s][A
[36m(train_rnn_with_attention_ray pid=39867)[0m 
 20%|[38;2;30;71;6m█▉        [0m| 16/81 [00:00<00:01, 34.52it/s][A
[36m(train_rnn_with_attention_ray pid=39948)[0m 
 52%|[38;2;30;71;6m█████▏    [0m| 42/81 [00:02<00:02, 14.67it/s][A
[36m(train_rnn_with_attention_ray pid=39510)[0m 
 56%|[38;2;30;71;6m█████▌    [0m| 45/81 [00:07<00:05,  6.55it/s][A
[36m(train_rnn_with_attention_ray pid=39867)[0m 
 25%|[38;2;30;71;6m██▍       [0m| 20/81 [00:00<00:01, 32.43it/s][A
[36m(train_rnn_with_attention_ray pid=39948)[0m 
 54%|[38;2;30;71;6m█████▍    [0m| 44/81 [00:03<00:02, 14.46it/s][A
[36m(train_rnn_with_attention_ray pid=39510)[0m 
 57%|[38;2;30;71;6m█████▋    [0m| 46/81 [00:07<00:05,  6.90it/s][A
[36m(train_rnn_with_attention_r

[36m(train_rnn_with_attention_ray pid=39867)[0m !!!!!!!!!!!!!! DEBUG metrics dict: {'Accuracy': 0.928125}


[36m(train_rnn_with_attention_ray pid=39513)[0m 
 33%|[38;2;30;71;6m███▎      [0m| 27/81 [00:04<00:07,  6.79it/s][A
[36m(train_rnn_with_attention_ray pid=39948)[0m 
 37%|[38;2;30;71;6m███▋      [0m| 30/81 [00:01<00:03, 15.64it/s][A
[36m(train_rnn_with_attention_ray pid=39510)[0m 
 94%|[38;2;30;71;6m█████████▍[0m| 76/81 [00:11<00:00,  7.12it/s][A
[36m(train_rnn_with_attention_ray pid=39948)[0m 
 40%|[38;2;30;71;6m███▉      [0m| 32/81 [00:02<00:03, 16.06it/s][A


== Status ==
Current time: 2025-06-04 20:06:32 (running for 00:01:56.42)
Using AsyncHyperBand: num_stopped=2
Bracket: Iter 8.000: None | Iter 4.000: None | Iter 2.000: None | Iter 1.000: 0.91875
Logical resource usage: 3.0/4 CPUs, 0/0 GPUs
Result logdir: /tmp/ray/session_2025-06-04_20-04-33_195499_39160/artifacts/2025-06-04_20-04-36/train_rnn_with_attention_ray_2025-06-04_20-04-36/driver_artifacts
Number of trials: 10/10 (2 PENDING, 3 RUNNING, 5 TERMINATED)
+------------------------------------------+------------+-----------------+-----------+---------------+-------------+--------------+----------------------+
| Trial name                               | status     | loc             |   dropout |   hidden_size |          lr |   num_layers |   training_iteration |
|------------------------------------------+------------+-----------------+-----------+---------------+-------------+--------------+----------------------|
| train_rnn_with_attention_ray_23c00_00000 | RUNNING    | 10.0.0.13:39

[36m(train_rnn_with_attention_ray pid=39513)[0m 
 35%|[38;2;30;71;6m███▍      [0m| 28/81 [00:04<00:08,  6.46it/s][A
[36m(train_rnn_with_attention_ray pid=39948)[0m 
 42%|[38;2;30;71;6m████▏     [0m| 34/81 [00:02<00:02, 16.14it/s][A
[36m(train_rnn_with_attention_ray pid=39510)[0m 
 96%|[38;2;30;71;6m█████████▋[0m| 78/81 [00:12<00:00,  7.76it/s][A
[36m(train_rnn_with_attention_ray pid=39513)[0m 
 36%|[38;2;30;71;6m███▌      [0m| 29/81 [00:04<00:08,  6.47it/s][A
[36m(train_rnn_with_attention_ray pid=39510)[0m 
 98%|[38;2;30;71;6m█████████▊[0m| 79/81 [00:12<00:00,  7.33it/s][A
[36m(train_rnn_with_attention_ray pid=39948)[0m 
 44%|[38;2;30;71;6m████▍     [0m| 36/81 [00:02<00:02, 15.66it/s][A
[36m(train_rnn_with_attention_ray pid=39510)[0m 
 99%|[38;2;30;71;6m█████████▉[0m| 80/81 [00:12<00:00,  7.27it/s][A
[36m(train_rnn_with_attention_ray pid=39513)[0m 
 37%|[38;2;30;71;6m███▋      [0m| 30/81 [00:04<00:07,  6.48it/s][A
[36m(train_rnn_with_attention_r

== Status ==
Current time: 2025-06-04 20:06:37 (running for 00:02:01.48)
Using AsyncHyperBand: num_stopped=2
Bracket: Iter 8.000: None | Iter 4.000: None | Iter 2.000: None | Iter 1.000: 0.91875
Logical resource usage: 4.0/4 CPUs, 0/0 GPUs
Result logdir: /tmp/ray/session_2025-06-04_20-04-33_195499_39160/artifacts/2025-06-04_20-04-36/train_rnn_with_attention_ray_2025-06-04_20-04-36/driver_artifacts
Number of trials: 10/10 (2 PENDING, 3 RUNNING, 5 TERMINATED)
+------------------------------------------+------------+-----------------+-----------+---------------+-------------+--------------+----------------------+
| Trial name                               | status     | loc             |   dropout |   hidden_size |          lr |   num_layers |   training_iteration |
|------------------------------------------+------------+-----------------+-----------+---------------+-------------+--------------+----------------------|
| train_rnn_with_attention_ray_23c00_00000 | RUNNING    | 10.0.0.13:39

[36m(train_rnn_with_attention_ray pid=39510)[0m 
 26%|[38;2;30;71;6m██▌       [0m| 21/81 [00:03<00:07,  7.75it/s][A
[36m(train_rnn_with_attention_ray pid=39513)[0m 
 78%|[38;2;30;71;6m███████▊  [0m| 63/81 [00:09<00:02,  7.56it/s][A
[36m(train_rnn_with_attention_ray pid=39513)[0m 
 79%|[38;2;30;71;6m███████▉  [0m| 64/81 [00:09<00:02,  7.58it/s][A
[36m(train_rnn_with_attention_ray pid=39948)[0m 
 15%|[38;2;30;71;6m█▍        [0m| 12/81 [00:00<00:04, 14.25it/s][A
[36m(train_rnn_with_attention_ray pid=39510)[0m 
 27%|[38;2;30;71;6m██▋       [0m| 22/81 [00:03<00:08,  7.18it/s][A
[36m(train_rnn_with_attention_ray pid=39513)[0m 
 80%|[38;2;30;71;6m████████  [0m| 65/81 [00:09<00:02,  7.68it/s][A
[36m(train_rnn_with_attention_ray pid=39948)[0m 
 17%|[38;2;30;71;6m█▋        [0m| 14/81 [00:00<00:04, 14.25it/s][A
[36m(train_rnn_with_attention_ray pid=39510)[0m 
 28%|[38;2;30;71;6m██▊       [0m| 23/81 [00:03<00:07,  7.29it/s][A
[36m(train_rnn_with_attention_r

== Status ==
Current time: 2025-06-04 20:06:43 (running for 00:02:06.53)
Using AsyncHyperBand: num_stopped=2
Bracket: Iter 8.000: None | Iter 4.000: None | Iter 2.000: None | Iter 1.000: 0.91875
Logical resource usage: 4.0/4 CPUs, 0/0 GPUs
Result logdir: /tmp/ray/session_2025-06-04_20-04-33_195499_39160/artifacts/2025-06-04_20-04-36/train_rnn_with_attention_ray_2025-06-04_20-04-36/driver_artifacts
Number of trials: 10/10 (2 PENDING, 3 RUNNING, 5 TERMINATED)
+------------------------------------------+------------+-----------------+-----------+---------------+-------------+--------------+----------------------+
| Trial name                               | status     | loc             |   dropout |   hidden_size |          lr |   num_layers |   training_iteration |
|------------------------------------------+------------+-----------------+-----------+---------------+-------------+--------------+----------------------|
| train_rnn_with_attention_ray_23c00_00000 | RUNNING    | 10.0.0.13:39

[36m(train_rnn_with_attention_ray pid=39510)[0m 
 68%|[38;2;30;71;6m██████▊   [0m| 55/81 [00:08<00:03,  6.92it/s][A
[36m(train_rnn_with_attention_ray pid=39513)[0m 
 19%|[38;2;30;71;6m█▊        [0m| 15/81 [00:01<00:08,  7.92it/s][A
100%|[38;2;30;71;6m██████████[0m| 81/81 [00:05<00:00, 14.19it/s]
[36m(train_rnn_with_attention_ray pid=39510)[0m 
 69%|[38;2;30;71;6m██████▉   [0m| 56/81 [00:08<00:03,  7.27it/s][A
[36m(train_rnn_with_attention_ray pid=39513)[0m 
 20%|[38;2;30;71;6m█▉        [0m| 16/81 [00:02<00:08,  7.73it/s][A
[36m(train_rnn_with_attention_ray pid=39510)[0m 
 70%|[38;2;30;71;6m███████   [0m| 57/81 [00:08<00:03,  7.58it/s][A
[36m(train_rnn_with_attention_ray pid=39513)[0m 
 21%|[38;2;30;71;6m██        [0m| 17/81 [00:02<00:08,  7.62it/s][A
[36m(train_rnn_with_attention_ray pid=39510)[0m 
 72%|[38;2;30;71;6m███████▏  [0m| 58/81 [00:08<00:02,  7.73it/s][A
 30%|[38;2;30;71;6m███       [0m| 3/10 [00:18<00:42,  6.13s/it]
  0%|[38;2;30;71;6m

== Status ==
Current time: 2025-06-04 20:06:48 (running for 00:02:11.54)
Using AsyncHyperBand: num_stopped=2
Bracket: Iter 8.000: None | Iter 4.000: None | Iter 2.000: None | Iter 1.000: 0.91875
Logical resource usage: 4.0/4 CPUs, 0/0 GPUs
Result logdir: /tmp/ray/session_2025-06-04_20-04-33_195499_39160/artifacts/2025-06-04_20-04-36/train_rnn_with_attention_ray_2025-06-04_20-04-36/driver_artifacts
Number of trials: 10/10 (1 PENDING, 4 RUNNING, 5 TERMINATED)
+------------------------------------------+------------+-----------------+-----------+---------------+-------------+--------------+----------------------+
| Trial name                               | status     | loc             |   dropout |   hidden_size |          lr |   num_layers |   training_iteration |
|------------------------------------------+------------+-----------------+-----------+---------------+-------------+--------------+----------------------|
| train_rnn_with_attention_ray_23c00_00000 | RUNNING    | 10.0.0.13:39

[36m(train_rnn_with_attention_ray pid=39510)[0m 
  5%|[38;2;30;71;6m▍         [0m| 4/81 [00:00<00:12,  5.97it/s][A
[36m(train_rnn_with_attention_ray pid=39513)[0m 
 65%|[38;2;30;71;6m██████▌   [0m| 53/81 [00:07<00:03,  7.07it/s][A
[36m(train_rnn_with_attention_ray pid=39948)[0m 
 86%|[38;2;30;71;6m████████▋ [0m| 70/81 [00:04<00:00, 13.71it/s][A
[36m(train_rnn_with_attention_ray pid=39510)[0m 
  6%|[38;2;30;71;6m▌         [0m| 5/81 [00:00<00:13,  5.84it/s][A
[36m(train_rnn_with_attention_ray pid=39513)[0m 
 67%|[38;2;30;71;6m██████▋   [0m| 54/81 [00:07<00:03,  7.35it/s][A
[36m(train_rnn_with_attention_ray pid=39948)[0m 
 89%|[38;2;30;71;6m████████▉ [0m| 72/81 [00:05<00:00, 13.92it/s][A
[36m(train_rnn_with_attention_ray pid=39510)[0m 
  7%|[38;2;30;71;6m▋         [0m| 6/81 [00:00<00:11,  6.59it/s][A
  0%|[38;2;30;71;6m          [0m| 0/81 [00:00<?, ?it/s][A
[36m(train_rnn_with_attention_ray pid=39513)[0m 
 68%|[38;2;30;71;6m██████▊   [0m| 55/81 [0

== Status ==
Current time: 2025-06-04 20:06:53 (running for 00:02:16.59)
Using AsyncHyperBand: num_stopped=2
Bracket: Iter 8.000: None | Iter 4.000: None | Iter 2.000: None | Iter 1.000: 0.91875
Logical resource usage: 4.0/4 CPUs, 0/0 GPUs
Result logdir: /tmp/ray/session_2025-06-04_20-04-33_195499_39160/artifacts/2025-06-04_20-04-36/train_rnn_with_attention_ray_2025-06-04_20-04-36/driver_artifacts
Number of trials: 10/10 (1 PENDING, 4 RUNNING, 5 TERMINATED)
+------------------------------------------+------------+-----------------+-----------+---------------+-------------+--------------+----------------------+
| Trial name                               | status     | loc             |   dropout |   hidden_size |          lr |   num_layers |   training_iteration |
|------------------------------------------+------------+-----------------+-----------+---------------+-------------+--------------+----------------------|
| train_rnn_with_attention_ray_23c00_00000 | RUNNING    | 10.0.0.13:39

[36m(train_rnn_with_attention_ray pid=39510)[0m 
 44%|[38;2;30;71;6m████▍     [0m| 36/81 [00:05<00:07,  5.97it/s][A
[36m(train_rnn_with_attention_ray pid=39948)[0m 
 69%|[38;2;30;71;6m██████▉   [0m| 56/81 [00:03<00:01, 14.70it/s][A
 10%|[38;2;30;71;6m█         [0m| 1/10 [00:03<00:30,  3.36s/it]
[36m(train_rnn_with_attention_ray pid=39510)[0m 
 46%|[38;2;30;71;6m████▌     [0m| 37/81 [00:05<00:06,  6.42it/s][A
[36m(train_rnn_with_attention_ray pid=40026)[0m 
  4%|[38;2;30;71;6m▎         [0m| 3/81 [00:00<00:02, 28.03it/s][A
[36m(train_rnn_with_attention_ray pid=39948)[0m 
 72%|[38;2;30;71;6m███████▏  [0m| 58/81 [00:04<00:01, 13.74it/s][A


[36m(train_rnn_with_attention_ray pid=39513)[0m !!!!!!!!!!!!!! DEBUG metrics dict: {'Accuracy': 0.96875}


[36m(train_rnn_with_attention_ray pid=39510)[0m 
 48%|[38;2;30;71;6m████▊     [0m| 39/81 [00:05<00:05,  7.67it/s][A
[36m(train_rnn_with_attention_ray pid=39948)[0m 
 74%|[38;2;30;71;6m███████▍  [0m| 60/81 [00:04<00:01, 13.73it/s][A
[36m(train_rnn_with_attention_ray pid=40026)[0m 
  7%|[38;2;30;71;6m▋         [0m| 6/81 [00:00<00:02, 25.68it/s][A
[36m(train_rnn_with_attention_ray pid=39948)[0m 
 77%|[38;2;30;71;6m███████▋  [0m| 62/81 [00:04<00:01, 14.04it/s][A
[36m(train_rnn_with_attention_ray pid=40026)[0m 
 11%|[38;2;30;71;6m█         [0m| 9/81 [00:00<00:02, 25.87it/s][A
[36m(train_rnn_with_attention_ray pid=39510)[0m 
 51%|[38;2;30;71;6m█████     [0m| 41/81 [00:06<00:04,  8.29it/s][A
[36m(train_rnn_with_attention_ray pid=40026)[0m 
 16%|[38;2;30;71;6m█▌        [0m| 13/81 [00:00<00:02, 30.55it/s][A
[36m(train_rnn_with_attention_ray pid=39948)[0m 
 79%|[38;2;30;71;6m███████▉  [0m| 64/81 [00:04<00:01, 14.05it/s][A
[36m(train_rnn_with_attention_ray

== Status ==
Current time: 2025-06-04 20:06:58 (running for 00:02:21.62)
Using AsyncHyperBand: num_stopped=2
Bracket: Iter 8.000: None | Iter 4.000: None | Iter 2.000: None | Iter 1.000: 0.9234374999999999
Logical resource usage: 4.0/4 CPUs, 0/0 GPUs
Result logdir: /tmp/ray/session_2025-06-04_20-04-33_195499_39160/artifacts/2025-06-04_20-04-36/train_rnn_with_attention_ray_2025-06-04_20-04-36/driver_artifacts
Number of trials: 10/10 (1 PENDING, 3 RUNNING, 6 TERMINATED)
+------------------------------------------+------------+-----------------+-----------+---------------+-------------+--------------+----------------------+
| Trial name                               | status     | loc             |   dropout |   hidden_size |          lr |   num_layers |   training_iteration |
|------------------------------------------+------------+-----------------+-----------+---------------+-------------+--------------+----------------------|
| train_rnn_with_attention_ray_23c00_00000 | RUNNING    | 1

[36m(train_rnn_with_attention_ray pid=39510)[0m 
 86%|[38;2;30;71;6m████████▋ [0m| 70/81 [00:10<00:01,  7.01it/s][A
[36m(train_rnn_with_attention_ray pid=39948)[0m 
 37%|[38;2;30;71;6m███▋      [0m| 30/81 [00:02<00:03, 13.14it/s][A
[36m(train_rnn_with_attention_ray pid=40026)[0m 
 60%|[38;2;30;71;6m██████    [0m| 49/81 [00:01<00:01, 28.44it/s][A
[36m(train_rnn_with_attention_ray pid=39948)[0m 
 40%|[38;2;30;71;6m███▉      [0m| 32/81 [00:02<00:03, 13.31it/s][A
[36m(train_rnn_with_attention_ray pid=40026)[0m 
 64%|[38;2;30;71;6m██████▍   [0m| 52/81 [00:01<00:01, 27.55it/s][A
[36m(train_rnn_with_attention_ray pid=39510)[0m 
 88%|[38;2;30;71;6m████████▊ [0m| 71/81 [00:10<00:01,  6.38it/s][A
[36m(train_rnn_with_attention_ray pid=39948)[0m 
 42%|[38;2;30;71;6m████▏     [0m| 34/81 [00:02<00:03, 13.74it/s][A
[36m(train_rnn_with_attention_ray pid=40026)[0m 
 68%|[38;2;30;71;6m██████▊   [0m| 55/81 [00:01<00:00, 27.71it/s][A
[36m(train_rnn_with_attention_r

[36m(train_rnn_with_attention_ray pid=39510)[0m !!!!!!!!!!!!!! DEBUG metrics dict: {'Accuracy': 0.8921875}


[36m(train_rnn_with_attention_ray pid=39948)[0m 
 96%|[38;2;30;71;6m█████████▋[0m| 78/81 [00:06<00:00, 14.91it/s][A
[36m(train_rnn_with_attention_ray pid=40026)[0m 
 80%|[38;2;30;71;6m████████  [0m| 65/81 [00:02<00:00, 29.87it/s][A
[36m(train_rnn_with_attention_ray pid=39948)[0m 
100%|[38;2;30;71;6m██████████[0m| 81/81 [00:06<00:00, 13.01it/s][A
[36m(train_rnn_with_attention_ray pid=40026)[0m 
 84%|[38;2;30;71;6m████████▍ [0m| 68/81 [00:02<00:00, 29.83it/s][A
[36m(train_rnn_with_attention_ray pid=40026)[0m 
 90%|[38;2;30;71;6m█████████ [0m| 73/81 [00:02<00:00, 34.36it/s][A
[36m(train_rnn_with_attention_ray pid=40026)[0m 
100%|[38;2;30;71;6m██████████[0m| 81/81 [00:02<00:00, 30.80it/s][A
 60%|[38;2;30;71;6m██████    [0m| 6/10 [00:37<00:25,  6.28s/it]
 40%|[38;2;30;71;6m████      [0m| 4/10 [00:12<00:17,  2.99s/it]
[36m(train_rnn_with_attention_ray pid=39948)[0m 
  2%|[38;2;30;71;6m▏         [0m| 2/81 [00:00<00:05, 14.29it/s][A
[36m(train_rnn_with_a

== Status ==
Current time: 2025-06-04 20:07:03 (running for 00:02:26.68)
Using AsyncHyperBand: num_stopped=3
Bracket: Iter 8.000: None | Iter 4.000: None | Iter 2.000: None | Iter 1.000: 0.91875
Logical resource usage: 3.0/4 CPUs, 0/0 GPUs
Result logdir: /tmp/ray/session_2025-06-04_20-04-33_195499_39160/artifacts/2025-06-04_20-04-36/train_rnn_with_attention_ray_2025-06-04_20-04-36/driver_artifacts
Number of trials: 10/10 (1 PENDING, 2 RUNNING, 7 TERMINATED)
+------------------------------------------+------------+-----------------+-----------+---------------+-------------+--------------+----------------------+
| Trial name                               | status     | loc             |   dropout |   hidden_size |          lr |   num_layers |   training_iteration |
|------------------------------------------+------------+-----------------+-----------+---------------+-------------+--------------+----------------------|
| train_rnn_with_attention_ray_23c00_00007 | RUNNING    | 10.0.0.13:39

[36m(train_rnn_with_attention_ray pid=39948)[0m 
 22%|[38;2;30;71;6m██▏       [0m| 18/81 [00:01<00:03, 16.49it/s][A
[36m(train_rnn_with_attention_ray pid=40026)[0m 
 51%|[38;2;30;71;6m█████     [0m| 41/81 [00:00<00:00, 45.64it/s][A
[36m(train_rnn_with_attention_ray pid=40026)[0m 
 57%|[38;2;30;71;6m█████▋    [0m| 46/81 [00:01<00:00, 45.31it/s][A
[36m(train_rnn_with_attention_ray pid=39948)[0m 
 25%|[38;2;30;71;6m██▍       [0m| 20/81 [00:01<00:03, 16.21it/s][A
[36m(train_rnn_with_attention_ray pid=40026)[0m 
 63%|[38;2;30;71;6m██████▎   [0m| 51/81 [00:01<00:00, 44.52it/s][A
[36m(train_rnn_with_attention_ray pid=39948)[0m 
 27%|[38;2;30;71;6m██▋       [0m| 22/81 [00:01<00:03, 16.07it/s][A
[36m(train_rnn_with_attention_ray pid=40026)[0m 
 69%|[38;2;30;71;6m██████▉   [0m| 56/81 [00:01<00:00, 41.00it/s][A
[36m(train_rnn_with_attention_ray pid=39948)[0m 
 30%|[38;2;30;71;6m██▉       [0m| 24/81 [00:01<00:03, 16.60it/s][A
[36m(train_rnn_with_attention_r

== Status ==
Current time: 2025-06-04 20:07:08 (running for 00:02:31.68)
Using AsyncHyperBand: num_stopped=3
Bracket: Iter 8.000: None | Iter 4.000: None | Iter 2.000: None | Iter 1.000: 0.91875
Logical resource usage: 3.0/4 CPUs, 0/0 GPUs
Result logdir: /tmp/ray/session_2025-06-04_20-04-33_195499_39160/artifacts/2025-06-04_20-04-36/train_rnn_with_attention_ray_2025-06-04_20-04-36/driver_artifacts
Number of trials: 10/10 (3 RUNNING, 7 TERMINATED)
+------------------------------------------+------------+-----------------+-----------+---------------+-------------+--------------+----------------------+
| Trial name                               | status     | loc             |   dropout |   hidden_size |          lr |   num_layers |   training_iteration |
|------------------------------------------+------------+-----------------+-----------+---------------+-------------+--------------+----------------------|
| train_rnn_with_attention_ray_23c00_00007 | RUNNING    | 10.0.0.13:39948 | 0.254

[36m(train_rnn_with_attention_ray pid=39948)[0m 
 37%|[38;2;30;71;6m███▋      [0m| 30/81 [00:01<00:02, 21.33it/s][A
[36m(train_rnn_with_attention_ray pid=40026)[0m 
 53%|[38;2;30;71;6m█████▎    [0m| 43/81 [00:01<00:01, 35.29it/s][A
[36m(train_rnn_with_attention_ray pid=39948)[0m 
 41%|[38;2;30;71;6m████      [0m| 33/81 [00:01<00:02, 20.71it/s][A
[36m(train_rnn_with_attention_ray pid=40026)[0m 
 59%|[38;2;30;71;6m█████▉    [0m| 48/81 [00:01<00:00, 36.94it/s][A
[36m(train_rnn_with_attention_ray pid=40101)[0m 2025-06-04 20:07:08.295 | INFO     | mltrainer.trainer:__init__:68 - Found earlystop_kwargs in settings.Set to None if you dont want earlystopping.
[36m(train_rnn_with_attention_ray pid=40026)[0m 
 65%|[38;2;30;71;6m██████▌   [0m| 53/81 [00:01<00:00, 38.56it/s][A
  0%|[38;2;30;71;6m          [0m| 0/10 [00:00<?, ?it/s]
[36m(train_rnn_with_attention_ray pid=39948)[0m 
 44%|[38;2;30;71;6m████▍     [0m| 36/81 [00:01<00:02, 18.15it/s][A
[36m(train_rnn_wi

== Status ==
Current time: 2025-06-04 20:07:13 (running for 00:02:36.72)
Using AsyncHyperBand: num_stopped=3
Bracket: Iter 8.000: None | Iter 4.000: None | Iter 2.000: None | Iter 1.000: 0.91875
Logical resource usage: 3.0/4 CPUs, 0/0 GPUs
Result logdir: /tmp/ray/session_2025-06-04_20-04-33_195499_39160/artifacts/2025-06-04_20-04-36/train_rnn_with_attention_ray_2025-06-04_20-04-36/driver_artifacts
Number of trials: 10/10 (3 RUNNING, 7 TERMINATED)
+------------------------------------------+------------+-----------------+-----------+---------------+-------------+--------------+----------------------+
| Trial name                               | status     | loc             |   dropout |   hidden_size |          lr |   num_layers |   training_iteration |
|------------------------------------------+------------+-----------------+-----------+---------------+-------------+--------------+----------------------|
| train_rnn_with_attention_ray_23c00_00007 | RUNNING    | 10.0.0.13:39948 | 0.254

[36m(train_rnn_with_attention_ray pid=39948)[0m 
 59%|[38;2;30;71;6m█████▉    [0m| 48/81 [00:01<00:01, 25.54it/s][A
[36m(train_rnn_with_attention_ray pid=40026)[0m 
 26%|[38;2;30;71;6m██▌       [0m| 21/81 [00:00<00:02, 27.80it/s][A
[36m(train_rnn_with_attention_ray pid=40101)[0m 
  9%|[38;2;30;71;6m▊         [0m| 7/81 [00:00<00:04, 18.32it/s][A
[36m(train_rnn_with_attention_ray pid=39948)[0m 
 63%|[38;2;30;71;6m██████▎   [0m| 51/81 [00:02<00:01, 25.50it/s][A
[36m(train_rnn_with_attention_ray pid=40026)[0m 
 30%|[38;2;30;71;6m██▉       [0m| 24/81 [00:00<00:02, 27.57it/s][A
[36m(train_rnn_with_attention_ray pid=40101)[0m 
 11%|[38;2;30;71;6m█         [0m| 9/81 [00:00<00:03, 18.37it/s][A
[36m(train_rnn_with_attention_ray pid=39948)[0m 
 67%|[38;2;30;71;6m██████▋   [0m| 54/81 [00:02<00:01, 26.38it/s][A
[36m(train_rnn_with_attention_ray pid=40026)[0m 
 33%|[38;2;30;71;6m███▎      [0m| 27/81 [00:01<00:01, 27.62it/s][A
[36m(train_rnn_with_attention_ray

== Status ==
Current time: 2025-06-04 20:07:18 (running for 00:02:41.76)
Using AsyncHyperBand: num_stopped=3
Bracket: Iter 8.000: None | Iter 4.000: None | Iter 2.000: None | Iter 1.000: 0.91875
Logical resource usage: 3.0/4 CPUs, 0/0 GPUs
Result logdir: /tmp/ray/session_2025-06-04_20-04-33_195499_39160/artifacts/2025-06-04_20-04-36/train_rnn_with_attention_ray_2025-06-04_20-04-36/driver_artifacts
Number of trials: 10/10 (3 RUNNING, 7 TERMINATED)
+------------------------------------------+------------+-----------------+-----------+---------------+-------------+--------------+----------------------+
| Trial name                               | status     | loc             |   dropout |   hidden_size |          lr |   num_layers |   training_iteration |
|------------------------------------------+------------+-----------------+-----------+---------------+-------------+--------------+----------------------|
| train_rnn_with_attention_ray_23c00_00007 | RUNNING    | 10.0.0.13:39948 | 0.254

[36m(train_rnn_with_attention_ray pid=39948)[0m 
 69%|[38;2;30;71;6m██████▉   [0m| 56/81 [00:03<00:01, 14.66it/s][A
100%|[38;2;30;71;6m██████████[0m| 10/10 [00:28<00:00,  2.86s/it]
[36m(train_rnn_with_attention_ray pid=40101)[0m 
 48%|[38;2;30;71;6m████▊     [0m| 39/81 [00:01<00:01, 22.14it/s][A





[36m(train_rnn_with_attention_ray pid=39948)[0m 
 72%|[38;2;30;71;6m███████▏  [0m| 58/81 [00:03<00:01, 15.33it/s][A
[36m(train_rnn_with_attention_ray pid=39948)[0m 
 74%|[38;2;30;71;6m███████▍  [0m| 60/81 [00:03<00:01, 16.43it/s][A
[36m(train_rnn_with_attention_ray pid=40101)[0m 
 52%|[38;2;30;71;6m█████▏    [0m| 42/81 [00:01<00:01, 22.02it/s][A
[36m(train_rnn_with_attention_ray pid=40101)[0m 
 56%|[38;2;30;71;6m█████▌    [0m| 45/81 [00:01<00:01, 22.34it/s][A
[36m(train_rnn_with_attention_ray pid=39948)[0m 
 78%|[38;2;30;71;6m███████▊  [0m| 63/81 [00:03<00:00, 19.23it/s][A
[36m(train_rnn_with_attention_ray pid=40101)[0m 
 59%|[38;2;30;71;6m█████▉    [0m| 48/81 [00:02<00:01, 23.12it/s][A
[36m(train_rnn_with_attention_ray pid=39948)[0m 
 81%|[38;2;30;71;6m████████▏ [0m| 66/81 [00:04<00:00, 21.33it/s][A
[36m(train_rnn_with_attention_ray pid=40101)[0m 
 63%|[38;2;30;71;6m██████▎   [0m| 51/81 [00:02<00:01, 24.35it/s][A
[36m(train_rnn_with_attention_r

[36m(train_rnn_with_attention_ray pid=39948)[0m !!!!!!!!!!!!!! DEBUG metrics dict: {'Accuracy': 0.9390625}


[36m(train_rnn_with_attention_ray pid=40101)[0m 
 93%|[38;2;30;71;6m█████████▎[0m| 75/81 [00:03<00:00, 24.19it/s][A
[36m(train_rnn_with_attention_ray pid=40101)[0m 
 96%|[38;2;30;71;6m█████████▋[0m| 78/81 [00:03<00:00, 24.49it/s][A
[36m(train_rnn_with_attention_ray pid=40101)[0m 
100%|[38;2;30;71;6m██████████[0m| 81/81 [00:03<00:00, 23.77it/s][A
 30%|[38;2;30;71;6m███       [0m| 3/10 [00:12<00:27,  3.93s/it]
[36m(train_rnn_with_attention_ray pid=40101)[0m 
  4%|[38;2;30;71;6m▎         [0m| 3/81 [00:00<00:03, 23.34it/s][A
[36m(train_rnn_with_attention_ray pid=40101)[0m 
  7%|[38;2;30;71;6m▋         [0m| 6/81 [00:00<00:03, 23.72it/s][A
[36m(train_rnn_with_attention_ray pid=40101)[0m 
 11%|[38;2;30;71;6m█         [0m| 9/81 [00:00<00:02, 24.15it/s][A
[36m(train_rnn_with_attention_ray pid=40101)[0m 
 15%|[38;2;30;71;6m█▍        [0m| 12/81 [00:00<00:02, 25.87it/s][A
[36m(train_rnn_with_attention_ray pid=40101)[0m 
 19%|[38;2;30;71;6m█▊        [0m| 15/

== Status ==
Current time: 2025-06-04 20:07:23 (running for 00:02:46.85)
Using AsyncHyperBand: num_stopped=3
Bracket: Iter 8.000: None | Iter 4.000: None | Iter 2.000: None | Iter 1.000: 0.928125
Logical resource usage: 1.0/4 CPUs, 0/0 GPUs
Result logdir: /tmp/ray/session_2025-06-04_20-04-33_195499_39160/artifacts/2025-06-04_20-04-36/train_rnn_with_attention_ray_2025-06-04_20-04-36/driver_artifacts
Number of trials: 10/10 (1 RUNNING, 9 TERMINATED)
+------------------------------------------+------------+-----------------+-----------+---------------+-------------+--------------+----------------------+
| Trial name                               | status     | loc             |   dropout |   hidden_size |          lr |   num_layers |   training_iteration |
|------------------------------------------+------------+-----------------+-----------+---------------+-------------+--------------+----------------------|
| train_rnn_with_attention_ray_23c00_00009 | RUNNING    | 10.0.0.13:40101 | 0.24

[36m(train_rnn_with_attention_ray pid=40101)[0m 
 95%|[38;2;30;71;6m█████████▌[0m| 77/81 [00:02<00:00, 27.59it/s][A
[36m(train_rnn_with_attention_ray pid=40101)[0m 
 99%|[38;2;30;71;6m█████████▉[0m| 80/81 [00:03<00:00, 26.96it/s][A
100%|[38;2;30;71;6m██████████[0m| 81/81 [00:03<00:00, 26.28it/s]
 40%|[38;2;30;71;6m████      [0m| 4/10 [00:15<00:22,  3.68s/it]
[36m(train_rnn_with_attention_ray pid=40101)[0m 
  4%|[38;2;30;71;6m▎         [0m| 3/81 [00:00<00:02, 28.24it/s][A
[36m(train_rnn_with_attention_ray pid=40101)[0m 
  7%|[38;2;30;71;6m▋         [0m| 6/81 [00:00<00:02, 26.65it/s][A
[36m(train_rnn_with_attention_ray pid=40101)[0m 
 11%|[38;2;30;71;6m█         [0m| 9/81 [00:00<00:02, 26.80it/s][A
[36m(train_rnn_with_attention_ray pid=40101)[0m 
 15%|[38;2;30;71;6m█▍        [0m| 12/81 [00:00<00:02, 27.93it/s][A
[36m(train_rnn_with_attention_ray pid=40101)[0m 
 19%|[38;2;30;71;6m█▊        [0m| 15/81 [00:00<00:02, 27.32it/s][A
[36m(train_rnn_with_at

== Status ==
Current time: 2025-06-04 20:07:28 (running for 00:02:51.89)
Using AsyncHyperBand: num_stopped=3
Bracket: Iter 8.000: None | Iter 4.000: None | Iter 2.000: None | Iter 1.000: 0.928125
Logical resource usage: 1.0/4 CPUs, 0/0 GPUs
Result logdir: /tmp/ray/session_2025-06-04_20-04-33_195499_39160/artifacts/2025-06-04_20-04-36/train_rnn_with_attention_ray_2025-06-04_20-04-36/driver_artifacts
Number of trials: 10/10 (1 RUNNING, 9 TERMINATED)
+------------------------------------------+------------+-----------------+-----------+---------------+-------------+--------------+----------------------+
| Trial name                               | status     | loc             |   dropout |   hidden_size |          lr |   num_layers |   training_iteration |
|------------------------------------------+------------+-----------------+-----------+---------------+-------------+--------------+----------------------|
| train_rnn_with_attention_ray_23c00_00009 | RUNNING    | 10.0.0.13:40101 | 0.24

[36m(train_rnn_with_attention_ray pid=40101)[0m 
 44%|[38;2;30;71;6m████▍     [0m| 36/81 [00:01<00:01, 25.12it/s][A
[36m(train_rnn_with_attention_ray pid=40101)[0m 
 48%|[38;2;30;71;6m████▊     [0m| 39/81 [00:01<00:01, 25.28it/s][A
[36m(train_rnn_with_attention_ray pid=40101)[0m 
 52%|[38;2;30;71;6m█████▏    [0m| 42/81 [00:01<00:01, 25.52it/s][A
[36m(train_rnn_with_attention_ray pid=40101)[0m 
 56%|[38;2;30;71;6m█████▌    [0m| 45/81 [00:01<00:01, 26.15it/s][A
[36m(train_rnn_with_attention_ray pid=40101)[0m 
 59%|[38;2;30;71;6m█████▉    [0m| 48/81 [00:01<00:01, 25.70it/s][A
[36m(train_rnn_with_attention_ray pid=40101)[0m 
 63%|[38;2;30;71;6m██████▎   [0m| 51/81 [00:02<00:01, 26.18it/s][A
[36m(train_rnn_with_attention_ray pid=40101)[0m 
 67%|[38;2;30;71;6m██████▋   [0m| 54/81 [00:02<00:01, 26.98it/s][A
[36m(train_rnn_with_attention_ray pid=40101)[0m 
 70%|[38;2;30;71;6m███████   [0m| 57/81 [00:02<00:00, 26.56it/s][A
[36m(train_rnn_with_attention_r

== Status ==
Current time: 2025-06-04 20:07:33 (running for 00:02:56.93)
Using AsyncHyperBand: num_stopped=3
Bracket: Iter 8.000: None | Iter 4.000: None | Iter 2.000: None | Iter 1.000: 0.928125
Logical resource usage: 1.0/4 CPUs, 0/0 GPUs
Result logdir: /tmp/ray/session_2025-06-04_20-04-33_195499_39160/artifacts/2025-06-04_20-04-36/train_rnn_with_attention_ray_2025-06-04_20-04-36/driver_artifacts
Number of trials: 10/10 (1 RUNNING, 9 TERMINATED)
+------------------------------------------+------------+-----------------+-----------+---------------+-------------+--------------+----------------------+
| Trial name                               | status     | loc             |   dropout |   hidden_size |          lr |   num_layers |   training_iteration |
|------------------------------------------+------------+-----------------+-----------+---------------+-------------+--------------+----------------------|
| train_rnn_with_attention_ray_23c00_00009 | RUNNING    | 10.0.0.13:40101 | 0.24

[36m(train_rnn_with_attention_ray pid=40101)[0m 
 98%|[38;2;30;71;6m█████████▊[0m| 79/81 [00:02<00:00, 25.98it/s][A
100%|[38;2;30;71;6m██████████[0m| 81/81 [00:03<00:00, 26.35it/s]
[36m(train_rnn_with_attention_ray pid=40101)[0m 2025-06-04 20:07:33.799 | INFO     | mltrainer.trainer:report:209 - Epoch 6 train 0.1361 test 0.1202 metric ['0.9766']
 70%|[38;2;30;71;6m███████   [0m| 7/10 [00:25<00:10,  3.44s/it]
  0%|[38;2;30;71;6m          [0m| 0/81 [00:00<?, ?it/s][A
[36m(train_rnn_with_attention_ray pid=40101)[0m 
  4%|[38;2;30;71;6m▎         [0m| 3/81 [00:00<00:03, 21.08it/s][A
[36m(train_rnn_with_attention_ray pid=40101)[0m 
  7%|[38;2;30;71;6m▋         [0m| 6/81 [00:00<00:03, 23.97it/s][A
[36m(train_rnn_with_attention_ray pid=40101)[0m 
 11%|[38;2;30;71;6m█         [0m| 9/81 [00:00<00:02, 25.46it/s][A
[36m(train_rnn_with_attention_ray pid=40101)[0m 
 15%|[38;2;30;71;6m█▍        [0m| 12/81 [00:00<00:02, 26.00it/s][A
[36m(train_rnn_with_attention_ray 

== Status ==
Current time: 2025-06-04 20:07:38 (running for 00:03:01.96)
Using AsyncHyperBand: num_stopped=3
Bracket: Iter 8.000: None | Iter 4.000: None | Iter 2.000: None | Iter 1.000: 0.928125
Logical resource usage: 1.0/4 CPUs, 0/0 GPUs
Result logdir: /tmp/ray/session_2025-06-04_20-04-33_195499_39160/artifacts/2025-06-04_20-04-36/train_rnn_with_attention_ray_2025-06-04_20-04-36/driver_artifacts
Number of trials: 10/10 (1 RUNNING, 9 TERMINATED)
+------------------------------------------+------------+-----------------+-----------+---------------+-------------+--------------+----------------------+
| Trial name                               | status     | loc             |   dropout |   hidden_size |          lr |   num_layers |   training_iteration |
|------------------------------------------+------------+-----------------+-----------+---------------+-------------+--------------+----------------------|
| train_rnn_with_attention_ray_23c00_00009 | RUNNING    | 10.0.0.13:40101 | 0.24

[36m(train_rnn_with_attention_ray pid=40101)[0m 
 40%|[38;2;30;71;6m███▉      [0m| 32/81 [00:01<00:01, 25.37it/s][A
[36m(train_rnn_with_attention_ray pid=40101)[0m 
 43%|[38;2;30;71;6m████▎     [0m| 35/81 [00:01<00:01, 25.72it/s][A
[36m(train_rnn_with_attention_ray pid=40101)[0m 
 47%|[38;2;30;71;6m████▋     [0m| 38/81 [00:01<00:01, 26.66it/s][A
[36m(train_rnn_with_attention_ray pid=40101)[0m 
 51%|[38;2;30;71;6m█████     [0m| 41/81 [00:01<00:01, 26.74it/s][A
[36m(train_rnn_with_attention_ray pid=40101)[0m 
 54%|[38;2;30;71;6m█████▍    [0m| 44/81 [00:01<00:01, 26.56it/s][A
[36m(train_rnn_with_attention_ray pid=40101)[0m 
 58%|[38;2;30;71;6m█████▊    [0m| 47/81 [00:01<00:01, 26.77it/s][A
[36m(train_rnn_with_attention_ray pid=40101)[0m 
 62%|[38;2;30;71;6m██████▏   [0m| 50/81 [00:01<00:01, 24.85it/s][A
[36m(train_rnn_with_attention_ray pid=40101)[0m 
 65%|[38;2;30;71;6m██████▌   [0m| 53/81 [00:02<00:01, 25.42it/s][A
[36m(train_rnn_with_attention_r

== Status ==
Current time: 2025-06-04 20:07:43 (running for 00:03:06.99)
Using AsyncHyperBand: num_stopped=3
Bracket: Iter 8.000: None | Iter 4.000: None | Iter 2.000: None | Iter 1.000: 0.928125
Logical resource usage: 1.0/4 CPUs, 0/0 GPUs
Result logdir: /tmp/ray/session_2025-06-04_20-04-33_195499_39160/artifacts/2025-06-04_20-04-36/train_rnn_with_attention_ray_2025-06-04_20-04-36/driver_artifacts
Number of trials: 10/10 (1 RUNNING, 9 TERMINATED)
+------------------------------------------+------------+-----------------+-----------+---------------+-------------+--------------+----------------------+
| Trial name                               | status     | loc             |   dropout |   hidden_size |          lr |   num_layers |   training_iteration |
|------------------------------------------+------------+-----------------+-----------+---------------+-------------+--------------+----------------------|
| train_rnn_with_attention_ray_23c00_00009 | RUNNING    | 10.0.0.13:40101 | 0.24

[36m(train_rnn_with_attention_ray pid=40101)[0m 
 99%|[38;2;30;71;6m█████████▉[0m| 80/81 [00:02<00:00, 25.94it/s][A
100%|[38;2;30;71;6m██████████[0m| 81/81 [00:03<00:00, 26.76it/s]
[36m(train_rnn_with_attention_ray pid=40101)[0m 2025-06-04 20:07:43.831 | INFO     | mltrainer.trainer:report:209 - Epoch 9 train 0.1506 test 0.2549 metric ['0.9219']
[36m(train_rnn_with_attention_ray pid=40101)[0m 2025-06-04 20:07:43.831 | INFO     | mltrainer.trainer:__call__:252 - best loss: 0.1094, current loss 0.2549.Counter 1/5.
100%|[38;2;30;71;6m██████████[0m| 10/10 [00:35<00:00,  3.55s/it]
2025-06-04 20:07:44,040	INFO tune.py:1009 -- Wrote the latest version of all result files and experiment state to '/home/azureuser/ray_results/train_rnn_with_attention_ray_2025-06-04_20-04-36' in 0.0059s.
2025-06-04 20:07:44,045	INFO tune.py:1041 -- Total run time: 187.56 seconds (187.53 seconds for the tuning loop).


[36m(train_rnn_with_attention_ray pid=40101)[0m !!!!!!!!!!!!!! DEBUG metrics dict: {'Accuracy': 0.9203125}
== Status ==
Current time: 2025-06-04 20:07:44 (running for 00:03:07.53)
Using AsyncHyperBand: num_stopped=4
Bracket: Iter 8.000: None | Iter 4.000: None | Iter 2.000: None | Iter 1.000: 0.92421875
Logical resource usage: 1.0/4 CPUs, 0/0 GPUs
Result logdir: /tmp/ray/session_2025-06-04_20-04-33_195499_39160/artifacts/2025-06-04_20-04-36/train_rnn_with_attention_ray_2025-06-04_20-04-36/driver_artifacts
Number of trials: 10/10 (10 TERMINATED)
+------------------------------------------+------------+-----------------+-----------+---------------+-------------+--------------+----------------------+
| Trial name                               | status     | loc             |   dropout |   hidden_size |          lr |   num_layers |   training_iteration |
|------------------------------------------+------------+-----------------+-----------+---------------+-------------+--------------+---

In [11]:
best_result = result.get_best_config(metric="Accuracy", mode="max")

best_trial = result.get_best_trial(metric="Accuracy", mode="max", scope="all")
best_accuracy = best_trial.last_result["Accuracy"]

print(best_result)
print("Beste Accuracy:", best_accuracy)

{'hidden_size': 256, 'num_layers': 5, 'dropout': 0.1846677432423266, 'lr': 0.00028152890123466114}
Beste Accuracy: 0.96875
