# Libraries and Drive

In [1]:
# Imports first (stdlib, then third-party, then the Colab-only helper),
# side effects afterwards.
import os

import numpy as np
import pandas as pd
from google.colab import drive

# Attach Google Drive and make the project folder the working directory,
# so that every relative path used later in the notebook resolves inside it.
drive.mount("/content/drive", force_remount=True)
os.chdir('/content/drive/My Drive/Volatility_forecasting/')

Mounted at /content/drive


In [2]:
!pip install neuralforecast dask[dataframe]
import os
os.environ['NIXTLA_ID_AS_COL'] = '1'

Collecting neuralforecast
  Downloading neuralforecast-1.7.5-py3-none-any.whl.metadata (14 kB)
Collecting coreforecast>=0.0.6 (from neuralforecast)
  Downloading coreforecast-0.0.15-cp310-cp310-manylinux_2_17_x86_64.manylinux2014_x86_64.whl.metadata (3.8 kB)
Collecting pytorch-lightning>=2.0.0 (from neuralforecast)
  Downloading pytorch_lightning-2.4.0-py3-none-any.whl.metadata (21 kB)
Collecting ray>=2.2.0 (from ray[tune]>=2.2.0->neuralforecast)
  Downloading ray-2.39.0-cp310-cp310-manylinux2014_x86_64.whl.metadata (17 kB)
Collecting optuna (from neuralforecast)
  Downloading optuna-4.1.0-py3-none-any.whl.metadata (16 kB)
Collecting utilsforecast>=0.0.25 (from neuralforecast)
  Downloading utilsforecast-0.2.8-py3-none-any.whl.metadata (7.4 kB)
Collecting dask-expr<1.2,>=1.1 (from dask[dataframe])
  Downloading dask_expr-1.1.19-py3-none-any.whl.metadata (2.6 kB)
INFO: pip is looking at multiple versions of dask-expr to determine which version is compatible with other requirements. This

# Modelling original (20 years total, 14 train, 2 val, 4 test)

In [None]:
from neuralforecast.core import NeuralForecast
from ray import tune
from ray.tune.search.hyperopt import HyperOptSearch
from neuralforecast.losses.pytorch import DistributionLoss
from neuralforecast.auto import  AutoNHITS

In [None]:
def _to_32bit(dtype):
    """Return the 32-bit counterpart of a 64-bit numeric dtype; pass anything else through."""
    if dtype == 'int64':
        return 'int32'
    if dtype == 'float64':
        return 'float32'
    return dtype


# Read the panel, parse the timestamp column, halve the width of 64-bit numeric
# columns to reduce memory, and expose column '840E' under the name 'y'.
df = (
    pd.read_csv('Data/S&P500/3ProSP500.csv')
    .assign(ds=lambda frame: pd.to_datetime(frame['ds']))
    .pipe(lambda frame: frame.astype(
        {col: _to_32bit(dtype) for col, dtype in frame.dtypes.items()}))
    .rename(columns={'840E': 'y'})
)
df.info()

<class 'pandas.core.frame.DataFrame'>
RangeIndex: 2008545 entries, 0 to 2008544
Data columns (total 21 columns):
 #   Column     Dtype         
---  ------     -----         
 0   unique_id  object        
 1   ds         datetime64[ns]
 2   y          float32       
 3   MA(2,9)    int32         
 4   MA(3,9)    int32         
 5   MA(1,12)   int32         
 6   MA(2,12)   int32         
 7   MA(3,12)   int32         
 8   MOM(9)     int32         
 9   MOM(12)    int32         
 10  RSI(7)     int32         
 11  RSI(14)    int32         
 12  EMA(3,9)   int32         
 13  EMA(5,9)   int32         
 14  EMA(5,12)  int32         
 15  DY         float32       
 16  PTBV       float32       
 17  P          float32       
 18  PO         float32       
 19  VO         float32       
 20  PE         float32       
dtypes: datetime64[ns](1), float32(7), int32(12), object(1)
memory usage: 176.2+ MB


In [None]:
# Inclusive calendar bounds of the two periods whose lengths are counted below.
start_2020_2023, end_2020_2023 = '2020-01-01', '2023-12-31'
start_2018_2019, end_2018_2019 = '2018-01-01', '2019-12-31'

# Row masks selecting each period (both endpoints included).
in_2020_2023 = df['ds'].between(start_2020_2023, end_2020_2023)
in_2018_2019 = df['ds'].between(start_2018_2019, end_2018_2019)

# Distinct calendar dates observed inside each period.
unique_days_2020_2023 = df.loc[in_2020_2023, 'ds'].dt.date.unique()
unique_days_2018_2019 = df.loc[in_2018_2019, 'ds'].dt.date.unique()

# Number of distinct dates per period.
count_unique_days_2020_2023 = len(unique_days_2020_2023)
count_unique_days_2018_2019 = len(unique_days_2018_2019)

# Small table for display: one row per period.
summary_counts = pd.DataFrame(
    [
        ('2020-2023', count_unique_days_2020_2023),
        ('2018-2019', count_unique_days_2018_2019),
    ],
    columns=['Period', 'Unique Days Covered'],
)
summary_counts

Unnamed: 0,Period,Unique Days Covered
0,2020-2023,1043
1,2018-2019,522


In [None]:
import os
from time import time

class AutoNHITSTrainer:
    """Tune, cross-validate and persist two AutoNHITS models per forecast horizon.

    For each horizon the trainer builds two AutoNHITS searches (Ray backend,
    HyperOpt search algorithm, Student-t distribution loss):

    * model 0 - default AutoNHITS search space with a fixed seed and a custom
      learning-rate grid;
    * model 1 - the same, plus ``exog_list`` as ``hist_exog_list``.

    Both are evaluated with ``NeuralForecast.cross_validation`` and the
    resulting artifacts are written to paths relative to the current working
    directory (see the ``*_TEMPLATE`` attributes).

    Args:
        horizons: Iterable of forecast horizons (``h``) to train, one run each.
        levels: Value passed as ``level=`` to ``DistributionLoss``.
        exog_list: Column names used as ``hist_exog_list`` for model 1.
        df: Data frame handed unchanged to ``NeuralForecast.cross_validation``.
        val_size: ``val_size`` argument for cross-validation.
        test_size: ``test_size`` argument for cross-validation.
        num_samples: Number of hyperparameter trials per model (default 30).
        cpus: CPUs requested per AutoNHITS search (default 12).
        gpus: GPUs requested per AutoNHITS search (default 1).
    """

    # Single source of truth for artifact locations, shared by the "already
    # done?" check and by the save step so the two can never disagree.
    MODEL_DIR_TEMPLATE = 'Trained Models/AutoNHITS/horizon_{horizon}/'
    FORECAST_CSV_TEMPLATE = 'Data/Test/horizon_{horizon}/nhits_model0_1_horizon_{horizon}.csv'
    HPO_CSV_TEMPLATE = 'HPO/horizon_{horizon}/nhits_model{idx}_horizon_{horizon}_hpo.csv'

    # Candidate learning rates. Each value appears exactly once: the previous
    # list repeated 0.0005 and 0.0001, which made the search sample those two
    # values twice as often as the others.
    LEARNING_RATES = (0.01, 0.005, 0.001, 0.0005, 0.0001, 0.00005, 0.00001)

    RANDOM_SEED = 42

    def __init__(self, horizons, levels, exog_list, df, val_size, test_size,
                 num_samples=30, cpus=12, gpus=1):
        self.horizons = horizons
        self.levels = levels
        self.exog_list = exog_list
        self.df = df
        self.val_size = val_size
        self.test_size = test_size
        self.num_samples = num_samples
        self.cpus = cpus
        self.gpus = gpus

    # ------------------------------------------------------------------ paths
    def _model_path(self, horizon):
        """Directory in which the fitted models for ``horizon`` are stored."""
        return self.MODEL_DIR_TEMPLATE.format(horizon=horizon)

    def _output_csv(self, horizon):
        """CSV file holding the cross-validation forecasts for ``horizon``."""
        return self.FORECAST_CSV_TEMPLATE.format(horizon=horizon)

    def _hpo_csv(self, horizon, idx):
        """CSV file holding the hyperparameter-search log of model ``idx``."""
        return self.HPO_CSV_TEMPLATE.format(horizon=horizon, idx=idx)

    # ------------------------------------------------------------ persistence
    def check_existing_files(self, horizon):
        """Return True when both the model directory and the forecast CSV exist.

        The forecast CSV is looked up at the exact path ``save_results`` writes
        to, so a completed horizon is recognised and skipped on re-runs.
        """
        return (os.path.exists(self._model_path(horizon))
                and os.path.exists(self._output_csv(horizon)))

    def save_results(self, nf, horizon, Y_hat_df):
        """Persist the HPO logs, the fitted models and the forecasts.

        Args:
            nf: Fitted ``NeuralForecast`` object; ``nf.models`` is iterated and
                ``nf.save`` is called.
            horizon: Forecast horizon the artifacts belong to.
            Y_hat_df: Cross-validation output. NOTE: its float32 columns are
                converted to float16 *in place* before writing.
        """
        model_path = self._model_path(horizon)
        output_csv = self._output_csv(horizon)

        # Create every target directory before writing anything, so that a
        # missing folder cannot abort the save after a long training run.
        os.makedirs(model_path, exist_ok=True)
        os.makedirs(os.path.dirname(output_csv), exist_ok=True)

        # One hyperparameter-search log per model.
        for idx, model in enumerate(nf.models):
            hpo_csv = self._hpo_csv(horizon, idx)
            os.makedirs(os.path.dirname(hpo_csv), exist_ok=True)
            model.results.get_dataframe().to_csv(hpo_csv, index=False)

        nf.save(path=model_path, model_index=None, overwrite=True, save_dataset=False)

        # Shrink the forecast file by storing float32 columns as float16.
        # NOTE(review): float16 keeps only about 3 significant digits; confirm
        # this precision is sufficient for the downstream evaluation.
        for col in Y_hat_df.select_dtypes(include='float32').columns:
            Y_hat_df[col] = Y_hat_df[col].astype('float16')

        # Written last on purpose: check_existing_files treats the presence of
        # this file (plus the model directory) as "horizon completed".
        Y_hat_df.to_csv(output_csv, index=False)

    # ---------------------------------------------------------- configuration
    def _build_config(self, horizon, hist_exog_list=None):
        """Default AutoNHITS search space with fixed seed and custom learning rates."""
        config = AutoNHITS.get_default_config(h=horizon, backend="ray")
        if hist_exog_list is not None:
            config['hist_exog_list'] = hist_exog_list
        config['random_seed'] = self.RANDOM_SEED
        config['learning_rate'] = tune.choice(list(self.LEARNING_RATES))
        return config

    def _build_model(self, horizon, config):
        """Instantiate one AutoNHITS search with its own search algorithm and loss."""
        return AutoNHITS(h=horizon,
                         config=config,
                         search_alg=HyperOptSearch(),
                         num_samples=self.num_samples,
                         backend='ray',
                         loss=DistributionLoss(distribution='StudentT', level=self.levels),
                         cpus=self.cpus,
                         gpus=self.gpus)

    def configure_models(self, horizon):
        """Configures two AutoNHITS models for the given horizon.

        Returns:
            Tuple ``(nhits_model0, nhits_model1)``: model 0 without exogenous
            inputs, model 1 with ``self.exog_list`` as historical exogenous
            inputs.
        """
        nhits_model0 = self._build_model(horizon, self._build_config(horizon))
        nhits_model1 = self._build_model(
            horizon, self._build_config(horizon, hist_exog_list=self.exog_list))
        return nhits_model0, nhits_model1

    # --------------------------------------------------------------- training
    def run_training(self):
        """Runs the training loop over all horizons.

        Horizons whose artifacts already exist are skipped; for the others both
        models are tuned and cross-validated, the results are saved, and the
        elapsed wall-clock time (including saving) is printed in minutes.
        """
        for horizon in self.horizons:
            if self.check_existing_files(horizon):
                print(f"Horizon {horizon}: Model and CSV already exist. Skipping this run.")
                continue

            nhits_model0, nhits_model1 = self.configure_models(horizon)

            init = time()
            nf = NeuralForecast(models=[nhits_model0, nhits_model1], freq='B')
            Y_hat_df = nf.cross_validation(df=self.df,
                                           val_size=self.val_size,
                                           test_size=self.test_size,
                                           n_windows=None)

            self.save_results(nf, horizon, Y_hat_df)

            end = time()
            print(f'Horizon {horizon} CV Minutes: {(end - init) / 60}')

In [None]:
# Every column except the timestamp, the target and the series identifier
# is used as an exogenous feature.
non_feature_cols = {'ds', 'y', 'unique_id'}
exog_list = [col for col in df.columns if col not in non_feature_cols]

# Settings for the first training run.
horizons = [1, 5, 10]
levels = [90]
val_size = count_unique_days_2018_2019    # distinct days in 2018-2019
test_size = count_unique_days_2020_2023   # distinct days in 2020-2023

In [None]:
# Tune, cross-validate and save the models for the horizons configured above.
trainer = AutoNHITSTrainer(
    horizons=horizons,
    levels=levels,
    exog_list=exog_list,
    df=df,
    val_size=val_size,
    test_size=test_size,
)
trainer.run_training()

Output hidden; open in https://colab.research.google.com to view.

In [None]:
# Every column except the timestamp, the target and the series identifier
# is used as an exogenous feature.
non_feature_cols = {'ds', 'y', 'unique_id'}
exog_list = [col for col in df.columns if col not in non_feature_cols]

# Settings for the second training run (horizon 20 only).
horizons = [20]
levels = [90]
val_size = count_unique_days_2018_2019    # distinct days in 2018-2019
test_size = count_unique_days_2020_2023   # distinct days in 2020-2023

In [None]:
# Tune, cross-validate and save the models for the horizon configured above.
trainer = AutoNHITSTrainer(
    horizons=horizons,
    levels=levels,
    exog_list=exog_list,
    df=df,
    val_size=val_size,
    test_size=test_size,
)
trainer.run_training()

2024-11-12 18:17:40,208	INFO worker.py:1816 -- Started a local Ray instance.
2024-11-12 18:17:41,607	INFO tune.py:253 -- Initializing Ray automatically. For cluster usage or custom Ray initialization, call `ray.init(...)` before `Tuner(...)`.


+--------------------------------------------------------------------+
| Configuration for experiment     _train_tune_2024-11-12_18-17-38   |
+--------------------------------------------------------------------+
| Search algorithm                 SearchGenerator                   |
| Scheduler                        FIFOScheduler                     |
| Number of trials                 30                                |
+--------------------------------------------------------------------+

View detailed results here: /root/ray_results/_train_tune_2024-11-12_18-17-38
To visualize your results with TensorBoard, run: `tensorboard --logdir /tmp/ray/session_2024-11-12_18-17-38_352630_2326/artifacts/2024-11-12_18-17-41/_train_tune_2024-11-12_18-17-38/driver_artifacts`


[36m(_train_tune pid=3770)[0m /usr/local/lib/python3.10/dist-packages/ray/tune/integration/pytorch_lightning.py:198: `ray.tune.integration.pytorch_lightning.TuneReportCallback` is deprecated. Use `ray.tune.integration.pytorch_lightning.TuneReportCheckpointCallback` instead.
[36m(_train_tune pid=3770)[0m Seed set to 42
[36m(_train_tune pid=3770)[0m GPU available: True (cuda), used: True
[36m(_train_tune pid=3770)[0m TPU available: False, using: 0 TPU cores
[36m(_train_tune pid=3770)[0m HPU available: False, using: 0 HPUs
[36m(_train_tune pid=3770)[0m You are using a CUDA device ('NVIDIA A100-SXM4-40GB') that has Tensor Cores. To properly utilize them, you should set `torch.set_float32_matmul_precision('medium' | 'high')` which will trade-off precision for performance. For more details, read https://pytorch.org/docs/stable/generated/torch.set_float32_matmul_precision.html#torch.set_float32_matmul_precision
[36m(_train_tune pid=3770)[0m 2024-11-12 18:17:49.815176: I tensorfl

Sanity Checking: |          | 0/? [00:00<?, ?it/s]
Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Epoch 0:   0%|          | 0/13 [00:00<?, ?it/s] 
Epoch 1:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-0.716, train_loss_epoch=-0.0958]
Epoch 2:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.08, train_loss_epoch=-0.946]
Epoch 3:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.21, train_loss_epoch=-1.08]
Epoch 4:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.18, train_loss_epoch=-1.09]
Epoch 5:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.22, train_loss_epoch=-1.13]
Epoch 6:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.14, train_loss_epoch=-1.10]
Epoch 7:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.12, train_loss_epoch=-1.11]
[36m(_train_tune pid=3770)[0m 
Validation: |          | 0/? [00:00<?, ?it/s][A
Validation:   0%| 

[36m(_train_tune pid=3770)[0m `Trainer.fit` stopped: `max_steps=1100.0` reached.
2024-11-12 18:18:42,416	INFO tensorboardx.py:308 -- Removed the following hyperparameter values when logging to tensorboard: {'loss': ('__ref_ph', 'de895953'), 'n_freq_downsample': (180, 60, 1), 'n_pool_kernel_size': (16, 8, 1), 'valid_loss': ('__ref_ph', '004b9a7a')}


[36m(_train_tune pid=3770)[0m 
[36m(_train_tune pid=3770)[0m Validation DataLoader 0: 100%|██████████| 13/13 [00:01<00:00,  7.38it/s][A
[36m(_train_tune pid=3770)[0m                                                                         [AEpoch 84:   0%|          | 0/13 [00:01<?, ?it/s, v_num=0, train_loss_step=-1.19, train_loss_epoch=-1.19, valid_loss=-1.23]Epoch 84:   0%|          | 0/13 [00:01<?, ?it/s, v_num=0, train_loss_step=-1.19, train_loss_epoch=-1.19, valid_loss=-1.23]Epoch 84:   0%|          | 0/13 [00:01<?, ?it/s, v_num=0, train_loss_step=-1.19, train_loss_epoch=-1.19, valid_loss=-1.23]


[36m(_train_tune pid=4118)[0m /usr/local/lib/python3.10/dist-packages/ray/tune/integration/pytorch_lightning.py:198: `ray.tune.integration.pytorch_lightning.TuneReportCallback` is deprecated. Use `ray.tune.integration.pytorch_lightning.TuneReportCheckpointCallback` instead.
[36m(_train_tune pid=4118)[0m Seed set to 42
[36m(_train_tune pid=4118)[0m GPU available: True (cuda), used: True
[36m(_train_tune pid=4118)[0m TPU available: False, using: 0 TPU cores
[36m(_train_tune pid=4118)[0m HPU available: False, using: 0 HPUs
[36m(_train_tune pid=4118)[0m You are using a CUDA device ('NVIDIA A100-SXM4-40GB') that has Tensor Cores. To properly utilize them, you should set `torch.set_float32_matmul_precision('medium' | 'high')` which will trade-off precision for performance. For more details, read https://pytorch.org/docs/stable/generated/torch.set_float32_matmul_precision.html#torch.set_float32_matmul_precision
[36m(_train_tune pid=4118)[0m 2024-11-12 18:18:51.009411: I tensorfl

Sanity Checking: |          | 0/? [00:00<?, ?it/s]
Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]


2024-11-12 18:18:55,261	ERROR tune_controller.py:1331 -- Trial task failed for trial _train_tune_5c12a5b4
Traceback (most recent call last):
  File "/usr/local/lib/python3.10/dist-packages/ray/air/execution/_internal/event_manager.py", line 110, in resolve_future
    result = ray.get(future)
  File "/usr/local/lib/python3.10/dist-packages/ray/_private/auto_init_hook.py", line 21, in auto_init_wrapper
    return fn(*args, **kwargs)
  File "/usr/local/lib/python3.10/dist-packages/ray/_private/client_mode_hook.py", line 103, in wrapper
    return func(*args, **kwargs)
  File "/usr/local/lib/python3.10/dist-packages/ray/_private/worker.py", line 2745, in get
    values, debugger_breakpoint = worker.get_objects(object_refs, timeout=timeout)
  File "/usr/local/lib/python3.10/dist-packages/ray/_private/worker.py", line 901, in get_objects
    raise value.as_instanceof_cause()
ray.exceptions.RayTaskError(OutOfMemoryError): [36mray::ImplicitFunc.train()[39m (pid=4118, ip=172.28.0.12, actor_id


Trial _train_tune_5c12a5b4 errored after 0 iterations at 2024-11-12 18:18:55. Total running time: 1min 13s
Error file: /tmp/ray/session_2024-11-12_18-17-38_352630_2326/artifacts/2024-11-12_18-17-41/_train_tune_2024-11-12_18-17-38/driver_artifacts/_train_tune_5c12a5b4_2_batch_size=256,h=20,input_size=80,learning_rate=0.0005,loss=ref_ph_de895953,max_steps=1500.0000,n_freq_down_2024-11-12_18-17-49/error.txt


[36m(_train_tune pid=4227)[0m /usr/local/lib/python3.10/dist-packages/ray/tune/integration/pytorch_lightning.py:198: `ray.tune.integration.pytorch_lightning.TuneReportCallback` is deprecated. Use `ray.tune.integration.pytorch_lightning.TuneReportCheckpointCallback` instead.
[36m(_train_tune pid=4227)[0m Seed set to 42
[36m(_train_tune pid=4227)[0m GPU available: True (cuda), used: True
[36m(_train_tune pid=4227)[0m TPU available: False, using: 0 TPU cores
[36m(_train_tune pid=4227)[0m HPU available: False, using: 0 HPUs
[36m(_train_tune pid=4227)[0m You are using a CUDA device ('NVIDIA A100-SXM4-40GB') that has Tensor Cores. To properly utilize them, you should set `torch.set_float32_matmul_precision('medium' | 'high')` which will trade-off precision for performance. For more details, read https://pytorch.org/docs/stable/generated/torch.set_float32_matmul_precision.html#torch.set_float32_matmul_precision
[36m(_train_tune pid=4227)[0m 2024-11-12 18:19:02.962189: I tensorfl

Sanity Checking: |          | 0/? [00:00<?, ?it/s]
Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
                                                                           
Epoch 0:   0%|          | 0/4 [00:00<?, ?it/s] 
Epoch 1:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.33, train_loss_epoch=-1.46]
Epoch 2:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.08, train_loss_epoch=-1.62]
Epoch 3:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.76, train_loss_epoch=-1.60]
Epoch 4:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.48, train_loss_epoch=-1.58]
Epoch 5:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.00, train_loss_epoch=-1.69]
Epoch 6:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.46, train_loss_epoch=-1.59]
Epoch 7:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.80, train_loss_epoch=-1.71]
Epoch 8:   0%|          | 0/4 [00:00

[36m(_train_tune pid=4227)[0m `Trainer.fit` stopped: `max_steps=500.0` reached.
2024-11-12 18:20:06,117	INFO tensorboardx.py:308 -- Removed the following hyperparameter values when logging to tensorboard: {'loss': ('__ref_ph', 'de895953'), 'n_freq_downsample': (1, 1, 1), 'n_pool_kernel_size': (16, 8, 1), 'valid_loss': ('__ref_ph', '004b9a7a')}
[36m(_train_tune pid=4585)[0m /usr/local/lib/python3.10/dist-packages/ray/tune/integration/pytorch_lightning.py:198: `ray.tune.integration.pytorch_lightning.TuneReportCallback` is deprecated. Use `ray.tune.integration.pytorch_lightning.TuneReportCheckpointCallback` instead.
[36m(_train_tune pid=4585)[0m Seed set to 42
[36m(_train_tune pid=4585)[0m GPU available: True (cuda), used: True
[36m(_train_tune pid=4585)[0m TPU available: False, using: 0 TPU cores
[36m(_train_tune pid=4585)[0m HPU available: False, using: 0 HPUs
[36m(_train_tune pid=4585)[0m You are using a CUDA device ('NVIDIA A100-SXM4-40GB') that has Tensor Cores. To prop

Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Epoch 0:   0%|          | 0/13 [00:00<?, ?it/s] 
Epoch 1:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=0.876, train_loss_epoch=2.200]
Epoch 2:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-0.453, train_loss_epoch=0.238]
Epoch 3:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-0.932, train_loss_epoch=-0.573]
Epoch 4:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.04, train_loss_epoch=-1.02]
Epoch 5:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.19, train_loss_epoch=-1.10]
Epoch 6:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.13, train_loss_epoch=-1.10]
Epoch 7:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.17, train_loss_epoch=-1.13]
[36m(_train_tune pid=4585)[0m 
Validation: |          | 0/? [00:00<?, ?it/s][A
Validation:   0%|          | 0/13 [00:00<?, ?it/s][A
Validation DataL

[36m(_train_tune pid=4585)[0m `Trainer.fit` stopped: `max_steps=1000.0` reached.
2024-11-12 18:21:00,083	INFO tensorboardx.py:308 -- Removed the following hyperparameter values when logging to tensorboard: {'loss': ('__ref_ph', 'de895953'), 'n_freq_downsample': (60, 8, 1), 'n_pool_kernel_size': (4, 4, 4), 'valid_loss': ('__ref_ph', '004b9a7a')}


[36m(_train_tune pid=4585)[0m 
[36m(_train_tune pid=4585)[0m Validation DataLoader 0: 100%|██████████| 13/13 [00:01<00:00,  7.40it/s][A
[36m(_train_tune pid=4585)[0m                                                                         [AEpoch 76:   0%|          | 0/13 [00:02<?, ?it/s, v_num=0, train_loss_step=-1.24, train_loss_epoch=-1.20, valid_loss=-1.23]Epoch 76:   0%|          | 0/13 [00:02<?, ?it/s, v_num=0, train_loss_step=-1.24, train_loss_epoch=-1.20, valid_loss=-1.23]Epoch 76:   0%|          | 0/13 [00:02<?, ?it/s, v_num=0, train_loss_step=-1.24, train_loss_epoch=-1.20, valid_loss=-1.23]


[36m(_train_tune pid=4868)[0m /usr/local/lib/python3.10/dist-packages/ray/tune/integration/pytorch_lightning.py:198: `ray.tune.integration.pytorch_lightning.TuneReportCallback` is deprecated. Use `ray.tune.integration.pytorch_lightning.TuneReportCheckpointCallback` instead.
[36m(_train_tune pid=4868)[0m Seed set to 42
[36m(_train_tune pid=4868)[0m GPU available: True (cuda), used: True
[36m(_train_tune pid=4868)[0m TPU available: False, using: 0 TPU cores
[36m(_train_tune pid=4868)[0m HPU available: False, using: 0 HPUs
[36m(_train_tune pid=4868)[0m You are using a CUDA device ('NVIDIA A100-SXM4-40GB') that has Tensor Cores. To properly utilize them, you should set `torch.set_float32_matmul_precision('medium' | 'high')` which will trade-off precision for performance. For more details, read https://pytorch.org/docs/stable/generated/torch.set_float32_matmul_precision.html#torch.set_float32_matmul_precision
[36m(_train_tune pid=4868)[0m 2024-11-12 18:21:07.990954: I tensorfl

Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Epoch 0:   0%|          | 0/13 [00:00<?, ?it/s] 
Epoch 1:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.45, train_loss_epoch=-1.14]
Epoch 2:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.27, train_loss_epoch=-1.65]
Epoch 3:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.07, train_loss_epoch=-1.79]
Epoch 4:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.72, train_loss_epoch=-1.84]
Epoch 5:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.22, train_loss_epoch=-1.93]
Epoch 6:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.78, train_loss_epoch=-1.90]
Epoch 7:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.03, train_loss_epoch=-1.94]
[36m(_train_tune pid=4868)[0m 
Validation: |          | 0/? [00:00<?, ?it/s][A
Validation:   0%|          | 0/13 [00:00<?, ?it/s][A
Validation DataLoad

[36m(_train_tune pid=4868)[0m `Trainer.fit` stopped: `max_steps=1300.0` reached.
2024-11-12 18:22:12,932	INFO tensorboardx.py:308 -- Removed the following hyperparameter values when logging to tensorboard: {'loss': ('__ref_ph', 'de895953'), 'n_freq_downsample': (1, 1, 1), 'n_pool_kernel_size': (4, 4, 4), 'valid_loss': ('__ref_ph', '004b9a7a')}


[36m(_train_tune pid=4868)[0m 
[36m(_train_tune pid=4868)[0m Validation DataLoader 0: 100%|██████████| 13/13 [00:01<00:00,  6.84it/s][A
[36m(_train_tune pid=4868)[0m                                                                         [AEpoch 99: 100%|██████████| 13/13 [00:02<00:00,  5.76it/s, v_num=0, train_loss_step=-1.98, train_loss_epoch=-2.03, valid_loss=-2.03]Epoch 99: 100%|██████████| 13/13 [00:02<00:00,  5.76it/s, v_num=0, train_loss_step=-1.98, train_loss_epoch=-2.03, valid_loss=-2.03]Epoch 99: 100%|██████████| 13/13 [00:02<00:00,  5.75it/s, v_num=0, train_loss_step=-1.98, train_loss_epoch=-2.03, valid_loss=-2.03]


[36m(_train_tune pid=5230)[0m /usr/local/lib/python3.10/dist-packages/ray/tune/integration/pytorch_lightning.py:198: `ray.tune.integration.pytorch_lightning.TuneReportCallback` is deprecated. Use `ray.tune.integration.pytorch_lightning.TuneReportCheckpointCallback` instead.
[36m(_train_tune pid=5230)[0m Seed set to 42
[36m(_train_tune pid=5230)[0m GPU available: True (cuda), used: True
[36m(_train_tune pid=5230)[0m TPU available: False, using: 0 TPU cores
[36m(_train_tune pid=5230)[0m HPU available: False, using: 0 HPUs
[36m(_train_tune pid=5230)[0m You are using a CUDA device ('NVIDIA A100-SXM4-40GB') that has Tensor Cores. To properly utilize them, you should set `torch.set_float32_matmul_precision('medium' | 'high')` which will trade-off precision for performance. For more details, read https://pytorch.org/docs/stable/generated/torch.set_float32_matmul_precision.html#torch.set_float32_matmul_precision
[36m(_train_tune pid=5230)[0m 2024-11-12 18:22:21.066134: I tensorfl

Sanity Checking: |          | 0/? [00:00<?, ?it/s]
Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Epoch 0:   0%|          | 0/4 [00:00<?, ?it/s] 
Epoch 1:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.45, train_loss_epoch=-1.47]
Epoch 2:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.05, train_loss_epoch=-1.57]
Epoch 3:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.67, train_loss_epoch=-1.53]
Epoch 4:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.34, train_loss_epoch=-1.42]
Epoch 5:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.93, train_loss_epoch=-1.61]
Epoch 6:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.43, train_loss_epoch=-1.47]
Epoch 7:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.43, train_loss_epoch=-1.50]
Epoch 8:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.15, train_loss_epoch=-1.44]
Epoch 9: 

[36m(_train_tune pid=5230)[0m `Trainer.fit` stopped: `max_steps=1000.0` reached.
2024-11-12 18:23:40,773	INFO tensorboardx.py:308 -- Removed the following hyperparameter values when logging to tensorboard: {'loss': ('__ref_ph', 'de895953'), 'n_freq_downsample': (24, 12, 1), 'n_pool_kernel_size': (4, 4, 4), 'valid_loss': ('__ref_ph', '004b9a7a')}


[36m(_train_tune pid=5230)[0m 
[36m(_train_tune pid=5230)[0m Validation DataLoader 0: 100%|██████████| 4/4 [00:00<00:00, 15.61it/s][A
[36m(_train_tune pid=5230)[0m                                                                       [AEpoch 249: 100%|██████████| 4/4 [00:00<00:00,  6.16it/s, v_num=0, train_loss_step=-2.03, train_loss_epoch=-1.98, valid_loss=-1.92]Epoch 249: 100%|██████████| 4/4 [00:00<00:00,  6.15it/s, v_num=0, train_loss_step=-2.03, train_loss_epoch=-1.92, valid_loss=-1.92]Epoch 249: 100%|██████████| 4/4 [00:00<00:00,  6.14it/s, v_num=0, train_loss_step=-2.03, train_loss_epoch=-1.92, valid_loss=-1.92]


[36m(_train_tune pid=5658)[0m /usr/local/lib/python3.10/dist-packages/ray/tune/integration/pytorch_lightning.py:198: `ray.tune.integration.pytorch_lightning.TuneReportCallback` is deprecated. Use `ray.tune.integration.pytorch_lightning.TuneReportCheckpointCallback` instead.
[36m(_train_tune pid=5658)[0m Seed set to 42
[36m(_train_tune pid=5658)[0m GPU available: True (cuda), used: True
[36m(_train_tune pid=5658)[0m TPU available: False, using: 0 TPU cores
[36m(_train_tune pid=5658)[0m HPU available: False, using: 0 HPUs
[36m(_train_tune pid=5658)[0m You are using a CUDA device ('NVIDIA A100-SXM4-40GB') that has Tensor Cores. To properly utilize them, you should set `torch.set_float32_matmul_precision('medium' | 'high')` which will trade-off precision for performance. For more details, read https://pytorch.org/docs/stable/generated/torch.set_float32_matmul_precision.html#torch.set_float32_matmul_precision
[36m(_train_tune pid=5658)[0m 2024-11-12 18:23:48.965681: I tensorfl

Sanity Checking: |          | 0/? [00:00<?, ?it/s]
Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]


2024-11-12 18:23:53,299	ERROR tune_controller.py:1331 -- Trial task failed for trial _train_tune_8be5387b
Traceback (most recent call last):
  File "/usr/local/lib/python3.10/dist-packages/ray/air/execution/_internal/event_manager.py", line 110, in resolve_future
    result = ray.get(future)
  File "/usr/local/lib/python3.10/dist-packages/ray/_private/auto_init_hook.py", line 21, in auto_init_wrapper
    return fn(*args, **kwargs)
  File "/usr/local/lib/python3.10/dist-packages/ray/_private/client_mode_hook.py", line 103, in wrapper
    return func(*args, **kwargs)
  File "/usr/local/lib/python3.10/dist-packages/ray/_private/worker.py", line 2745, in get
    values, debugger_breakpoint = worker.get_objects(object_refs, timeout=timeout)
  File "/usr/local/lib/python3.10/dist-packages/ray/_private/worker.py", line 901, in get_objects
    raise value.as_instanceof_cause()
ray.exceptions.RayTaskError(OutOfMemoryError): [36mray::ImplicitFunc.train()[39m (pid=5658, ip=172.28.0.12, actor_id


Trial _train_tune_8be5387b errored after 0 iterations at 2024-11-12 18:23:53. Total running time: 6min 11s
Error file: /tmp/ray/session_2024-11-12_18-17-38_352630_2326/artifacts/2024-11-12_18-17-41/_train_tune_2024-11-12_18-17-38/driver_artifacts/_train_tune_8be5387b_7_batch_size=256,h=20,input_size=100,learning_rate=0.0010,loss=ref_ph_de895953,max_steps=600.0000,n_freq_down_2024-11-12_18-22-20/error.txt


[36m(_train_tune pid=5766)[0m /usr/local/lib/python3.10/dist-packages/ray/tune/integration/pytorch_lightning.py:198: `ray.tune.integration.pytorch_lightning.TuneReportCallback` is deprecated. Use `ray.tune.integration.pytorch_lightning.TuneReportCheckpointCallback` instead.
[36m(_train_tune pid=5766)[0m Seed set to 42
[36m(_train_tune pid=5766)[0m GPU available: True (cuda), used: True
[36m(_train_tune pid=5766)[0m TPU available: False, using: 0 TPU cores
[36m(_train_tune pid=5766)[0m HPU available: False, using: 0 HPUs
[36m(_train_tune pid=5766)[0m You are using a CUDA device ('NVIDIA A100-SXM4-40GB') that has Tensor Cores. To properly utilize them, you should set `torch.set_float32_matmul_precision('medium' | 'high')` which will trade-off precision for performance. For more details, read https://pytorch.org/docs/stable/generated/torch.set_float32_matmul_precision.html#torch.set_float32_matmul_precision
[36m(_train_tune pid=5766)[0m 2024-11-12 18:24:01.068718: I tensorfl

Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Epoch 0:   0%|          | 0/13 [00:00<?, ?it/s] 
Epoch 1:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.50, train_loss_epoch=-0.98]
Epoch 2:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.16, train_loss_epoch=-1.59]
Epoch 3:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.94, train_loss_epoch=-1.64]
Epoch 4:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.39, train_loss_epoch=-1.62]
Epoch 5:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.04, train_loss_epoch=-1.65]
Epoch 6:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.40, train_loss_epoch=-1.64]
Epoch 7:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.68, train_loss_epoch=-1.66]
[36m(_train_tune pid=5766)[0m 
Validation: |          | 0/? [00:00<?, ?it/s][A
Validation:   0%|          | 0/13 [00:00<?, ?it/s][A
Validation DataLoad

[36m(_train_tune pid=5766)[0m `Trainer.fit` stopped: `max_steps=900.0` reached.
2024-11-12 18:24:45,347	INFO tensorboardx.py:308 -- Removed the following hyperparameter values when logging to tensorboard: {'loss': ('__ref_ph', 'de895953'), 'n_freq_downsample': (1, 1, 1), 'n_pool_kernel_size': (1, 1, 1), 'valid_loss': ('__ref_ph', '004b9a7a')}


[36m(_train_tune pid=5766)[0m 
[36m(_train_tune pid=5766)[0m Validation DataLoader 0: 100%|██████████| 13/13 [00:01<00:00,  6.83it/s][A
[36m(_train_tune pid=5766)[0m                                                                         [AEpoch 69:   0%|          | 0/13 [00:01<?, ?it/s, v_num=0, train_loss_step=-1.82, train_loss_epoch=-1.66, valid_loss=-1.71] Epoch 69:   0%|          | 0/13 [00:01<?, ?it/s, v_num=0, train_loss_step=-1.82, train_loss_epoch=-1.73, valid_loss=-1.71]Epoch 69:   0%|          | 0/13 [00:02<?, ?it/s, v_num=0, train_loss_step=-1.82, train_loss_epoch=-1.73, valid_loss=-1.71]


[36m(_train_tune pid=6044)[0m /usr/local/lib/python3.10/dist-packages/ray/tune/integration/pytorch_lightning.py:198: `ray.tune.integration.pytorch_lightning.TuneReportCallback` is deprecated. Use `ray.tune.integration.pytorch_lightning.TuneReportCheckpointCallback` instead.
[36m(_train_tune pid=6044)[0m Seed set to 42
[36m(_train_tune pid=6044)[0m GPU available: True (cuda), used: True
[36m(_train_tune pid=6044)[0m TPU available: False, using: 0 TPU cores
[36m(_train_tune pid=6044)[0m HPU available: False, using: 0 HPUs
[36m(_train_tune pid=6044)[0m You are using a CUDA device ('NVIDIA A100-SXM4-40GB') that has Tensor Cores. To properly utilize them, you should set `torch.set_float32_matmul_precision('medium' | 'high')` which will trade-off precision for performance. For more details, read https://pytorch.org/docs/stable/generated/torch.set_float32_matmul_precision.html#torch.set_float32_matmul_precision
[36m(_train_tune pid=6044)[0m 2024-11-12 18:24:52.922543: I tensorfl

Sanity Checking: |          | 0/? [00:00<?, ?it/s]
Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Epoch 0:   0%|          | 0/7 [00:00<?, ?it/s] 
Epoch 1:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.01, train_loss_epoch=0.568]
Epoch 2:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.04, train_loss_epoch=-1.38]
Epoch 3:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.81, train_loss_epoch=-1.56]
Epoch 4:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.54, train_loss_epoch=-1.63]
Epoch 5:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.99, train_loss_epoch=-1.69]
Epoch 6:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.55, train_loss_epoch=-1.71]
Epoch 7:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.87, train_loss_epoch=-1.80]
Epoch 8:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.56, train_loss_epoch=-1.79]
Epoch 9: 

[36m(_train_tune pid=6044)[0m `Trainer.fit` stopped: `max_steps=700.0` reached.
2024-11-12 18:25:39,867	INFO tensorboardx.py:308 -- Removed the following hyperparameter values when logging to tensorboard: {'loss': ('__ref_ph', 'de895953'), 'n_freq_downsample': (180, 60, 1), 'n_pool_kernel_size': (2, 2, 1), 'valid_loss': ('__ref_ph', '004b9a7a')}


[36m(_train_tune pid=6044)[0m 
[36m(_train_tune pid=6044)[0m Validation DataLoader 0: 100%|██████████| 7/7 [00:01<00:00,  3.67it/s][A
[36m(_train_tune pid=6044)[0m                                                                       [AEpoch 99: 100%|██████████| 7/7 [00:02<00:00,  3.14it/s, v_num=0, train_loss_step=-2.33, train_loss_epoch=-2.00, valid_loss=-1.98]Epoch 99: 100%|██████████| 7/7 [00:02<00:00,  3.14it/s, v_num=0, train_loss_step=-2.33, train_loss_epoch=-2.04, valid_loss=-1.98]Epoch 99: 100%|██████████| 7/7 [00:02<00:00,  3.14it/s, v_num=0, train_loss_step=-2.33, train_loss_epoch=-2.04, valid_loss=-1.98]


[36m(_train_tune pid=6333)[0m /usr/local/lib/python3.10/dist-packages/ray/tune/integration/pytorch_lightning.py:198: `ray.tune.integration.pytorch_lightning.TuneReportCallback` is deprecated. Use `ray.tune.integration.pytorch_lightning.TuneReportCheckpointCallback` instead.
[36m(_train_tune pid=6333)[0m Seed set to 42
[36m(_train_tune pid=6333)[0m GPU available: True (cuda), used: True
[36m(_train_tune pid=6333)[0m TPU available: False, using: 0 TPU cores
[36m(_train_tune pid=6333)[0m HPU available: False, using: 0 HPUs
[36m(_train_tune pid=6333)[0m You are using a CUDA device ('NVIDIA A100-SXM4-40GB') that has Tensor Cores. To properly utilize them, you should set `torch.set_float32_matmul_precision('medium' | 'high')` which will trade-off precision for performance. For more details, read https://pytorch.org/docs/stable/generated/torch.set_float32_matmul_precision.html#torch.set_float32_matmul_precision
[36m(_train_tune pid=6333)[0m 2024-11-12 18:25:48.030618: I tensorfl

Sanity Checking: |          | 0/? [00:00<?, ?it/s]
Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Epoch 0:   0%|          | 0/4 [00:00<?, ?it/s] 
Epoch 1:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=2.500, train_loss_epoch=4.240]
Epoch 2:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.48, train_loss_epoch=-0.207]
Epoch 3:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.42, train_loss_epoch=-1.16]
Epoch 4:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.31, train_loss_epoch=-1.29]
Epoch 5:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.70, train_loss_epoch=-1.41]
Epoch 6:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.38, train_loss_epoch=-1.41]
Epoch 7:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.56, train_loss_epoch=-1.50]
Epoch 8:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.02, train_loss_epoch=-1.46]
Epoch 9:

[36m(_train_tune pid=6333)[0m `Trainer.fit` stopped: `max_steps=600.0` reached.
2024-11-12 18:26:33,337	INFO tensorboardx.py:308 -- Removed the following hyperparameter values when logging to tensorboard: {'loss': ('__ref_ph', 'de895953'), 'n_freq_downsample': (60, 8, 1), 'n_pool_kernel_size': (8, 4, 1), 'valid_loss': ('__ref_ph', '004b9a7a')}


[36m(_train_tune pid=6333)[0m 
[36m(_train_tune pid=6333)[0m Validation DataLoader 0: 100%|██████████| 4/4 [00:00<00:00, 16.24it/s][A
[36m(_train_tune pid=6333)[0m                                                                       [AEpoch 149: 100%|██████████| 4/4 [00:00<00:00,  6.76it/s, v_num=0, train_loss_step=-1.47, train_loss_epoch=-1.51, valid_loss=-1.75]Epoch 149: 100%|██████████| 4/4 [00:00<00:00,  6.75it/s, v_num=0, train_loss_step=-1.47, train_loss_epoch=-1.62, valid_loss=-1.75]Epoch 149: 100%|██████████| 4/4 [00:00<00:00,  6.73it/s, v_num=0, train_loss_step=-1.47, train_loss_epoch=-1.62, valid_loss=-1.75]


[36m(_train_tune pid=6613)[0m /usr/local/lib/python3.10/dist-packages/ray/tune/integration/pytorch_lightning.py:198: `ray.tune.integration.pytorch_lightning.TuneReportCallback` is deprecated. Use `ray.tune.integration.pytorch_lightning.TuneReportCheckpointCallback` instead.
[36m(_train_tune pid=6613)[0m Seed set to 42
[36m(_train_tune pid=6613)[0m GPU available: True (cuda), used: True
[36m(_train_tune pid=6613)[0m TPU available: False, using: 0 TPU cores
[36m(_train_tune pid=6613)[0m HPU available: False, using: 0 HPUs
[36m(_train_tune pid=6613)[0m You are using a CUDA device ('NVIDIA A100-SXM4-40GB') that has Tensor Cores. To properly utilize them, you should set `torch.set_float32_matmul_precision('medium' | 'high')` which will trade-off precision for performance. For more details, read https://pytorch.org/docs/stable/generated/torch.set_float32_matmul_precision.html#torch.set_float32_matmul_precision
[36m(_train_tune pid=6613)[0m 2024-11-12 18:26:40.967833: I tensorfl

Sanity Checking: |          | 0/? [00:00<?, ?it/s]
Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Epoch 0:   0%|          | 0/13 [00:00<?, ?it/s] 
Epoch 1:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=0.917, train_loss_epoch=0.899]
Epoch 2:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=0.810, train_loss_epoch=0.862]
Epoch 3:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=0.783, train_loss_epoch=0.829]
Epoch 4:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=0.779, train_loss_epoch=0.790]
Epoch 5:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=0.704, train_loss_epoch=0.736]
Epoch 6:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=0.632, train_loss_epoch=0.667]
Epoch 7:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=0.546, train_loss_epoch=0.579]
[36m(_train_tune pid=6613)[0m 
Validation: |          | 0/? [00:00<?, ?it/s][A
Validation:   0%|     

[36m(_train_tune pid=6613)[0m `Trainer.fit` stopped: `max_steps=1300.0` reached.2024-11-12 18:27:16,800	INFO tensorboardx.py:308 -- Removed the following hyperparameter values when logging to tensorboard: {'loss': ('__ref_ph', 'de895953'), 'n_freq_downsample': (60, 8, 1), 'n_pool_kernel_size': (2, 2, 1), 'valid_loss': ('__ref_ph', '004b9a7a')}


[36m(_train_tune pid=6613)[0m 
[36m(_train_tune pid=6613)[0m Validation DataLoader 0: 100%|██████████| 13/13 [00:00<00:00, 49.79it/s][A
[36m(_train_tune pid=6613)[0m                                                                         [AEpoch 99: 100%|██████████| 13/13 [00:00<00:00, 23.65it/s, v_num=0, train_loss_step=-1.16, train_loss_epoch=-1.17, valid_loss=-1.21]Epoch 99: 100%|██████████| 13/13 [00:00<00:00, 23.48it/s, v_num=0, train_loss_step=-1.16, train_loss_epoch=-1.17, valid_loss=-1.21]Epoch 99: 100%|██████████| 13/13 [00:00<00:00, 23.43it/s, v_num=0, train_loss_step=-1.16, train_loss_epoch=-1.17, valid_loss=-1.21]



[36m(_train_tune pid=6856)[0m /usr/local/lib/python3.10/dist-packages/ray/tune/integration/pytorch_lightning.py:198: `ray.tune.integration.pytorch_lightning.TuneReportCallback` is deprecated. Use `ray.tune.integration.pytorch_lightning.TuneReportCheckpointCallback` instead.
[36m(_train_tune pid=6856)[0m Seed set to 42
[36m(_train_tune pid=6856)[0m GPU available: True (cuda), used: True
[36m(_train_tune pid=6856)[0m TPU available: False, using: 0 TPU cores
[36m(_train_tune pid=6856)[0m HPU available: False, using: 0 HPUs
[36m(_train_tune pid=6856)[0m You are using a CUDA device ('NVIDIA A100-SXM4-40GB') that has Tensor Cores. To properly utilize them, you should set `torch.set_float32_matmul_precision('medium' | 'high')` which will trade-off precision for performance. For more details, read https://pytorch.org/docs/stable/generated/torch.set_float32_matmul_precision.html#torch.set_float32_matmul_precision
[36m(_train_tune pid=6856)[0m 2024-11-12 18:27:25.058289: I tensorf

Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Epoch 0:   0%|          | 0/13 [00:00<?, ?it/s] 
Epoch 1:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-0.958, train_loss_epoch=-0.0748]
Epoch 2:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.18, train_loss_epoch=-0.931]
Epoch 3:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.23, train_loss_epoch=-1.11]
Epoch 4:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.17, train_loss_epoch=-1.11]
Epoch 5:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.21, train_loss_epoch=-1.15]
Epoch 6:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.14, train_loss_epoch=-1.14]
Epoch 7:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.21, train_loss_epoch=-1.17]
[36m(_train_tune pid=6856)[0m 
Validation: |          | 0/? [00:00<?, ?it/s][A
Validation:   0%|          | 0/13 [00:00<?, ?it/s][A
Validation Data

2024-11-12 18:28:00,497	INFO tensorboardx.py:308 -- Removed the following hyperparameter values when logging to tensorboard: {'loss': ('__ref_ph', 'de895953'), 'n_freq_downsample': (60, 8, 1), 'n_pool_kernel_size': (16, 8, 1), 'valid_loss': ('__ref_ph', '004b9a7a')}
[36m(_train_tune pid=6856)[0m `Trainer.fit` stopped: `max_steps=1300.0` reached.


[36m(_train_tune pid=6856)[0m 
[36m(_train_tune pid=6856)[0m Validation DataLoader 0: 100%|██████████| 13/13 [00:00<00:00, 50.49it/s][A
[36m(_train_tune pid=6856)[0m                                                                         [AEpoch 99: 100%|██████████| 13/13 [00:00<00:00, 23.85it/s, v_num=0, train_loss_step=-1.20, train_loss_epoch=-1.23, valid_loss=-1.25]Epoch 99: 100%|██████████| 13/13 [00:00<00:00, 23.80it/s, v_num=0, train_loss_step=-1.20, train_loss_epoch=-1.23, valid_loss=-1.25]Epoch 99: 100%|██████████| 13/13 [00:00<00:00, 23.75it/s, v_num=0, train_loss_step=-1.20, train_loss_epoch=-1.23, valid_loss=-1.25]


[36m(_train_tune pid=7100)[0m /usr/local/lib/python3.10/dist-packages/ray/tune/integration/pytorch_lightning.py:198: `ray.tune.integration.pytorch_lightning.TuneReportCallback` is deprecated. Use `ray.tune.integration.pytorch_lightning.TuneReportCheckpointCallback` instead.
[36m(_train_tune pid=7100)[0m Seed set to 42
[36m(_train_tune pid=7100)[0m GPU available: True (cuda), used: True
[36m(_train_tune pid=7100)[0m TPU available: False, using: 0 TPU cores
[36m(_train_tune pid=7100)[0m HPU available: False, using: 0 HPUs
[36m(_train_tune pid=7100)[0m You are using a CUDA device ('NVIDIA A100-SXM4-40GB') that has Tensor Cores. To properly utilize them, you should set `torch.set_float32_matmul_precision('medium' | 'high')` which will trade-off precision for performance. For more details, read https://pytorch.org/docs/stable/generated/torch.set_float32_matmul_precision.html#torch.set_float32_matmul_precision
[36m(_train_tune pid=7100)[0m 2024-11-12 18:28:09.096017: I tensorfl

Sanity Checking: |          | 0/? [00:00<?, ?it/s]
Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]


2024-11-12 18:28:13,152	ERROR tune_controller.py:1331 -- Trial task failed for trial _train_tune_a6b09eb8
Traceback (most recent call last):
  File "/usr/local/lib/python3.10/dist-packages/ray/air/execution/_internal/event_manager.py", line 110, in resolve_future
    result = ray.get(future)
  File "/usr/local/lib/python3.10/dist-packages/ray/_private/auto_init_hook.py", line 21, in auto_init_wrapper
    return fn(*args, **kwargs)
  File "/usr/local/lib/python3.10/dist-packages/ray/_private/client_mode_hook.py", line 103, in wrapper
    return func(*args, **kwargs)
  File "/usr/local/lib/python3.10/dist-packages/ray/_private/worker.py", line 2745, in get
    values, debugger_breakpoint = worker.get_objects(object_refs, timeout=timeout)
  File "/usr/local/lib/python3.10/dist-packages/ray/_private/worker.py", line 901, in get_objects
    raise value.as_instanceof_cause()
ray.exceptions.RayTaskError(OutOfMemoryError): [36mray::ImplicitFunc.train()[39m (pid=7100, ip=172.28.0.12, actor_id


Trial _train_tune_a6b09eb8 errored after 0 iterations at 2024-11-12 18:28:13. Total running time: 10min 31s
Error file: /tmp/ray/session_2024-11-12_18-17-38_352630_2326/artifacts/2024-11-12_18-17-41/_train_tune_2024-11-12_18-17-38/driver_artifacts/_train_tune_a6b09eb8_13_batch_size=256,h=20,input_size=40,learning_rate=0.0010,loss=ref_ph_de895953,max_steps=1200.0000,n_freq_dow_2024-11-12_18-27-24/error.txt


[36m(_train_tune pid=7210)[0m /usr/local/lib/python3.10/dist-packages/ray/tune/integration/pytorch_lightning.py:198: `ray.tune.integration.pytorch_lightning.TuneReportCallback` is deprecated. Use `ray.tune.integration.pytorch_lightning.TuneReportCheckpointCallback` instead.
[36m(_train_tune pid=7210)[0m Seed set to 42
[36m(_train_tune pid=7210)[0m GPU available: True (cuda), used: True
[36m(_train_tune pid=7210)[0m TPU available: False, using: 0 TPU cores
[36m(_train_tune pid=7210)[0m HPU available: False, using: 0 HPUs
[36m(_train_tune pid=7210)[0m You are using a CUDA device ('NVIDIA A100-SXM4-40GB') that has Tensor Cores. To properly utilize them, you should set `torch.set_float32_matmul_precision('medium' | 'high')` which will trade-off precision for performance. For more details, read https://pytorch.org/docs/stable/generated/torch.set_float32_matmul_precision.html#torch.set_float32_matmul_precision
[36m(_train_tune pid=7210)[0m 2024-11-12 18:28:21.060380: I tensorfl

Sanity Checking: |          | 0/? [00:00<?, ?it/s]
Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Epoch 0:   0%|          | 0/4 [00:00<?, ?it/s] 
Epoch 1:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.40, train_loss_epoch=-1.34]
Epoch 2:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.04, train_loss_epoch=-1.55]
Epoch 3:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.77, train_loss_epoch=-1.53]
Epoch 4:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.26, train_loss_epoch=-1.43]
Epoch 5:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.91, train_loss_epoch=-1.62]
Epoch 6:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.50, train_loss_epoch=-1.57]
Epoch 7:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.70, train_loss_epoch=-1.60]
Epoch 8:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.37, train_loss_epoch=-1.57]
Epoch 8: 

2024-11-12 18:29:50,034	INFO tensorboardx.py:308 -- Removed the following hyperparameter values when logging to tensorboard: {'loss': ('__ref_ph', 'de895953'), 'n_freq_downsample': (60, 8, 1), 'n_pool_kernel_size': (2, 2, 1), 'valid_loss': ('__ref_ph', '004b9a7a')}
[36m(_train_tune pid=7210)[0m `Trainer.fit` stopped: `max_steps=1200.0` reached.


[36m(_train_tune pid=7210)[0m 
[36m(_train_tune pid=7210)[0m Validation DataLoader 0: 100%|██████████| 4/4 [00:00<00:00, 15.93it/s][A
[36m(_train_tune pid=7210)[0m                                                                       [AEpoch 299: 100%|██████████| 4/4 [00:00<00:00,  6.77it/s, v_num=0, train_loss_step=-2.09, train_loss_epoch=-2.01, valid_loss=-2.03]Epoch 299: 100%|██████████| 4/4 [00:00<00:00,  6.76it/s, v_num=0, train_loss_step=-2.09, train_loss_epoch=-2.05, valid_loss=-2.03]Epoch 299: 100%|██████████| 4/4 [00:00<00:00,  6.74it/s, v_num=0, train_loss_step=-2.09, train_loss_epoch=-2.05, valid_loss=-2.03]


[36m(_train_tune pid=7674)[0m /usr/local/lib/python3.10/dist-packages/ray/tune/integration/pytorch_lightning.py:198: `ray.tune.integration.pytorch_lightning.TuneReportCallback` is deprecated. Use `ray.tune.integration.pytorch_lightning.TuneReportCheckpointCallback` instead.
[36m(_train_tune pid=7674)[0m Seed set to 42
[36m(_train_tune pid=7674)[0m GPU available: True (cuda), used: True
[36m(_train_tune pid=7674)[0m TPU available: False, using: 0 TPU cores
[36m(_train_tune pid=7674)[0m HPU available: False, using: 0 HPUs
[36m(_train_tune pid=7674)[0m You are using a CUDA device ('NVIDIA A100-SXM4-40GB') that has Tensor Cores. To properly utilize them, you should set `torch.set_float32_matmul_precision('medium' | 'high')` which will trade-off precision for performance. For more details, read https://pytorch.org/docs/stable/generated/torch.set_float32_matmul_precision.html#torch.set_float32_matmul_precision
[36m(_train_tune pid=7674)[0m 2024-11-12 18:29:57.928144: I tensorfl

Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Epoch 0:   0%|          | 0/7 [00:00<?, ?it/s] 
Epoch 1:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.38, train_loss_epoch=0.340]
Epoch 2:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.30, train_loss_epoch=-1.63]
Epoch 3:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.90, train_loss_epoch=-1.70]
Epoch 4:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.57, train_loss_epoch=-1.67]
Epoch 5:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.15, train_loss_epoch=-1.81]
Epoch 6:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.57, train_loss_epoch=-1.76]
Epoch 7:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.86, train_loss_epoch=-1.83]
Epoch 8:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.48, train_loss_epoch=-1.75]
Epoch 9:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, trai

2024-11-12 18:31:29,607	INFO tensorboardx.py:308 -- Removed the following hyperparameter values when logging to tensorboard: {'loss': ('__ref_ph', 'de895953'), 'n_freq_downsample': (40, 20, 1), 'n_pool_kernel_size': (16, 8, 1), 'valid_loss': ('__ref_ph', '004b9a7a')}
[36m(_train_tune pid=7674)[0m `Trainer.fit` stopped: `max_steps=1400.0` reached.


[36m(_train_tune pid=7674)[0m 
[36m(_train_tune pid=7674)[0m Validation DataLoader 0: 100%|██████████| 7/7 [00:01<00:00,  3.67it/s][A
[36m(_train_tune pid=7674)[0m                                                                       [AEpoch 199: 100%|██████████| 7/7 [00:02<00:00,  3.12it/s, v_num=0, train_loss_step=-1.90, train_loss_epoch=-2.06, valid_loss=-2.03]Epoch 199: 100%|██████████| 7/7 [00:02<00:00,  3.12it/s, v_num=0, train_loss_step=-1.90, train_loss_epoch=-2.01, valid_loss=-2.03]Epoch 199: 100%|██████████| 7/7 [00:02<00:00,  3.12it/s, v_num=0, train_loss_step=-1.90, train_loss_epoch=-2.01, valid_loss=-2.03]


[36m(_train_tune pid=8146)[0m /usr/local/lib/python3.10/dist-packages/ray/tune/integration/pytorch_lightning.py:198: `ray.tune.integration.pytorch_lightning.TuneReportCallback` is deprecated. Use `ray.tune.integration.pytorch_lightning.TuneReportCheckpointCallback` instead.
[36m(_train_tune pid=8146)[0m Seed set to 42
[36m(_train_tune pid=8146)[0m GPU available: True (cuda), used: True
[36m(_train_tune pid=8146)[0m TPU available: False, using: 0 TPU cores
[36m(_train_tune pid=8146)[0m HPU available: False, using: 0 HPUs
[36m(_train_tune pid=8146)[0m You are using a CUDA device ('NVIDIA A100-SXM4-40GB') that has Tensor Cores. To properly utilize them, you should set `torch.set_float32_matmul_precision('medium' | 'high')` which will trade-off precision for performance. For more details, read https://pytorch.org/docs/stable/generated/torch.set_float32_matmul_precision.html#torch.set_float32_matmul_precision
[36m(_train_tune pid=8146)[0m 2024-11-12 18:31:38.113999: I tensorfl

Sanity Checking: |          | 0/? [00:00<?, ?it/s]
Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Epoch 0:   0%|          | 0/2 [00:00<?, ?it/s] 
Epoch 1:   0%|          | 0/2 [00:00<?, ?it/s, v_num=0, train_loss_step=0.797, train_loss_epoch=0.877]
Epoch 2:   0%|          | 0/2 [00:00<?, ?it/s, v_num=0, train_loss_step=0.325, train_loss_epoch=0.464]
Epoch 3:   0%|          | 0/2 [00:00<?, ?it/s, v_num=0, train_loss_step=-0.531, train_loss_epoch=-0.299]
Epoch 4:   0%|          | 0/2 [00:00<?, ?it/s, v_num=0, train_loss_step=1.500, train_loss_epoch=0.533]
Epoch 5:   0%|          | 0/2 [00:00<?, ?it/s, v_num=0, train_loss_step=0.472, train_loss_epoch=0.0399]
Epoch 5: 100%|██████████| 2/2 [00:00<00:00,  8.52it/s, v_num=0, train_loss_step=-0.704, train_loss_epoch=-0.154]
Epoch 6:   0%|          | 0/2 [00:00<?, ?it/s, v_num=0, train_loss_step=-0.704, train_loss_epoch=-0.154]
Epoch 7:   0%|          | 0/2 [00:00<?, ?it/s, v_num=0, train_loss_step=-0.137, train_loss_epoch=

2024-11-12 18:33:20,332	INFO tensorboardx.py:308 -- Removed the following hyperparameter values when logging to tensorboard: {'loss': ('__ref_ph', 'de895953'), 'n_freq_downsample': (60, 8, 1), 'n_pool_kernel_size': (16, 8, 1), 'valid_loss': ('__ref_ph', '004b9a7a')}
[36m(_train_tune pid=8146)[0m `Trainer.fit` stopped: `max_steps=800.0` reached.


[36m(_train_tune pid=8146)[0m 
[36m(_train_tune pid=8146)[0m Validation DataLoader 0: 100%|██████████| 2/2 [00:00<00:00, 11.65it/s][A
[36m(_train_tune pid=8146)[0m                                                                       [AEpoch 399: 100%|██████████| 2/2 [00:00<00:00,  3.65it/s, v_num=0, train_loss_step=-1.19, train_loss_epoch=-1.22, valid_loss=-1.24]Epoch 399: 100%|██████████| 2/2 [00:00<00:00,  3.62it/s, v_num=0, train_loss_step=-1.19, train_loss_epoch=-1.20, valid_loss=-1.24]Epoch 399: 100%|██████████| 2/2 [00:00<00:00,  3.61it/s, v_num=0, train_loss_step=-1.19, train_loss_epoch=-1.20, valid_loss=-1.24]


[36m(_train_tune pid=8667)[0m /usr/local/lib/python3.10/dist-packages/ray/tune/integration/pytorch_lightning.py:198: `ray.tune.integration.pytorch_lightning.TuneReportCallback` is deprecated. Use `ray.tune.integration.pytorch_lightning.TuneReportCheckpointCallback` instead.
[36m(_train_tune pid=8667)[0m Seed set to 42
[36m(_train_tune pid=8667)[0m GPU available: True (cuda), used: True
[36m(_train_tune pid=8667)[0m TPU available: False, using: 0 TPU cores
[36m(_train_tune pid=8667)[0m HPU available: False, using: 0 HPUs
[36m(_train_tune pid=8667)[0m You are using a CUDA device ('NVIDIA A100-SXM4-40GB') that has Tensor Cores. To properly utilize them, you should set `torch.set_float32_matmul_precision('medium' | 'high')` which will trade-off precision for performance. For more details, read https://pytorch.org/docs/stable/generated/torch.set_float32_matmul_precision.html#torch.set_float32_matmul_precision
[36m(_train_tune pid=8667)[0m 2024-11-12 18:33:28.113358: I tensorfl

Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Epoch 0:   0%|          | 0/13 [00:00<?, ?it/s] 
Epoch 1:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.10, train_loss_epoch=-1.30]
Epoch 2:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.95, train_loss_epoch=-1.52]
Epoch 3:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.10, train_loss_epoch=-1.60]
Epoch 4:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.55, train_loss_epoch=-1.72]
Epoch 5:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.97, train_loss_epoch=-1.75]
Epoch 6:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.77, train_loss_epoch=-1.80]
Epoch 7:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.00, train_loss_epoch=-1.83]
[36m(_train_tune pid=8667)[0m 
Validation: |          | 0/? [00:00<?, ?it/s][A
Validation:   0%|          | 0/13 [00:00<?, ?it/s][A
Validation DataLoad

2024-11-12 18:33:55,152	INFO tensorboardx.py:308 -- Removed the following hyperparameter values when logging to tensorboard: {'loss': ('__ref_ph', 'de895953'), 'n_freq_downsample': (40, 20, 1), 'n_pool_kernel_size': (1, 1, 1), 'valid_loss': ('__ref_ph', '004b9a7a')}
[36m(_train_tune pid=8667)[0m `Trainer.fit` stopped: `max_steps=500.0` reached.


[36m(_train_tune pid=8667)[0m 
[36m(_train_tune pid=8667)[0m Validation DataLoader 0: 100%|██████████| 13/13 [00:01<00:00,  7.32it/s][A
[36m(_train_tune pid=8667)[0m                                                                         [AEpoch 38:   0%|          | 0/13 [00:01<?, ?it/s, v_num=0, train_loss_step=-1.75, train_loss_epoch=-1.88, valid_loss=-1.92]Epoch 38:   0%|          | 0/13 [00:01<?, ?it/s, v_num=0, train_loss_step=-1.75, train_loss_epoch=-1.98, valid_loss=-1.92]Epoch 38:   0%|          | 0/13 [00:01<?, ?it/s, v_num=0, train_loss_step=-1.75, train_loss_epoch=-1.98, valid_loss=-1.92]


[36m(_train_tune pid=8875)[0m /usr/local/lib/python3.10/dist-packages/ray/tune/integration/pytorch_lightning.py:198: `ray.tune.integration.pytorch_lightning.TuneReportCallback` is deprecated. Use `ray.tune.integration.pytorch_lightning.TuneReportCheckpointCallback` instead.
[36m(_train_tune pid=8875)[0m Seed set to 42
[36m(_train_tune pid=8875)[0m GPU available: True (cuda), used: True
[36m(_train_tune pid=8875)[0m TPU available: False, using: 0 TPU cores
[36m(_train_tune pid=8875)[0m HPU available: False, using: 0 HPUs
[36m(_train_tune pid=8875)[0m You are using a CUDA device ('NVIDIA A100-SXM4-40GB') that has Tensor Cores. To properly utilize them, you should set `torch.set_float32_matmul_precision('medium' | 'high')` which will trade-off precision for performance. For more details, read https://pytorch.org/docs/stable/generated/torch.set_float32_matmul_precision.html#torch.set_float32_matmul_precision
[36m(_train_tune pid=8875)[0m 2024-11-12 18:34:03.136477: I tensorfl

Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Epoch 0:   0%|          | 0/13 [00:00<?, ?it/s] 
Epoch 1:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.61, train_loss_epoch=-1.49]
Epoch 2:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.22, train_loss_epoch=-1.74]
Epoch 3:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.13, train_loss_epoch=-1.81]
Epoch 4:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.75, train_loss_epoch=-1.81]
Epoch 5:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.30, train_loss_epoch=-1.89]
Epoch 6:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.89, train_loss_epoch=-1.89]
Epoch 7:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.84, train_loss_epoch=-1.91]
[36m(_train_tune pid=8875)[0m 
Validation: |          | 0/? [00:00<?, ?it/s][A
Validation:   0%|          | 0/13 [00:00<?, ?it/s][A
Validation DataLoad

2024-11-12 18:34:29,625	INFO tensorboardx.py:308 -- Removed the following hyperparameter values when logging to tensorboard: {'loss': ('__ref_ph', 'de895953'), 'n_freq_downsample': (168, 24, 1), 'n_pool_kernel_size': (4, 4, 4), 'valid_loss': ('__ref_ph', '004b9a7a')}
[36m(_train_tune pid=8875)[0m `Trainer.fit` stopped: `max_steps=900.0` reached.


[36m(_train_tune pid=8875)[0m 
[36m(_train_tune pid=8875)[0m Validation DataLoader 0: 100%|██████████| 13/13 [00:00<00:00, 47.46it/s][A
[36m(_train_tune pid=8875)[0m                                                                         [AEpoch 69:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.05, train_loss_epoch=-2.03, valid_loss=-1.97]Epoch 69:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.05, train_loss_epoch=-2.02, valid_loss=-1.97]Epoch 69:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.05, train_loss_epoch=-2.02, valid_loss=-1.97]


[36m(_train_tune pid=9084)[0m /usr/local/lib/python3.10/dist-packages/ray/tune/integration/pytorch_lightning.py:198: `ray.tune.integration.pytorch_lightning.TuneReportCallback` is deprecated. Use `ray.tune.integration.pytorch_lightning.TuneReportCheckpointCallback` instead.
[36m(_train_tune pid=9084)[0m Seed set to 42
[36m(_train_tune pid=9084)[0m GPU available: True (cuda), used: True
[36m(_train_tune pid=9084)[0m TPU available: False, using: 0 TPU cores
[36m(_train_tune pid=9084)[0m HPU available: False, using: 0 HPUs
[36m(_train_tune pid=9084)[0m You are using a CUDA device ('NVIDIA A100-SXM4-40GB') that has Tensor Cores. To properly utilize them, you should set `torch.set_float32_matmul_precision('medium' | 'high')` which will trade-off precision for performance. For more details, read https://pytorch.org/docs/stable/generated/torch.set_float32_matmul_precision.html#torch.set_float32_matmul_precision
[36m(_train_tune pid=9084)[0m 2024-11-12 18:34:38.023364: I tensorfl

Sanity Checking: |          | 0/? [00:00<?, ?it/s]
Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Epoch 0:   0%|          | 0/13 [00:00<?, ?it/s] 
Epoch 1:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.52, train_loss_epoch=-1.50]
Epoch 2:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.08, train_loss_epoch=-1.76]
Epoch 3:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.23, train_loss_epoch=-1.74]
Epoch 4:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.61, train_loss_epoch=-1.82]
Epoch 5:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.01, train_loss_epoch=-1.84]
Epoch 6:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.84, train_loss_epoch=-1.86]
Epoch 7:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.02, train_loss_epoch=-1.87]
[36m(_train_tune pid=9084)[0m 
Validation: |          | 0/? [00:00<?, ?it/s][A
Validation:   0%|     

[36m(_train_tune pid=9084)[0m `Trainer.fit` stopped: `max_steps=1200.0` reached.
2024-11-12 18:35:35,971	INFO tensorboardx.py:308 -- Removed the following hyperparameter values when logging to tensorboard: {'loss': ('__ref_ph', 'de895953'), 'n_freq_downsample': (180, 60, 1), 'n_pool_kernel_size': (1, 1, 1), 'valid_loss': ('__ref_ph', '004b9a7a')}


[36m(_train_tune pid=9084)[0m 
[36m(_train_tune pid=9084)[0m Validation DataLoader 0: 100%|██████████| 13/13 [00:01<00:00,  7.16it/s][A
[36m(_train_tune pid=9084)[0m                                                                         [AEpoch 92:   0%|          | 0/13 [00:01<?, ?it/s, v_num=0, train_loss_step=-2.13, train_loss_epoch=-2.00, valid_loss=-2.02]Epoch 92:   0%|          | 0/13 [00:01<?, ?it/s, v_num=0, train_loss_step=-2.13, train_loss_epoch=-2.06, valid_loss=-2.02]Epoch 92:   0%|          | 0/13 [00:01<?, ?it/s, v_num=0, train_loss_step=-2.13, train_loss_epoch=-2.06, valid_loss=-2.02]


[36m(_train_tune pid=9416)[0m /usr/local/lib/python3.10/dist-packages/ray/tune/integration/pytorch_lightning.py:198: `ray.tune.integration.pytorch_lightning.TuneReportCallback` is deprecated. Use `ray.tune.integration.pytorch_lightning.TuneReportCheckpointCallback` instead.
[36m(_train_tune pid=9416)[0m Seed set to 42
[36m(_train_tune pid=9416)[0m GPU available: True (cuda), used: True
[36m(_train_tune pid=9416)[0m TPU available: False, using: 0 TPU cores
[36m(_train_tune pid=9416)[0m HPU available: False, using: 0 HPUs
[36m(_train_tune pid=9416)[0m You are using a CUDA device ('NVIDIA A100-SXM4-40GB') that has Tensor Cores. To properly utilize them, you should set `torch.set_float32_matmul_precision('medium' | 'high')` which will trade-off precision for performance. For more details, read https://pytorch.org/docs/stable/generated/torch.set_float32_matmul_precision.html#torch.set_float32_matmul_precision
[36m(_train_tune pid=9416)[0m 2024-11-12 18:35:44.184211: I tensorfl

Sanity Checking: |          | 0/? [00:00<?, ?it/s]
Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Sanity Checking DataLoader 0: 100%|██████████| 2/2 [00:02<00:00,  0.82it/s]
Epoch 0:   0%|          | 0/4 [00:00<?, ?it/s] 
Epoch 1:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.33, train_loss_epoch=-1.27]
Epoch 2:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.05, train_loss_epoch=-1.58]
Epoch 3:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.86, train_loss_epoch=-1.66]
Epoch 4:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.40, train_loss_epoch=-1.57]
Epoch 5:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.05, train_loss_epoch=-1.66]
Epoch 6:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.60, train_loss_epoch=-1.65]
Epoch 7:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.76, train_loss_epoch=-1.74]
Epoch 8:   0%|          | 0/4 [00:00

[36m(_train_tune pid=9416)[0m `Trainer.fit` stopped: `max_steps=500.0` reached.
2024-11-12 18:36:42,105	INFO tensorboardx.py:308 -- Removed the following hyperparameter values when logging to tensorboard: {'loss': ('__ref_ph', 'de895953'), 'n_freq_downsample': (60, 8, 1), 'n_pool_kernel_size': (1, 1, 1), 'valid_loss': ('__ref_ph', '004b9a7a')}
[36m(_train_tune pid=9752)[0m /usr/local/lib/python3.10/dist-packages/ray/tune/integration/pytorch_lightning.py:198: `ray.tune.integration.pytorch_lightning.TuneReportCallback` is deprecated. Use `ray.tune.integration.pytorch_lightning.TuneReportCheckpointCallback` instead.
[36m(_train_tune pid=9752)[0m Seed set to 42
[36m(_train_tune pid=9752)[0m GPU available: True (cuda), used: True
[36m(_train_tune pid=9752)[0m TPU available: False, using: 0 TPU cores
[36m(_train_tune pid=9752)[0m HPU available: False, using: 0 HPUs
[36m(_train_tune pid=9752)[0m You are using a CUDA device ('NVIDIA A100-SXM4-40GB') that has Tensor Cores. To prop

Sanity Checking: |          | 0/? [00:00<?, ?it/s]
Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Epoch 0:   0%|          | 0/2 [00:00<?, ?it/s] 
Epoch 1:   0%|          | 0/2 [00:00<?, ?it/s, v_num=0, train_loss_step=0.723, train_loss_epoch=0.845]
Epoch 2:   0%|          | 0/2 [00:00<?, ?it/s, v_num=0, train_loss_step=-0.187, train_loss_epoch=0.0342]
Epoch 3:   0%|          | 0/2 [00:00<?, ?it/s, v_num=0, train_loss_step=1.190, train_loss_epoch=2.180]
Epoch 4:   0%|          | 0/2 [00:00<?, ?it/s, v_num=0, train_loss_step=0.218, train_loss_epoch=0.0407]
Epoch 5:   0%|          | 0/2 [00:00<?, ?it/s, v_num=0, train_loss_step=0.474, train_loss_epoch=0.443]
Epoch 6:   0%|          | 0/2 [00:00<?, ?it/s, v_num=0, train_loss_step=0.474, train_loss_epoch=0.479]
Epoch 7:   0%|          | 0/2 [00:00<?, ?it/s, v_num=0, train_loss_step=0.470, train_loss_epoch=0.480]
Epoch 8:   0%|          | 0/2 [00:00<?, ?it/s, v_num=0, train_loss_step=0.399, train_loss_epoch=0.421]
Epoch 

2024-11-12 18:39:01,588	INFO tensorboardx.py:308 -- Removed the following hyperparameter values when logging to tensorboard: {'loss': ('__ref_ph', 'de895953'), 'n_freq_downsample': (40, 20, 1), 'n_pool_kernel_size': (2, 2, 1), 'valid_loss': ('__ref_ph', '004b9a7a')}
[36m(_train_tune pid=9752)[0m `Trainer.fit` stopped: `max_steps=900.0` reached.


[36m(_train_tune pid=9752)[0m 
[36m(_train_tune pid=9752)[0m Validation DataLoader 0: 100%|██████████| 2/2 [00:00<00:00, 11.29it/s][A
[36m(_train_tune pid=9752)[0m                                                                       [AEpoch 449: 100%|██████████| 2/2 [00:00<00:00,  3.34it/s, v_num=0, train_loss_step=-1.26, train_loss_epoch=-1.24, valid_loss=-1.24]Epoch 449: 100%|██████████| 2/2 [00:00<00:00,  3.31it/s, v_num=0, train_loss_step=-1.26, train_loss_epoch=-1.24, valid_loss=-1.24]Epoch 449: 100%|██████████| 2/2 [00:00<00:00,  3.31it/s, v_num=0, train_loss_step=-1.26, train_loss_epoch=-1.24, valid_loss=-1.24]


[36m(_train_tune pid=10397)[0m /usr/local/lib/python3.10/dist-packages/ray/tune/integration/pytorch_lightning.py:198: `ray.tune.integration.pytorch_lightning.TuneReportCallback` is deprecated. Use `ray.tune.integration.pytorch_lightning.TuneReportCheckpointCallback` instead.
[36m(_train_tune pid=10397)[0m Seed set to 42
[36m(_train_tune pid=10397)[0m GPU available: True (cuda), used: True
[36m(_train_tune pid=10397)[0m TPU available: False, using: 0 TPU cores
[36m(_train_tune pid=10397)[0m HPU available: False, using: 0 HPUs
[36m(_train_tune pid=10397)[0m You are using a CUDA device ('NVIDIA A100-SXM4-40GB') that has Tensor Cores. To properly utilize them, you should set `torch.set_float32_matmul_precision('medium' | 'high')` which will trade-off precision for performance. For more details, read https://pytorch.org/docs/stable/generated/torch.set_float32_matmul_precision.html#torch.set_float32_matmul_precision
[36m(_train_tune pid=10397)[0m 2024-11-12 18:39:10.140336: I t

Sanity Checking: |          | 0/? [00:00<?, ?it/s]
Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Epoch 0:   0%|          | 0/7 [00:00<?, ?it/s] 
Epoch 1:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=11.30, train_loss_epoch=163.0]
Epoch 2:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=0.378, train_loss_epoch=1.380]
Epoch 3:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-0.146, train_loss_epoch=1.930]
Epoch 4:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=0.0514, train_loss_epoch=0.619]
Epoch 5:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-0.983, train_loss_epoch=-0.498]
Epoch 6:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-0.909, train_loss_epoch=-0.86]
Epoch 7:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.11, train_loss_epoch=-1.02]
Epoch 8:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-0.99, train_loss_epoch=-1.05]
Epoc

[36m(_train_tune pid=10397)[0m `Trainer.fit` stopped: `max_steps=1300.0` reached.
2024-11-12 18:40:31,263	INFO tensorboardx.py:308 -- Removed the following hyperparameter values when logging to tensorboard: {'loss': ('__ref_ph', 'de895953'), 'n_freq_downsample': (24, 12, 1), 'n_pool_kernel_size': (4, 4, 4), 'valid_loss': ('__ref_ph', '004b9a7a')}


[36m(_train_tune pid=10397)[0m 
[36m(_train_tune pid=10397)[0m Validation DataLoader 0: 100%|██████████| 7/7 [00:01<00:00,  3.82it/s][A
[36m(_train_tune pid=10397)[0m                                                                       [AEpoch 185:   0%|          | 0/7 [00:02<?, ?it/s, v_num=0, train_loss_step=-1.27, train_loss_epoch=-1.22, valid_loss=-1.25]Epoch 185:   0%|          | 0/7 [00:02<?, ?it/s, v_num=0, train_loss_step=-1.27, train_loss_epoch=-1.24, valid_loss=-1.25]Epoch 185:   0%|          | 0/7 [00:02<?, ?it/s, v_num=0, train_loss_step=-1.27, train_loss_epoch=-1.24, valid_loss=-1.25]


[36m(_train_tune pid=10824)[0m /usr/local/lib/python3.10/dist-packages/ray/tune/integration/pytorch_lightning.py:198: `ray.tune.integration.pytorch_lightning.TuneReportCallback` is deprecated. Use `ray.tune.integration.pytorch_lightning.TuneReportCheckpointCallback` instead.
[36m(_train_tune pid=10824)[0m Seed set to 42
[36m(_train_tune pid=10824)[0m GPU available: True (cuda), used: True
[36m(_train_tune pid=10824)[0m TPU available: False, using: 0 TPU cores
[36m(_train_tune pid=10824)[0m HPU available: False, using: 0 HPUs
[36m(_train_tune pid=10824)[0m You are using a CUDA device ('NVIDIA A100-SXM4-40GB') that has Tensor Cores. To properly utilize them, you should set `torch.set_float32_matmul_precision('medium' | 'high')` which will trade-off precision for performance. For more details, read https://pytorch.org/docs/stable/generated/torch.set_float32_matmul_precision.html#torch.set_float32_matmul_precision
[36m(_train_tune pid=10824)[0m 2024-11-12 18:40:39.241572: I t

Sanity Checking: |          | 0/? [00:00<?, ?it/s]
Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Sanity Checking DataLoader 0: 100%|██████████| 2/2 [00:00<00:00,  2.03it/s]
Epoch 0:   0%|          | 0/4 [00:00<?, ?it/s] 
Epoch 0: 100%|██████████| 4/4 [00:00<00:00, 10.00it/s, v_num=0, train_loss_step=-1.63, train_loss_epoch=-1.48]
Epoch 1:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.63, train_loss_epoch=-1.48]
Epoch 2:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.36, train_loss_epoch=-1.80]
Epoch 3:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.11, train_loss_epoch=-1.83]
Epoch 4:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.64, train_loss_epoch=-1.78]
Epoch 5:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.12, train_loss_epoch=-1.91]
Epoch 6:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.78, train_loss_epoch=-1.87]
Epoch 7:   0%|          | 0/

2024-11-12 18:42:21,310	INFO tensorboardx.py:308 -- Removed the following hyperparameter values when logging to tensorboard: {'loss': ('__ref_ph', 'de895953'), 'n_freq_downsample': (1, 1, 1), 'n_pool_kernel_size': (16, 8, 1), 'valid_loss': ('__ref_ph', '004b9a7a')}
[36m(_train_tune pid=10824)[0m `Trainer.fit` stopped: `max_steps=1300.0` reached.


[36m(_train_tune pid=10824)[0m 
[36m(_train_tune pid=10824)[0m Validation DataLoader 0: 100%|██████████| 4/4 [00:00<00:00, 15.64it/s][A
[36m(_train_tune pid=10824)[0m                                                                       [AEpoch 324: 100%|██████████| 4/4 [00:00<00:00,  6.32it/s, v_num=0, train_loss_step=-2.58, train_loss_epoch=-2.21, valid_loss=-2.05]Epoch 324: 100%|██████████| 4/4 [00:00<00:00,  6.31it/s, v_num=0, train_loss_step=-2.58, train_loss_epoch=-2.24, valid_loss=-2.05]Epoch 324: 100%|██████████| 4/4 [00:00<00:00,  6.30it/s, v_num=0, train_loss_step=-2.58, train_loss_epoch=-2.24, valid_loss=-2.05]


[36m(_train_tune pid=11343)[0m /usr/local/lib/python3.10/dist-packages/ray/tune/integration/pytorch_lightning.py:198: `ray.tune.integration.pytorch_lightning.TuneReportCallback` is deprecated. Use `ray.tune.integration.pytorch_lightning.TuneReportCheckpointCallback` instead.
[36m(_train_tune pid=11343)[0m Seed set to 42
[36m(_train_tune pid=11343)[0m GPU available: True (cuda), used: True
[36m(_train_tune pid=11343)[0m TPU available: False, using: 0 TPU cores
[36m(_train_tune pid=11343)[0m HPU available: False, using: 0 HPUs
[36m(_train_tune pid=11343)[0m You are using a CUDA device ('NVIDIA A100-SXM4-40GB') that has Tensor Cores. To properly utilize them, you should set `torch.set_float32_matmul_precision('medium' | 'high')` which will trade-off precision for performance. For more details, read https://pytorch.org/docs/stable/generated/torch.set_float32_matmul_precision.html#torch.set_float32_matmul_precision
[36m(_train_tune pid=11343)[0m 2024-11-12 18:42:29.153289: I t

Sanity Checking: |          | 0/? [00:00<?, ?it/s]
Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Epoch 0:   0%|          | 0/7 [00:00<?, ?it/s] 
Epoch 1:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.44, train_loss_epoch=-1.50]
Epoch 2:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.18, train_loss_epoch=-1.62]
Epoch 3:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.91, train_loss_epoch=-1.62]
Epoch 4:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.47, train_loss_epoch=-1.56]
Epoch 5:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.02, train_loss_epoch=-1.69]
Epoch 6:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.57, train_loss_epoch=-1.67]
Epoch 7:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.78, train_loss_epoch=-1.74]
Epoch 8:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.58, train_loss_epoch=-1.75]
Epoch 9: 

2024-11-12 18:43:28,861	INFO tensorboardx.py:308 -- Removed the following hyperparameter values when logging to tensorboard: {'loss': ('__ref_ph', 'de895953'), 'n_freq_downsample': (40, 20, 1), 'n_pool_kernel_size': (2, 2, 2), 'valid_loss': ('__ref_ph', '004b9a7a')}


[36m(_train_tune pid=11343)[0m 
[36m(_train_tune pid=11343)[0m Validation DataLoader 0: 100%|██████████| 7/7 [00:00<00:00, 31.46it/s][A
[36m(_train_tune pid=11343)[0m 
[36m(_train_tune pid=11343)[0m                                                                       [AEpoch 214:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.17, train_loss_epoch=-2.12, valid_loss=-1.99]Epoch 214:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.17, train_loss_epoch=-2.10, valid_loss=-1.99]Epoch 214:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.17, train_loss_epoch=-2.10, valid_loss=-1.99]


[36m(_train_tune pid=11343)[0m `Trainer.fit` stopped: `max_steps=1500.0` reached.
[36m(_train_tune pid=11686)[0m /usr/local/lib/python3.10/dist-packages/ray/tune/integration/pytorch_lightning.py:198: `ray.tune.integration.pytorch_lightning.TuneReportCallback` is deprecated. Use `ray.tune.integration.pytorch_lightning.TuneReportCheckpointCallback` instead.
[36m(_train_tune pid=11686)[0m Seed set to 42
[36m(_train_tune pid=11686)[0m GPU available: True (cuda), used: True
[36m(_train_tune pid=11686)[0m TPU available: False, using: 0 TPU cores
[36m(_train_tune pid=11686)[0m HPU available: False, using: 0 HPUs
[36m(_train_tune pid=11686)[0m You are using a CUDA device ('NVIDIA A100-SXM4-40GB') that has Tensor Cores. To properly utilize them, you should set `torch.set_float32_matmul_precision('medium' | 'high')` which will trade-off precision for performance. For more details, read https://pytorch.org/docs/stable/generated/torch.set_float32_matmul_precision.html#torch.set_float

Sanity Checking: |          | 0/? [00:00<?, ?it/s]
Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Epoch 0:   0%|          | 0/7 [00:00<?, ?it/s] 
Epoch 1:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.56, train_loss_epoch=-0.888]
Epoch 2:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.31, train_loss_epoch=-1.75]
Epoch 3:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.09, train_loss_epoch=-1.82]
Epoch 4:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.67, train_loss_epoch=-1.82]
Epoch 5:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.13, train_loss_epoch=-1.90]
Epoch 6:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.87, train_loss_epoch=-1.87]
Epoch 7:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.00, train_loss_epoch=-1.93]
Epoch 8:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.80, train_loss_epoch=-1.89]
Epoch 9:

[36m(_train_tune pid=11686)[0m `Trainer.fit` stopped: `max_steps=1500.0` reached.
2024-11-12 18:44:32,708	INFO tensorboardx.py:308 -- Removed the following hyperparameter values when logging to tensorboard: {'loss': ('__ref_ph', 'de895953'), 'n_freq_downsample': (40, 20, 1), 'n_pool_kernel_size': (16, 8, 1), 'valid_loss': ('__ref_ph', '004b9a7a')}


[36m(_train_tune pid=11686)[0m 
[36m(_train_tune pid=11686)[0m Validation DataLoader 0: 100%|██████████| 7/7 [00:00<00:00, 29.22it/s][A
[36m(_train_tune pid=11686)[0m 
[36m(_train_tune pid=11686)[0m                                                                       [AEpoch 214:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.19, train_loss_epoch=-2.19, valid_loss=-1.99]
[36m(_train_tune pid=11686)[0m Epoch 214:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.19, train_loss_epoch=-2.15, valid_loss=-1.99]Epoch 214:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.19, train_loss_epoch=-2.15, valid_loss=-1.99]


[36m(_train_tune pid=12013)[0m /usr/local/lib/python3.10/dist-packages/ray/tune/integration/pytorch_lightning.py:198: `ray.tune.integration.pytorch_lightning.TuneReportCallback` is deprecated. Use `ray.tune.integration.pytorch_lightning.TuneReportCheckpointCallback` instead.
[36m(_train_tune pid=12013)[0m Seed set to 42
[36m(_train_tune pid=12013)[0m GPU available: True (cuda), used: True
[36m(_train_tune pid=12013)[0m TPU available: False, using: 0 TPU cores
[36m(_train_tune pid=12013)[0m HPU available: False, using: 0 HPUs
[36m(_train_tune pid=12013)[0m You are using a CUDA device ('NVIDIA A100-SXM4-40GB') that has Tensor Cores. To properly utilize them, you should set `torch.set_float32_matmul_precision('medium' | 'high')` which will trade-off precision for performance. For more details, read https://pytorch.org/docs/stable/generated/torch.set_float32_matmul_precision.html#torch.set_float32_matmul_precision
[36m(_train_tune pid=12013)[0m 2024-11-12 18:44:41.182293: I t

Sanity Checking: |          | 0/? [00:00<?, ?it/s]
Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Epoch 0:   0%|          | 0/7 [00:00<?, ?it/s] 
Epoch 1:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.44, train_loss_epoch=-0.126]
Epoch 2:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.24, train_loss_epoch=-1.70]
Epoch 3:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.05, train_loss_epoch=-1.75]
Epoch 4:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.64, train_loss_epoch=-1.77]
Epoch 5:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.13, train_loss_epoch=-1.87]
Epoch 6:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.67, train_loss_epoch=-1.84]
Epoch 7:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.95, train_loss_epoch=-1.89]
Epoch 8:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.63, train_loss_epoch=-1.81]
Epoch 9:

[36m(_train_tune pid=12013)[0m `Trainer.fit` stopped: `max_steps=1400.0` reached.
2024-11-12 18:46:14,624	INFO tensorboardx.py:308 -- Removed the following hyperparameter values when logging to tensorboard: {'loss': ('__ref_ph', 'de895953'), 'n_freq_downsample': (168, 24, 1), 'n_pool_kernel_size': (8, 4, 1), 'valid_loss': ('__ref_ph', '004b9a7a')}


[36m(_train_tune pid=12013)[0m 
[36m(_train_tune pid=12013)[0m Validation DataLoader 0: 100%|██████████| 7/7 [00:01<00:00,  3.70it/s][A
[36m(_train_tune pid=12013)[0m                                                                       [AEpoch 199: 100%|██████████| 7/7 [00:02<00:00,  3.14it/s, v_num=0, train_loss_step=-1.95, train_loss_epoch=-2.08, valid_loss=-2.06]Epoch 199: 100%|██████████| 7/7 [00:02<00:00,  3.13it/s, v_num=0, train_loss_step=-1.95, train_loss_epoch=-2.06, valid_loss=-2.06]Epoch 199: 100%|██████████| 7/7 [00:02<00:00,  3.13it/s, v_num=0, train_loss_step=-1.95, train_loss_epoch=-2.06, valid_loss=-2.06]


[36m(_train_tune pid=12495)[0m /usr/local/lib/python3.10/dist-packages/ray/tune/integration/pytorch_lightning.py:198: `ray.tune.integration.pytorch_lightning.TuneReportCallback` is deprecated. Use `ray.tune.integration.pytorch_lightning.TuneReportCheckpointCallback` instead.
[36m(_train_tune pid=12495)[0m Seed set to 42
[36m(_train_tune pid=12495)[0m GPU available: True (cuda), used: True
[36m(_train_tune pid=12495)[0m TPU available: False, using: 0 TPU cores
[36m(_train_tune pid=12495)[0m HPU available: False, using: 0 HPUs
[36m(_train_tune pid=12495)[0m You are using a CUDA device ('NVIDIA A100-SXM4-40GB') that has Tensor Cores. To properly utilize them, you should set `torch.set_float32_matmul_precision('medium' | 'high')` which will trade-off precision for performance. For more details, read https://pytorch.org/docs/stable/generated/torch.set_float32_matmul_precision.html#torch.set_float32_matmul_precision
[36m(_train_tune pid=12495)[0m 2024-11-12 18:46:23.522018: I t

Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
                                                                           
Epoch 0:   0%|          | 0/7 [00:00<?, ?it/s] 
Epoch 1:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.68, train_loss_epoch=-1.50]
Epoch 2:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.39, train_loss_epoch=-1.82]
Epoch 3:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.15, train_loss_epoch=-1.88]
Epoch 4:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.72, train_loss_epoch=-1.88]
Epoch 5:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.17, train_loss_epoch=-1.96]
Epoch 6:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.87, train_loss_epoch=-1.91]
Epoch 7:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.05, train_loss_epoch=-1.97]
Epoch 8:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.82, train_lo

[36m(_train_tune pid=12495)[0m `Trainer.fit` stopped: `max_steps=1400.0` reached.
2024-11-12 18:47:15,999	INFO tensorboardx.py:308 -- Removed the following hyperparameter values when logging to tensorboard: {'loss': ('__ref_ph', 'de895953'), 'n_freq_downsample': (1, 1, 1), 'n_pool_kernel_size': (2, 2, 2), 'valid_loss': ('__ref_ph', '004b9a7a')}


[36m(_train_tune pid=12495)[0m 
[36m(_train_tune pid=12495)[0m Validation DataLoader 0: 100%|██████████| 7/7 [00:00<00:00, 27.58it/s][A
[36m(_train_tune pid=12495)[0m                                                                       [AEpoch 199: 100%|██████████| 7/7 [00:00<00:00, 13.48it/s, v_num=0, train_loss_step=-1.91, train_loss_epoch=-2.22, valid_loss=-2.01]Epoch 199: 100%|██████████| 7/7 [00:00<00:00, 13.46it/s, v_num=0, train_loss_step=-1.91, train_loss_epoch=-2.18, valid_loss=-2.01]Epoch 199: 100%|██████████| 7/7 [00:00<00:00, 13.43it/s, v_num=0, train_loss_step=-1.91, train_loss_epoch=-2.18, valid_loss=-2.01]


[36m(_train_tune pid=12811)[0m /usr/local/lib/python3.10/dist-packages/ray/tune/integration/pytorch_lightning.py:198: `ray.tune.integration.pytorch_lightning.TuneReportCallback` is deprecated. Use `ray.tune.integration.pytorch_lightning.TuneReportCheckpointCallback` instead.
[36m(_train_tune pid=12811)[0m Seed set to 42
[36m(_train_tune pid=12811)[0m GPU available: True (cuda), used: True
[36m(_train_tune pid=12811)[0m TPU available: False, using: 0 TPU cores
[36m(_train_tune pid=12811)[0m HPU available: False, using: 0 HPUs
[36m(_train_tune pid=12811)[0m You are using a CUDA device ('NVIDIA A100-SXM4-40GB') that has Tensor Cores. To properly utilize them, you should set `torch.set_float32_matmul_precision('medium' | 'high')` which will trade-off precision for performance. For more details, read https://pytorch.org/docs/stable/generated/torch.set_float32_matmul_precision.html#torch.set_float32_matmul_precision
[36m(_train_tune pid=12811)[0m 2024-11-12 18:47:24.399726: I t

Sanity Checking: |          | 0/? [00:00<?, ?it/s]
Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Sanity Checking DataLoader 0: 100%|██████████| 2/2 [00:02<00:00,  0.82it/s]
Epoch 0:   0%|          | 0/4 [00:00<?, ?it/s] 
Epoch 1:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.33, train_loss_epoch=-1.33]
Epoch 2:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.04, train_loss_epoch=-1.62]
Epoch 3:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.78, train_loss_epoch=-1.61]
Epoch 4:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.38, train_loss_epoch=-1.55]
Epoch 5:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.95, train_loss_epoch=-1.68]
Epoch 6:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.55, train_loss_epoch=-1.66]
Epoch 7:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.86, train_loss_epoch=-1.80]
Epoch 8:   0%|          | 0/4 [00:00

[36m(_train_tune pid=12811)[0m `Trainer.fit` stopped: `max_steps=1400.0` reached.
2024-11-12 18:50:00,910	INFO tensorboardx.py:308 -- Removed the following hyperparameter values when logging to tensorboard: {'loss': ('__ref_ph', 'de895953'), 'n_freq_downsample': (168, 24, 1), 'n_pool_kernel_size': (8, 4, 1), 'valid_loss': ('__ref_ph', '004b9a7a')}


[36m(_train_tune pid=12811)[0m 
[36m(_train_tune pid=12811)[0m Validation DataLoader 0: 100%|██████████| 4/4 [00:01<00:00,  2.03it/s][A
[36m(_train_tune pid=12811)[0m                                                                       [AEpoch 349: 100%|██████████| 4/4 [00:02<00:00,  1.65it/s, v_num=0, train_loss_step=-1.97, train_loss_epoch=-2.00, valid_loss=-2.05]Epoch 349: 100%|██████████| 4/4 [00:02<00:00,  1.65it/s, v_num=0, train_loss_step=-1.97, train_loss_epoch=-2.00, valid_loss=-2.05]Epoch 349: 100%|██████████| 4/4 [00:02<00:00,  1.65it/s, v_num=0, train_loss_step=-1.97, train_loss_epoch=-2.00, valid_loss=-2.05]


[36m(_train_tune pid=13559)[0m /usr/local/lib/python3.10/dist-packages/ray/tune/integration/pytorch_lightning.py:198: `ray.tune.integration.pytorch_lightning.TuneReportCallback` is deprecated. Use `ray.tune.integration.pytorch_lightning.TuneReportCheckpointCallback` instead.
[36m(_train_tune pid=13559)[0m Seed set to 42
[36m(_train_tune pid=13559)[0m GPU available: True (cuda), used: True
[36m(_train_tune pid=13559)[0m TPU available: False, using: 0 TPU cores
[36m(_train_tune pid=13559)[0m HPU available: False, using: 0 HPUs
[36m(_train_tune pid=13559)[0m You are using a CUDA device ('NVIDIA A100-SXM4-40GB') that has Tensor Cores. To properly utilize them, you should set `torch.set_float32_matmul_precision('medium' | 'high')` which will trade-off precision for performance. For more details, read https://pytorch.org/docs/stable/generated/torch.set_float32_matmul_precision.html#torch.set_float32_matmul_precision
[36m(_train_tune pid=13559)[0m 2024-11-12 18:50:09.452626: I t

Sanity Checking: |          | 0/? [00:00<?, ?it/s]
Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Epoch 0:   0%|          | 0/2 [00:00<?, ?it/s] 
Epoch 1:   0%|          | 0/2 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.53, train_loss_epoch=-1.55]
Epoch 1: 100%|██████████| 2/2 [00:00<00:00,  7.22it/s, v_num=0, train_loss_step=-1.55, train_loss_epoch=-1.55]
Epoch 2:   0%|          | 0/2 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.55, train_loss_epoch=-1.50]
Epoch 3:   0%|          | 0/2 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.59, train_loss_epoch=-1.58]
Epoch 4:   0%|          | 0/2 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.52, train_loss_epoch=-1.50]
Epoch 5:   0%|          | 0/2 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.53, train_loss_epoch=-1.56]
Epoch 6:   0%|          | 0/2 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.58, train_loss_epoch=-1.55]
Epoch 7:   0%|          | 0/2 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.54, train_loss_epoch=-1.52]
E

2024-11-12 18:52:29,366	INFO tensorboardx.py:308 -- Removed the following hyperparameter values when logging to tensorboard: {'loss': ('__ref_ph', 'de895953'), 'n_freq_downsample': (168, 24, 1), 'n_pool_kernel_size': (8, 4, 1), 'valid_loss': ('__ref_ph', '004b9a7a')}
[36m(_train_tune pid=13559)[0m `Trainer.fit` stopped: `max_steps=1100.0` reached.


[36m(_train_tune pid=13559)[0m 
[36m(_train_tune pid=13559)[0m Validation DataLoader 0: 100%|██████████| 2/2 [00:00<00:00, 11.40it/s][A
[36m(_train_tune pid=13559)[0m                                                                       [AEpoch 549: 100%|██████████| 2/2 [00:00<00:00,  3.62it/s, v_num=0, train_loss_step=-2.15, train_loss_epoch=-2.11, valid_loss=-1.97]Epoch 549: 100%|██████████| 2/2 [00:00<00:00,  3.60it/s, v_num=0, train_loss_step=-2.15, train_loss_epoch=-2.08, valid_loss=-1.97]Epoch 549: 100%|██████████| 2/2 [00:00<00:00,  3.59it/s, v_num=0, train_loss_step=-2.15, train_loss_epoch=-2.08, valid_loss=-1.97]


[36m(_train_tune pid=14236)[0m /usr/local/lib/python3.10/dist-packages/ray/tune/integration/pytorch_lightning.py:198: `ray.tune.integration.pytorch_lightning.TuneReportCallback` is deprecated. Use `ray.tune.integration.pytorch_lightning.TuneReportCheckpointCallback` instead.
[36m(_train_tune pid=14236)[0m Seed set to 42
[36m(_train_tune pid=14236)[0m GPU available: True (cuda), used: True
[36m(_train_tune pid=14236)[0m TPU available: False, using: 0 TPU cores
[36m(_train_tune pid=14236)[0m HPU available: False, using: 0 HPUs
[36m(_train_tune pid=14236)[0m You are using a CUDA device ('NVIDIA A100-SXM4-40GB') that has Tensor Cores. To properly utilize them, you should set `torch.set_float32_matmul_precision('medium' | 'high')` which will trade-off precision for performance. For more details, read https://pytorch.org/docs/stable/generated/torch.set_float32_matmul_precision.html#torch.set_float32_matmul_precision
[36m(_train_tune pid=14236)[0m 2024-11-12 18:52:37.274202: I t

Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Epoch 0:   0%|          | 0/7 [00:00<?, ?it/s] 
Epoch 1:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.64, train_loss_epoch=-1.07]
Epoch 2:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.35, train_loss_epoch=-1.79]
Epoch 3:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.17, train_loss_epoch=-1.84]
Epoch 4:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.74, train_loss_epoch=-1.85]
Epoch 5:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.13, train_loss_epoch=-1.91]
Epoch 6:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.85, train_loss_epoch=-1.86]
Epoch 7:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.02, train_loss_epoch=-1.93]
Epoch 8:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.75, train_loss_epoch=-1.89]
Epoch 9:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, trai

[36m(_train_tune pid=14236)[0m `Trainer.fit` stopped: `max_steps=1500.0` reached.
2024-11-12 18:53:34,055	INFO tensorboardx.py:308 -- Removed the following hyperparameter values when logging to tensorboard: {'loss': ('__ref_ph', 'de895953'), 'n_freq_downsample': (168, 24, 1), 'n_pool_kernel_size': (8, 4, 1), 'valid_loss': ('__ref_ph', '004b9a7a')}
2024-11-12 18:53:34,080	INFO tune.py:1009 -- Wrote the latest version of all result files and experiment state to '/root/ray_results/_train_tune_2024-11-12_18-17-38' in 0.0211s.
2024-11-12 18:53:34,084	ERROR tune.py:1037 -- Trials did not complete: [_train_tune_5c12a5b4, _train_tune_8be5387b, _train_tune_a6b09eb8]
INFO:lightning_fabric.utilities.seed:Seed set to 42
INFO:pytorch_lightning.utilities.rank_zero:GPU available: True (cuda), used: True
INFO:pytorch_lightning.utilities.rank_zero:TPU available: False, using: 0 TPU cores
INFO:pytorch_lightning.utilities.rank_zero:HPU available: False, using: 0 HPUs
INFO:pytorch_lightning.utilities.ra

[36m(_train_tune pid=14236)[0m 
[36m(_train_tune pid=14236)[0m Validation DataLoader 0: 100%|██████████| 7/7 [00:00<00:00, 27.31it/s][A
[36m(_train_tune pid=14236)[0m                                                                       [AEpoch 214:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.20, train_loss_epoch=-2.19, valid_loss=-1.99]
[36m(_train_tune pid=14236)[0m Epoch 214:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.20, train_loss_epoch=-2.16, valid_loss=-1.99]Epoch 214:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.20, train_loss_epoch=-2.16, valid_loss=-1.99]



INFO:pytorch_lightning.accelerators.cuda:LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
INFO:pytorch_lightning.callbacks.model_summary:
  | Name         | Type             | Params | Mode 
----------------------------------------------------------
0 | loss         | DistributionLoss | 3      | eval 
1 | padder_train | ConstantPad1d    | 0      | train
2 | scaler       | TemporalNorm     | 0      | train
3 | blocks       | ModuleList       | 2.6 M  | train
----------------------------------------------------------
2.6 M     Trainable params
3         Non-trainable params
2.6 M     Total params
10.495    Total estimated model params size (MB)
33        Modules in train mode
1         Modules in eval mode


Sanity Checking: |          | 0/? [00:00<?, ?it/s]

Training: |          | 0/? [00:00<?, ?it/s]

Validation: |          | 0/? [00:00<?, ?it/s]

Validation: |          | 0/? [00:00<?, ?it/s]

Validation: |          | 0/? [00:00<?, ?it/s]

Validation: |          | 0/? [00:00<?, ?it/s]

Validation: |          | 0/? [00:00<?, ?it/s]

Validation: |          | 0/? [00:00<?, ?it/s]

Validation: |          | 0/? [00:00<?, ?it/s]

Validation: |          | 0/? [00:00<?, ?it/s]

Validation: |          | 0/? [00:00<?, ?it/s]

Validation: |          | 0/? [00:00<?, ?it/s]

Validation: |          | 0/? [00:00<?, ?it/s]

Validation: |          | 0/? [00:00<?, ?it/s]

Validation: |          | 0/? [00:00<?, ?it/s]

Validation: |          | 0/? [00:00<?, ?it/s]

INFO:pytorch_lightning.utilities.rank_zero:`Trainer.fit` stopped: `max_steps=1400.0` reached.
INFO:pytorch_lightning.utilities.rank_zero:GPU available: True (cuda), used: True
INFO:pytorch_lightning.utilities.rank_zero:TPU available: False, using: 0 TPU cores
INFO:pytorch_lightning.utilities.rank_zero:HPU available: False, using: 0 HPUs
INFO:pytorch_lightning.accelerators.cuda:LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]


Predicting: |          | 0/? [00:00<?, ?it/s]

+--------------------------------------------------------------------+
| Configuration for experiment     _train_tune_2024-11-12_18-54-39   |
+--------------------------------------------------------------------+
| Search algorithm                 SearchGenerator                   |
| Scheduler                        FIFOScheduler                     |
| Number of trials                 30                                |
+--------------------------------------------------------------------+

View detailed results here: /root/ray_results/_train_tune_2024-11-12_18-54-39
To visualize your results with TensorBoard, run: `tensorboard --logdir /tmp/ray/session_2024-11-12_18-17-38_352630_2326/artifacts/2024-11-12_18-54-39/_train_tune_2024-11-12_18-54-39/driver_artifacts`


[36m(_train_tune pid=14842)[0m /usr/local/lib/python3.10/dist-packages/ray/tune/integration/pytorch_lightning.py:198: `ray.tune.integration.pytorch_lightning.TuneReportCallback` is deprecated. Use `ray.tune.integration.pytorch_lightning.TuneReportCheckpointCallback` instead.
[36m(_train_tune pid=14842)[0m Seed set to 42
[36m(_train_tune pid=14842)[0m GPU available: True (cuda), used: True
[36m(_train_tune pid=14842)[0m TPU available: False, using: 0 TPU cores
[36m(_train_tune pid=14842)[0m HPU available: False, using: 0 HPUs
[36m(_train_tune pid=14842)[0m You are using a CUDA device ('NVIDIA A100-SXM4-40GB') that has Tensor Cores. To properly utilize them, you should set `torch.set_float32_matmul_precision('medium' | 'high')` which will trade-off precision for performance. For more details, read https://pytorch.org/docs/stable/generated/torch.set_float32_matmul_precision.html#torch.set_float32_matmul_precision
[36m(_train_tune pid=14842)[0m 2024-11-12 18:54:46.822824: I t

Sanity Checking: |          | 0/? [00:00<?, ?it/s]
Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
                                                                           
Epoch 0:   0%|          | 0/4 [00:00<?, ?it/s] 
Epoch 1:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.36, train_loss_epoch=-1.44]
Epoch 2:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.02, train_loss_epoch=-1.56]
Epoch 3:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.78, train_loss_epoch=-1.56]
Epoch 4:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.41, train_loss_epoch=-1.43]
Epoch 5:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.97, train_loss_epoch=-1.58]
Epoch 6:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.36, train_loss_epoch=-1.50]
Epoch 7:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.57, train_loss_epoch=-1.51]
Epoch 8:   0%|          | 0/4 [00:00

2024-11-12 18:56:46,348	INFO tensorboardx.py:308 -- Removed the following hyperparameter values when logging to tensorboard: {'hist_exog_list': ('MA(2,9)', 'MA(3,9)', 'MA(1,12)', 'MA(2,12)', 'MA(3,12)', 'MOM(9)', 'MOM(12)', 'RSI(7)', 'RSI(14)', 'EMA(3,9)', 'EMA(5,9)', 'EMA(5,12)', 'DY', 'PTBV', 'P', 'PO', 'VO', 'PE'), 'loss': ('__ref_ph', 'de895953'), 'n_freq_downsample': (24, 12, 1), 'n_pool_kernel_size': (2, 2, 1), 'valid_loss': ('__ref_ph', '004b9a7a')}
[36m(_train_tune pid=14842)[0m `Trainer.fit` stopped: `max_steps=1100.0` reached.


[36m(_train_tune pid=14842)[0m 
[36m(_train_tune pid=14842)[0m Validation DataLoader 0: 100%|██████████| 4/4 [00:02<00:00,  1.99it/s][A
[36m(_train_tune pid=14842)[0m                                                                       [AEpoch 274: 100%|██████████| 4/4 [00:02<00:00,  1.65it/s, v_num=0, train_loss_step=-1.32, train_loss_epoch=-1.87, valid_loss=-1.98]Epoch 274: 100%|██████████| 4/4 [00:02<00:00,  1.65it/s, v_num=0, train_loss_step=-1.32, train_loss_epoch=-1.83, valid_loss=-1.98]Epoch 274: 100%|██████████| 4/4 [00:02<00:00,  1.65it/s, v_num=0, train_loss_step=-1.32, train_loss_epoch=-1.83, valid_loss=-1.98]


[36m(_train_tune pid=15431)[0m /usr/local/lib/python3.10/dist-packages/ray/tune/integration/pytorch_lightning.py:198: `ray.tune.integration.pytorch_lightning.TuneReportCallback` is deprecated. Use `ray.tune.integration.pytorch_lightning.TuneReportCheckpointCallback` instead.
[36m(_train_tune pid=15431)[0m Seed set to 42
[36m(_train_tune pid=15431)[0m GPU available: True (cuda), used: True
[36m(_train_tune pid=15431)[0m TPU available: False, using: 0 TPU cores
[36m(_train_tune pid=15431)[0m HPU available: False, using: 0 HPUs
[36m(_train_tune pid=15431)[0m You are using a CUDA device ('NVIDIA A100-SXM4-40GB') that has Tensor Cores. To properly utilize them, you should set `torch.set_float32_matmul_precision('medium' | 'high')` which will trade-off precision for performance. For more details, read https://pytorch.org/docs/stable/generated/torch.set_float32_matmul_precision.html#torch.set_float32_matmul_precision
[36m(_train_tune pid=15431)[0m 2024-11-12 18:56:54.353167: I t

Sanity Checking: |          | 0/? [00:00<?, ?it/s]
Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]


2024-11-12 18:56:58,606	ERROR tune_controller.py:1331 -- Trial task failed for trial _train_tune_be5546d3
Traceback (most recent call last):
  File "/usr/local/lib/python3.10/dist-packages/ray/air/execution/_internal/event_manager.py", line 110, in resolve_future
    result = ray.get(future)
  File "/usr/local/lib/python3.10/dist-packages/ray/_private/auto_init_hook.py", line 21, in auto_init_wrapper
    return fn(*args, **kwargs)
  File "/usr/local/lib/python3.10/dist-packages/ray/_private/client_mode_hook.py", line 103, in wrapper
    return func(*args, **kwargs)
  File "/usr/local/lib/python3.10/dist-packages/ray/_private/worker.py", line 2745, in get
    values, debugger_breakpoint = worker.get_objects(object_refs, timeout=timeout)
  File "/usr/local/lib/python3.10/dist-packages/ray/_private/worker.py", line 901, in get_objects
    raise value.as_instanceof_cause()
ray.exceptions.RayTaskError(OutOfMemoryError): [36mray::ImplicitFunc.train()[39m (pid=15431, ip=172.28.0.12, actor_i


Trial _train_tune_be5546d3 errored after 0 iterations at 2024-11-12 18:56:58. Total running time: 2min 19s
Error file: /tmp/ray/session_2024-11-12_18-17-38_352630_2326/artifacts/2024-11-12_18-54-39/_train_tune_2024-11-12_18-54-39/driver_artifacts/_train_tune_be5546d3_2_batch_size=256,h=20,hist_exog_list=MA_2_9_MA_3_9_MA_1_12_MA_2_12_MA_3_12_MOM_9_MOM_12_RSI_7_RSI_14_EMA_3_9__2024-11-12_18-54-46/error.txt


[36m(_train_tune pid=15539)[0m /usr/local/lib/python3.10/dist-packages/ray/tune/integration/pytorch_lightning.py:198: `ray.tune.integration.pytorch_lightning.TuneReportCallback` is deprecated. Use `ray.tune.integration.pytorch_lightning.TuneReportCheckpointCallback` instead.
[36m(_train_tune pid=15539)[0m Seed set to 42
[36m(_train_tune pid=15539)[0m GPU available: True (cuda), used: True
[36m(_train_tune pid=15539)[0m TPU available: False, using: 0 TPU cores
[36m(_train_tune pid=15539)[0m HPU available: False, using: 0 HPUs
[36m(_train_tune pid=15539)[0m You are using a CUDA device ('NVIDIA A100-SXM4-40GB') that has Tensor Cores. To properly utilize them, you should set `torch.set_float32_matmul_precision('medium' | 'high')` which will trade-off precision for performance. For more details, read https://pytorch.org/docs/stable/generated/torch.set_float32_matmul_precision.html#torch.set_float32_matmul_precision
[36m(_train_tune pid=15539)[0m 2024-11-12 18:57:06.389371: I t

Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Epoch 0:   0%|          | 0/13 [00:00<?, ?it/s] 
Epoch 1:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.24, train_loss_epoch=-1.26]
Epoch 2:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.85, train_loss_epoch=-1.33]
Epoch 3:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.83, train_loss_epoch=-1.35]
Epoch 4:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.28, train_loss_epoch=-1.35]
Epoch 5:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.81, train_loss_epoch=-1.40]
Epoch 6:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.24, train_loss_epoch=-1.38]
Epoch 7:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.08, train_loss_epoch=-1.38]
[36m(_train_tune pid=15539)[0m 
Validation: |          | 0/? [00:00<?, ?it/s][A
Validation:   0%|          | 0/13 [00:00<?, ?it/s][A
Validation DataLoa

2024-11-12 18:57:44,917	INFO tensorboardx.py:308 -- Removed the following hyperparameter values when logging to tensorboard: {'hist_exog_list': ('MA(2,9)', 'MA(3,9)', 'MA(1,12)', 'MA(2,12)', 'MA(3,12)', 'MOM(9)', 'MOM(12)', 'RSI(7)', 'RSI(14)', 'EMA(3,9)', 'EMA(5,9)', 'EMA(5,12)', 'DY', 'PTBV', 'P', 'PO', 'VO', 'PE'), 'loss': ('__ref_ph', 'de895953'), 'n_freq_downsample': (180, 60, 1), 'n_pool_kernel_size': (8, 4, 1), 'valid_loss': ('__ref_ph', '004b9a7a')}
[36m(_train_tune pid=15539)[0m `Trainer.fit` stopped: `max_steps=700.0` reached.


[36m(_train_tune pid=15539)[0m 
[36m(_train_tune pid=15539)[0m Validation DataLoader 0: 100%|██████████| 13/13 [00:02<00:00,  6.40it/s][A
[36m(_train_tune pid=15539)[0m                                                                         [AEpoch 53:   0%|          | 0/13 [00:02<?, ?it/s, v_num=0, train_loss_step=-1.73, train_loss_epoch=-1.70, valid_loss=-1.70]Epoch 53:   0%|          | 0/13 [00:02<?, ?it/s, v_num=0, train_loss_step=-1.73, train_loss_epoch=-1.69, valid_loss=-1.70]Epoch 53:   0%|          | 0/13 [00:02<?, ?it/s, v_num=0, train_loss_step=-1.73, train_loss_epoch=-1.69, valid_loss=-1.70]


[36m(_train_tune pid=15796)[0m /usr/local/lib/python3.10/dist-packages/ray/tune/integration/pytorch_lightning.py:198: `ray.tune.integration.pytorch_lightning.TuneReportCallback` is deprecated. Use `ray.tune.integration.pytorch_lightning.TuneReportCheckpointCallback` instead.
[36m(_train_tune pid=15796)[0m Seed set to 42
[36m(_train_tune pid=15796)[0m GPU available: True (cuda), used: True
[36m(_train_tune pid=15796)[0m TPU available: False, using: 0 TPU cores
[36m(_train_tune pid=15796)[0m HPU available: False, using: 0 HPUs
[36m(_train_tune pid=15796)[0m You are using a CUDA device ('NVIDIA A100-SXM4-40GB') that has Tensor Cores. To properly utilize them, you should set `torch.set_float32_matmul_precision('medium' | 'high')` which will trade-off precision for performance. For more details, read https://pytorch.org/docs/stable/generated/torch.set_float32_matmul_precision.html#torch.set_float32_matmul_precision
[36m(_train_tune pid=15796)[0m 2024-11-12 18:57:53.346085: I t

Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Epoch 0:   0%|          | 0/13 [00:00<?, ?it/s] 
Epoch 1:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.26, train_loss_epoch=-1.19]
Epoch 2:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.98, train_loss_epoch=-1.47]
Epoch 3:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.89, train_loss_epoch=-1.54]
Epoch 4:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.47, train_loss_epoch=-1.56]
Epoch 5:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.03, train_loss_epoch=-1.60]
Epoch 6:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.46, train_loss_epoch=-1.64]
Epoch 7:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.48, train_loss_epoch=-1.65]
[36m(_train_tune pid=15796)[0m 
Validation: |          | 0/? [00:00<?, ?it/s][A
Validation:   0%|          | 0/13 [00:00<?, ?it/s][A
Validation DataLoa

[36m(_train_tune pid=15796)[0m `Trainer.fit` stopped: `max_steps=600.0` reached.
2024-11-12 18:58:26,590	INFO tensorboardx.py:308 -- Removed the following hyperparameter values when logging to tensorboard: {'hist_exog_list': ('MA(2,9)', 'MA(3,9)', 'MA(1,12)', 'MA(2,12)', 'MA(3,12)', 'MOM(9)', 'MOM(12)', 'RSI(7)', 'RSI(14)', 'EMA(3,9)', 'EMA(5,9)', 'EMA(5,12)', 'DY', 'PTBV', 'P', 'PO', 'VO', 'PE'), 'loss': ('__ref_ph', 'de895953'), 'n_freq_downsample': (40, 20, 1), 'n_pool_kernel_size': (1, 1, 1), 'valid_loss': ('__ref_ph', '004b9a7a')}


[36m(_train_tune pid=15796)[0m 
[36m(_train_tune pid=15796)[0m Validation DataLoader 0: 100%|██████████| 13/13 [00:02<00:00,  6.38it/s][A
[36m(_train_tune pid=15796)[0m                                                                         [AEpoch 46:   0%|          | 0/13 [00:02<?, ?it/s, v_num=0, train_loss_step=-1.89, train_loss_epoch=-1.91, valid_loss=-1.85]Epoch 46:   0%|          | 0/13 [00:02<?, ?it/s, v_num=0, train_loss_step=-1.89, train_loss_epoch=-1.84, valid_loss=-1.85]Epoch 46:   0%|          | 0/13 [00:02<?, ?it/s, v_num=0, train_loss_step=-1.89, train_loss_epoch=-1.84, valid_loss=-1.85]


[36m(_train_tune pid=16026)[0m /usr/local/lib/python3.10/dist-packages/ray/tune/integration/pytorch_lightning.py:198: `ray.tune.integration.pytorch_lightning.TuneReportCallback` is deprecated. Use `ray.tune.integration.pytorch_lightning.TuneReportCheckpointCallback` instead.
[36m(_train_tune pid=16026)[0m Seed set to 42
[36m(_train_tune pid=16026)[0m GPU available: True (cuda), used: True
[36m(_train_tune pid=16026)[0m TPU available: False, using: 0 TPU cores
[36m(_train_tune pid=16026)[0m HPU available: False, using: 0 HPUs
[36m(_train_tune pid=16026)[0m You are using a CUDA device ('NVIDIA A100-SXM4-40GB') that has Tensor Cores. To properly utilize them, you should set `torch.set_float32_matmul_precision('medium' | 'high')` which will trade-off precision for performance. For more details, read https://pytorch.org/docs/stable/generated/torch.set_float32_matmul_precision.html#torch.set_float32_matmul_precision
[36m(_train_tune pid=16026)[0m 2024-11-12 18:58:34.316626: I t

Sanity Checking: |          | 0/? [00:00<?, ?it/s]
Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Epoch 0:   0%|          | 0/13 [00:00<?, ?it/s] 
Epoch 1:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.22, train_loss_epoch=-1.45]
Epoch 2:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.86, train_loss_epoch=-1.57]
Epoch 3:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.94, train_loss_epoch=-1.48]
Epoch 4:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.33, train_loss_epoch=-1.55]
Epoch 5:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.86, train_loss_epoch=-1.60]
Epoch 6:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.55, train_loss_epoch=-1.62]
Epoch 7:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.83, train_loss_epoch=-1.65]
[36m(_train_tune pid=16026)[0m 
Validation: |          | 0/? [00:00<?, ?it/s][A
Validation:   0%|    

[36m(_train_tune pid=16026)[0m `Trainer.fit` stopped: `max_steps=1400.0` reached.
2024-11-12 18:59:43,885	INFO tensorboardx.py:308 -- Removed the following hyperparameter values when logging to tensorboard: {'hist_exog_list': ('MA(2,9)', 'MA(3,9)', 'MA(1,12)', 'MA(2,12)', 'MA(3,12)', 'MOM(9)', 'MOM(12)', 'RSI(7)', 'RSI(14)', 'EMA(3,9)', 'EMA(5,9)', 'EMA(5,12)', 'DY', 'PTBV', 'P', 'PO', 'VO', 'PE'), 'loss': ('__ref_ph', 'de895953'), 'n_freq_downsample': (60, 8, 1), 'n_pool_kernel_size': (2, 2, 1), 'valid_loss': ('__ref_ph', '004b9a7a')}


[36m(_train_tune pid=16026)[0m 
[36m(_train_tune pid=16026)[0m Validation DataLoader 0: 100%|██████████| 13/13 [00:01<00:00,  6.96it/s][A
[36m(_train_tune pid=16026)[0m                                                                         [AEpoch 107:   0%|          | 0/13 [00:02<?, ?it/s, v_num=0, train_loss_step=-1.74, train_loss_epoch=-1.88, valid_loss=-1.91]Epoch 107:   0%|          | 0/13 [00:02<?, ?it/s, v_num=0, train_loss_step=-1.74, train_loss_epoch=-1.91, valid_loss=-1.91]Epoch 107:   0%|          | 0/13 [00:02<?, ?it/s, v_num=0, train_loss_step=-1.74, train_loss_epoch=-1.91, valid_loss=-1.91]


[36m(_train_tune pid=16408)[0m /usr/local/lib/python3.10/dist-packages/ray/tune/integration/pytorch_lightning.py:198: `ray.tune.integration.pytorch_lightning.TuneReportCallback` is deprecated. Use `ray.tune.integration.pytorch_lightning.TuneReportCheckpointCallback` instead.
[36m(_train_tune pid=16408)[0m Seed set to 42
[36m(_train_tune pid=16408)[0m GPU available: True (cuda), used: True
[36m(_train_tune pid=16408)[0m TPU available: False, using: 0 TPU cores
[36m(_train_tune pid=16408)[0m HPU available: False, using: 0 HPUs
[36m(_train_tune pid=16408)[0m You are using a CUDA device ('NVIDIA A100-SXM4-40GB') that has Tensor Cores. To properly utilize them, you should set `torch.set_float32_matmul_precision('medium' | 'high')` which will trade-off precision for performance. For more details, read https://pytorch.org/docs/stable/generated/torch.set_float32_matmul_precision.html#torch.set_float32_matmul_precision
[36m(_train_tune pid=16408)[0m 2024-11-12 18:59:52.352041: I t

Sanity Checking: |          | 0/? [00:00<?, ?it/s]
Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]


2024-11-12 18:59:56,366	ERROR tune_controller.py:1331 -- Trial task failed for trial _train_tune_e2f48f06
Traceback (most recent call last):
  File "/usr/local/lib/python3.10/dist-packages/ray/air/execution/_internal/event_manager.py", line 110, in resolve_future
    result = ray.get(future)
  File "/usr/local/lib/python3.10/dist-packages/ray/_private/auto_init_hook.py", line 21, in auto_init_wrapper
    return fn(*args, **kwargs)
  File "/usr/local/lib/python3.10/dist-packages/ray/_private/client_mode_hook.py", line 103, in wrapper
    return func(*args, **kwargs)
  File "/usr/local/lib/python3.10/dist-packages/ray/_private/worker.py", line 2745, in get
    values, debugger_breakpoint = worker.get_objects(object_refs, timeout=timeout)
  File "/usr/local/lib/python3.10/dist-packages/ray/_private/worker.py", line 901, in get_objects
    raise value.as_instanceof_cause()
ray.exceptions.RayTaskError(OutOfMemoryError): [36mray::ImplicitFunc.train()[39m (pid=16408, ip=172.28.0.12, actor_i


Trial _train_tune_e2f48f06 errored after 0 iterations at 2024-11-12 18:59:56. Total running time: 5min 17s
Error file: /tmp/ray/session_2024-11-12_18-17-38_352630_2326/artifacts/2024-11-12_18-54-39/_train_tune_2024-11-12_18-54-39/driver_artifacts/_train_tune_e2f48f06_6_batch_size=256,h=20,hist_exog_list=MA_2_9_MA_3_9_MA_1_12_MA_2_12_MA_3_12_MOM_9_MOM_12_RSI_7_RSI_14_EMA_3_9__2024-11-12_18-58-33/error.txt


[36m(_train_tune pid=16516)[0m /usr/local/lib/python3.10/dist-packages/ray/tune/integration/pytorch_lightning.py:198: `ray.tune.integration.pytorch_lightning.TuneReportCallback` is deprecated. Use `ray.tune.integration.pytorch_lightning.TuneReportCheckpointCallback` instead.
[36m(_train_tune pid=16516)[0m Seed set to 42
[36m(_train_tune pid=16516)[0m GPU available: True (cuda), used: True
[36m(_train_tune pid=16516)[0m TPU available: False, using: 0 TPU cores
[36m(_train_tune pid=16516)[0m HPU available: False, using: 0 HPUs
[36m(_train_tune pid=16516)[0m You are using a CUDA device ('NVIDIA A100-SXM4-40GB') that has Tensor Cores. To properly utilize them, you should set `torch.set_float32_matmul_precision('medium' | 'high')` which will trade-off precision for performance. For more details, read https://pytorch.org/docs/stable/generated/torch.set_float32_matmul_precision.html#torch.set_float32_matmul_precision
[36m(_train_tune pid=16516)[0m 2024-11-12 19:00:04.286119: I t

Sanity Checking: |          | 0/? [00:00<?, ?it/s]
Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Epoch 0:   0%|          | 0/4 [00:00<?, ?it/s] 
Epoch 1:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=9.570, train_loss_epoch=26.90]
Epoch 2:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=9.800, train_loss_epoch=10.10]
Epoch 3:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=10.70, train_loss_epoch=10.70]
Epoch 4:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=10.00, train_loss_epoch=10.60]
Epoch 5:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=10.10, train_loss_epoch=10.30]
Epoch 6:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=9.730, train_loss_epoch=9.770]
Epoch 7:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=9.220, train_loss_epoch=9.420]
Epoch 8:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=9.900, train_loss_epoch=9.840]
Epoch 9: 

2024-11-12 19:00:49,666	INFO tensorboardx.py:308 -- Removed the following hyperparameter values when logging to tensorboard: {'hist_exog_list': ('MA(2,9)', 'MA(3,9)', 'MA(1,12)', 'MA(2,12)', 'MA(3,12)', 'MOM(9)', 'MOM(12)', 'RSI(7)', 'RSI(14)', 'EMA(3,9)', 'EMA(5,9)', 'EMA(5,12)', 'DY', 'PTBV', 'P', 'PO', 'VO', 'PE'), 'loss': ('__ref_ph', 'de895953'), 'n_freq_downsample': (168, 24, 1), 'n_pool_kernel_size': (4, 4, 4), 'valid_loss': ('__ref_ph', '004b9a7a')}
[36m(_train_tune pid=16516)[0m `Trainer.fit` stopped: `max_steps=600.0` reached.


[36m(_train_tune pid=16516)[0m 
[36m(_train_tune pid=16516)[0m Validation DataLoader 0: 100%|██████████| 4/4 [00:00<00:00, 16.19it/s][A
[36m(_train_tune pid=16516)[0m                                                                       [AEpoch 149: 100%|██████████| 4/4 [00:00<00:00,  6.84it/s, v_num=0, train_loss_step=7.460, train_loss_epoch=7.760, valid_loss=7.200]Epoch 149: 100%|██████████| 4/4 [00:00<00:00,  6.83it/s, v_num=0, train_loss_step=7.460, train_loss_epoch=7.480, valid_loss=7.200]Epoch 149: 100%|██████████| 4/4 [00:00<00:00,  6.81it/s, v_num=0, train_loss_step=7.460, train_loss_epoch=7.480, valid_loss=7.200]


[36m(_train_tune pid=16797)[0m /usr/local/lib/python3.10/dist-packages/ray/tune/integration/pytorch_lightning.py:198: `ray.tune.integration.pytorch_lightning.TuneReportCallback` is deprecated. Use `ray.tune.integration.pytorch_lightning.TuneReportCheckpointCallback` instead.
[36m(_train_tune pid=16797)[0m Seed set to 42
[36m(_train_tune pid=16797)[0m GPU available: True (cuda), used: True
[36m(_train_tune pid=16797)[0m TPU available: False, using: 0 TPU cores
[36m(_train_tune pid=16797)[0m HPU available: False, using: 0 HPUs
[36m(_train_tune pid=16797)[0m You are using a CUDA device ('NVIDIA A100-SXM4-40GB') that has Tensor Cores. To properly utilize them, you should set `torch.set_float32_matmul_precision('medium' | 'high')` which will trade-off precision for performance. For more details, read https://pytorch.org/docs/stable/generated/torch.set_float32_matmul_precision.html#torch.set_float32_matmul_precision
[36m(_train_tune pid=16797)[0m 2024-11-12 19:00:57.276937: I t

Sanity Checking: |          | 0/? [00:00<?, ?it/s]
Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Epoch 0:   0%|          | 0/4 [00:00<?, ?it/s] 
Epoch 1:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=-0.0677, train_loss_epoch=-0.0514]
Epoch 2:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.31, train_loss_epoch=-0.543]
Epoch 3:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=-0.811, train_loss_epoch=-0.522]
Epoch 4:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=-0.227, train_loss_epoch=-0.401]
Epoch 5:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.18, train_loss_epoch=-0.802]
Epoch 6:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=-0.443, train_loss_epoch=-0.577]
Epoch 7:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=-0.592, train_loss_epoch=-0.732]
Epoch 8:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=-0.426, train_loss_epoch=-

2024-11-12 19:02:46,415	INFO tensorboardx.py:308 -- Removed the following hyperparameter values when logging to tensorboard: {'hist_exog_list': ('MA(2,9)', 'MA(3,9)', 'MA(1,12)', 'MA(2,12)', 'MA(3,12)', 'MOM(9)', 'MOM(12)', 'RSI(7)', 'RSI(14)', 'EMA(3,9)', 'EMA(5,9)', 'EMA(5,12)', 'DY', 'PTBV', 'P', 'PO', 'VO', 'PE'), 'loss': ('__ref_ph', 'de895953'), 'n_freq_downsample': (1, 1, 1), 'n_pool_kernel_size': (16, 8, 1), 'valid_loss': ('__ref_ph', '004b9a7a')}
[36m(_train_tune pid=16797)[0m `Trainer.fit` stopped: `max_steps=1000.0` reached.


[36m(_train_tune pid=16797)[0m 
[36m(_train_tune pid=16797)[0m Validation DataLoader 0: 100%|██████████| 4/4 [00:02<00:00,  1.73it/s][A
[36m(_train_tune pid=16797)[0m                                                                       [AEpoch 249: 100%|██████████| 4/4 [00:02<00:00,  1.48it/s, v_num=0, train_loss_step=-1.96, train_loss_epoch=-1.81, valid_loss=-1.65]Epoch 249: 100%|██████████| 4/4 [00:02<00:00,  1.48it/s, v_num=0, train_loss_step=-1.96, train_loss_epoch=-1.74, valid_loss=-1.65]Epoch 249: 100%|██████████| 4/4 [00:02<00:00,  1.48it/s, v_num=0, train_loss_step=-1.96, train_loss_epoch=-1.74, valid_loss=-1.65]


[36m(_train_tune pid=17345)[0m /usr/local/lib/python3.10/dist-packages/ray/tune/integration/pytorch_lightning.py:198: `ray.tune.integration.pytorch_lightning.TuneReportCallback` is deprecated. Use `ray.tune.integration.pytorch_lightning.TuneReportCheckpointCallback` instead.
[36m(_train_tune pid=17345)[0m Seed set to 42
[36m(_train_tune pid=17345)[0m GPU available: True (cuda), used: True
[36m(_train_tune pid=17345)[0m TPU available: False, using: 0 TPU cores
[36m(_train_tune pid=17345)[0m HPU available: False, using: 0 HPUs
[36m(_train_tune pid=17345)[0m You are using a CUDA device ('NVIDIA A100-SXM4-40GB') that has Tensor Cores. To properly utilize them, you should set `torch.set_float32_matmul_precision('medium' | 'high')` which will trade-off precision for performance. For more details, read https://pytorch.org/docs/stable/generated/torch.set_float32_matmul_precision.html#torch.set_float32_matmul_precision
[36m(_train_tune pid=17345)[0m 2024-11-12 19:02:54.445855: I t

Sanity Checking: |          | 0/? [00:00<?, ?it/s]
Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Epoch 0:   0%|          | 0/4 [00:00<?, ?it/s] 
Epoch 1:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=-0.825, train_loss_epoch=-0.755]
Epoch 2:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.29, train_loss_epoch=-0.939]
Epoch 3:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.52, train_loss_epoch=-1.12]
Epoch 4:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.16, train_loss_epoch=-1.22]
Epoch 5:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.70, train_loss_epoch=-1.35]
Epoch 6:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.11, train_loss_epoch=-1.21]
Epoch 7:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.12, train_loss_epoch=-1.24]
Epoch 7: 100%|██████████| 4/4 [00:00<00:00, 10.94it/s, v_num=0, train_loss_step=-1.13, train_loss_epoch=-1.24

2024-11-12 19:05:29,397	INFO tensorboardx.py:308 -- Removed the following hyperparameter values when logging to tensorboard: {'hist_exog_list': ('MA(2,9)', 'MA(3,9)', 'MA(1,12)', 'MA(2,12)', 'MA(3,12)', 'MOM(9)', 'MOM(12)', 'RSI(7)', 'RSI(14)', 'EMA(3,9)', 'EMA(5,9)', 'EMA(5,12)', 'DY', 'PTBV', 'P', 'PO', 'VO', 'PE'), 'loss': ('__ref_ph', 'de895953'), 'n_freq_downsample': (24, 12, 1), 'n_pool_kernel_size': (4, 4, 4), 'valid_loss': ('__ref_ph', '004b9a7a')}
[36m(_train_tune pid=17345)[0m `Trainer.fit` stopped: `max_steps=1300.0` reached.


[36m(_train_tune pid=17345)[0m 
[36m(_train_tune pid=17345)[0m Validation DataLoader 0: 100%|██████████| 4/4 [00:02<00:00,  1.85it/s][A
[36m(_train_tune pid=17345)[0m                                                                       [AEpoch 324: 100%|██████████| 4/4 [00:02<00:00,  1.51it/s, v_num=0, train_loss_step=-2.32, train_loss_epoch=-1.97, valid_loss=-1.92]Epoch 324: 100%|██████████| 4/4 [00:02<00:00,  1.51it/s, v_num=0, train_loss_step=-2.32, train_loss_epoch=-2.03, valid_loss=-1.92]Epoch 324: 100%|██████████| 4/4 [00:02<00:00,  1.51it/s, v_num=0, train_loss_step=-2.32, train_loss_epoch=-2.03, valid_loss=-1.92]


[36m(_train_tune pid=18081)[0m /usr/local/lib/python3.10/dist-packages/ray/tune/integration/pytorch_lightning.py:198: `ray.tune.integration.pytorch_lightning.TuneReportCallback` is deprecated. Use `ray.tune.integration.pytorch_lightning.TuneReportCheckpointCallback` instead.
[36m(_train_tune pid=18081)[0m Seed set to 42
[36m(_train_tune pid=18081)[0m GPU available: True (cuda), used: True
[36m(_train_tune pid=18081)[0m TPU available: False, using: 0 TPU cores
[36m(_train_tune pid=18081)[0m HPU available: False, using: 0 HPUs
[36m(_train_tune pid=18081)[0m You are using a CUDA device ('NVIDIA A100-SXM4-40GB') that has Tensor Cores. To properly utilize them, you should set `torch.set_float32_matmul_precision('medium' | 'high')` which will trade-off precision for performance. For more details, read https://pytorch.org/docs/stable/generated/torch.set_float32_matmul_precision.html#torch.set_float32_matmul_precision
[36m(_train_tune pid=18081)[0m 2024-11-12 19:05:37.391545: I t

Sanity Checking: |          | 0/? [00:00<?, ?it/s]
Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Epoch 0:   0%|          | 0/13 [00:00<?, ?it/s] 
Epoch 1:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=16.40, train_loss_epoch=14.70]
Epoch 2:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=7.56e+5, train_loss_epoch=5.82e+4]
Epoch 3:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=17.30, train_loss_epoch=21.10]
Epoch 4:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=11.50, train_loss_epoch=13.50]
Epoch 5:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=11.10, train_loss_epoch=11.70]
Epoch 6:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=12.20, train_loss_epoch=28.10]
Epoch 7:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=11.20, train_loss_epoch=12.50]
[36m(_train_tune pid=18081)[0m 
Validation: |          | 0/? [00:00<?, ?it/s][A
Validation:   0%|

2024-11-12 19:06:42,345	INFO tensorboardx.py:308 -- Removed the following hyperparameter values when logging to tensorboard: {'hist_exog_list': ('MA(2,9)', 'MA(3,9)', 'MA(1,12)', 'MA(2,12)', 'MA(3,12)', 'MOM(9)', 'MOM(12)', 'RSI(7)', 'RSI(14)', 'EMA(3,9)', 'EMA(5,9)', 'EMA(5,12)', 'DY', 'PTBV', 'P', 'PO', 'VO', 'PE'), 'loss': ('__ref_ph', 'de895953'), 'n_freq_downsample': (40, 20, 1), 'n_pool_kernel_size': (2, 2, 2), 'valid_loss': ('__ref_ph', '004b9a7a')}
[36m(_train_tune pid=18081)[0m `Trainer.fit` stopped: `max_steps=1400.0` reached.


[36m(_train_tune pid=18081)[0m 
[36m(_train_tune pid=18081)[0m Validation DataLoader 0: 100%|██████████| 13/13 [00:01<00:00,  7.35it/s][A
[36m(_train_tune pid=18081)[0m                                                                         [AEpoch 107:   0%|          | 0/13 [00:02<?, ?it/s, v_num=0, train_loss_step=-1.14, train_loss_epoch=-1.11, valid_loss=-0.904] Epoch 107:   0%|          | 0/13 [00:02<?, ?it/s, v_num=0, train_loss_step=-1.14, train_loss_epoch=-1.16, valid_loss=-0.904]Epoch 107:   0%|          | 0/13 [00:02<?, ?it/s, v_num=0, train_loss_step=-1.14, train_loss_epoch=-1.16, valid_loss=-0.904]


[36m(_train_tune pid=18446)[0m /usr/local/lib/python3.10/dist-packages/ray/tune/integration/pytorch_lightning.py:198: `ray.tune.integration.pytorch_lightning.TuneReportCallback` is deprecated. Use `ray.tune.integration.pytorch_lightning.TuneReportCheckpointCallback` instead.
[36m(_train_tune pid=18446)[0m Seed set to 42
[36m(_train_tune pid=18446)[0m GPU available: True (cuda), used: True
[36m(_train_tune pid=18446)[0m TPU available: False, using: 0 TPU cores
[36m(_train_tune pid=18446)[0m HPU available: False, using: 0 HPUs
[36m(_train_tune pid=18446)[0m You are using a CUDA device ('NVIDIA A100-SXM4-40GB') that has Tensor Cores. To properly utilize them, you should set `torch.set_float32_matmul_precision('medium' | 'high')` which will trade-off precision for performance. For more details, read https://pytorch.org/docs/stable/generated/torch.set_float32_matmul_precision.html#torch.set_float32_matmul_precision
[36m(_train_tune pid=18446)[0m 2024-11-12 19:06:50.500631: I t

Sanity Checking: |          | 0/? [00:00<?, ?it/s]
Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Epoch 0:   0%|          | 0/7 [00:00<?, ?it/s] 
Epoch 1:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.52, train_loss_epoch=-1.43]
Epoch 2:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.21, train_loss_epoch=-1.62]
Epoch 3:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.02, train_loss_epoch=-1.65]
Epoch 4:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.55, train_loss_epoch=-1.74]
Epoch 5:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.07, train_loss_epoch=-1.80]
Epoch 6:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.67, train_loss_epoch=-1.73]
Epoch 7:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.78, train_loss_epoch=-1.77]
Epoch 8:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.53, train_loss_epoch=-1.78]
Epoch 9: 

2024-11-12 19:07:32,939	INFO tensorboardx.py:308 -- Removed the following hyperparameter values when logging to tensorboard: {'hist_exog_list': ('MA(2,9)', 'MA(3,9)', 'MA(1,12)', 'MA(2,12)', 'MA(3,12)', 'MOM(9)', 'MOM(12)', 'RSI(7)', 'RSI(14)', 'EMA(3,9)', 'EMA(5,9)', 'EMA(5,12)', 'DY', 'PTBV', 'P', 'PO', 'VO', 'PE'), 'loss': ('__ref_ph', 'de895953'), 'n_freq_downsample': (40, 20, 1), 'n_pool_kernel_size': (2, 2, 1), 'valid_loss': ('__ref_ph', '004b9a7a')}
[36m(_train_tune pid=18446)[0m `Trainer.fit` stopped: `max_steps=1100.0` reached.


[36m(_train_tune pid=18446)[0m 
[36m(_train_tune pid=18446)[0m Validation DataLoader 0: 100%|██████████| 7/7 [00:00<00:00, 29.97it/s][A
[36m(_train_tune pid=18446)[0m                                                                       [AEpoch 157:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.15, train_loss_epoch=-2.17, valid_loss=-1.92]Epoch 157:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.15, train_loss_epoch=-2.15, valid_loss=-1.92]Epoch 157:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.15, train_loss_epoch=-2.15, valid_loss=-1.92]


[36m(_train_tune pid=18717)[0m /usr/local/lib/python3.10/dist-packages/ray/tune/integration/pytorch_lightning.py:198: `ray.tune.integration.pytorch_lightning.TuneReportCallback` is deprecated. Use `ray.tune.integration.pytorch_lightning.TuneReportCheckpointCallback` instead.
[36m(_train_tune pid=18717)[0m Seed set to 42
[36m(_train_tune pid=18717)[0m GPU available: True (cuda), used: True
[36m(_train_tune pid=18717)[0m TPU available: False, using: 0 TPU cores
[36m(_train_tune pid=18717)[0m HPU available: False, using: 0 HPUs
[36m(_train_tune pid=18717)[0m You are using a CUDA device ('NVIDIA A100-SXM4-40GB') that has Tensor Cores. To properly utilize them, you should set `torch.set_float32_matmul_precision('medium' | 'high')` which will trade-off precision for performance. For more details, read https://pytorch.org/docs/stable/generated/torch.set_float32_matmul_precision.html#torch.set_float32_matmul_precision
[36m(_train_tune pid=18717)[0m 2024-11-12 19:07:41.421996: I t

Sanity Checking: |          | 0/? [00:00<?, ?it/s]
Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Epoch 0:   0%|          | 0/7 [00:00<?, ?it/s] 
Epoch 1:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=7.410, train_loss_epoch=17.60]
Epoch 2:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=5.370, train_loss_epoch=6.810]
Epoch 3:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=5.910, train_loss_epoch=6.110]
Epoch 4:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=4.730, train_loss_epoch=5.580]
Epoch 5:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=5.660, train_loss_epoch=5.700]
Epoch 6:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=5.960, train_loss_epoch=5.750]
Epoch 7:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=3.820, train_loss_epoch=5.300]
Epoch 8:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=4.800, train_loss_epoch=5.330]
Epoch 9: 

2024-11-12 19:09:03,597	INFO tensorboardx.py:308 -- Removed the following hyperparameter values when logging to tensorboard: {'hist_exog_list': ('MA(2,9)', 'MA(3,9)', 'MA(1,12)', 'MA(2,12)', 'MA(3,12)', 'MOM(9)', 'MOM(12)', 'RSI(7)', 'RSI(14)', 'EMA(3,9)', 'EMA(5,9)', 'EMA(5,12)', 'DY', 'PTBV', 'P', 'PO', 'VO', 'PE'), 'loss': ('__ref_ph', 'de895953'), 'n_freq_downsample': (1, 1, 1), 'n_pool_kernel_size': (1, 1, 1), 'valid_loss': ('__ref_ph', '004b9a7a')}
[36m(_train_tune pid=18717)[0m `Trainer.fit` stopped: `max_steps=1300.0` reached.


[36m(_train_tune pid=18717)[0m 
[36m(_train_tune pid=18717)[0m Validation DataLoader 0: 100%|██████████| 7/7 [00:02<00:00,  3.30it/s][A
[36m(_train_tune pid=18717)[0m                                                                       [AEpoch 185:   0%|          | 0/7 [00:02<?, ?it/s, v_num=0, train_loss_step=2.590, train_loss_epoch=2.520, valid_loss=2.490]Epoch 185:   0%|          | 0/7 [00:02<?, ?it/s, v_num=0, train_loss_step=2.590, train_loss_epoch=2.660, valid_loss=2.490]Epoch 185:   0%|          | 0/7 [00:02<?, ?it/s, v_num=0, train_loss_step=2.590, train_loss_epoch=2.660, valid_loss=2.490]


[36m(_train_tune pid=19156)[0m /usr/local/lib/python3.10/dist-packages/ray/tune/integration/pytorch_lightning.py:198: `ray.tune.integration.pytorch_lightning.TuneReportCallback` is deprecated. Use `ray.tune.integration.pytorch_lightning.TuneReportCheckpointCallback` instead.
[36m(_train_tune pid=19156)[0m Seed set to 42
[36m(_train_tune pid=19156)[0m GPU available: True (cuda), used: True
[36m(_train_tune pid=19156)[0m TPU available: False, using: 0 TPU cores
[36m(_train_tune pid=19156)[0m HPU available: False, using: 0 HPUs
[36m(_train_tune pid=19156)[0m You are using a CUDA device ('NVIDIA A100-SXM4-40GB') that has Tensor Cores. To properly utilize them, you should set `torch.set_float32_matmul_precision('medium' | 'high')` which will trade-off precision for performance. For more details, read https://pytorch.org/docs/stable/generated/torch.set_float32_matmul_precision.html#torch.set_float32_matmul_precision
[36m(_train_tune pid=19156)[0m 2024-11-12 19:09:11.545461: I t

Sanity Checking: |          | 0/? [00:00<?, ?it/s]
Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Epoch 0:   0%|          | 0/2 [00:00<?, ?it/s] 
Epoch 1:   0%|          | 0/2 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.45, train_loss_epoch=-1.52]
Epoch 2:   0%|          | 0/2 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.38, train_loss_epoch=-1.40]
Epoch 3:   0%|          | 0/2 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.53, train_loss_epoch=-1.47]
Epoch 4:   0%|          | 0/2 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.48, train_loss_epoch=-1.51]
Epoch 5:   0%|          | 0/2 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.41, train_loss_epoch=-1.46]
Epoch 6:   0%|          | 0/2 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.45, train_loss_epoch=-1.46]
Epoch 7:   0%|          | 0/2 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.60, train_loss_epoch=-1.53]
Epoch 8:   0%|          | 0/2 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.56, train_loss_epoch=-1.56]
Epoch 9: 

2024-11-12 19:10:40,519	INFO tensorboardx.py:308 -- Removed the following hyperparameter values when logging to tensorboard: {'hist_exog_list': ('MA(2,9)', 'MA(3,9)', 'MA(1,12)', 'MA(2,12)', 'MA(3,12)', 'MOM(9)', 'MOM(12)', 'RSI(7)', 'RSI(14)', 'EMA(3,9)', 'EMA(5,9)', 'EMA(5,12)', 'DY', 'PTBV', 'P', 'PO', 'VO', 'PE'), 'loss': ('__ref_ph', 'de895953'), 'n_freq_downsample': (180, 60, 1), 'n_pool_kernel_size': (4, 4, 4), 'valid_loss': ('__ref_ph', '004b9a7a')}


[36m(_train_tune pid=19156)[0m 
[36m(_train_tune pid=19156)[0m Validation:   0%|          | 0/2 [00:00<?, ?it/s][A
[36m(_train_tune pid=19156)[0m Validation DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s][A


[36m(_train_tune pid=19156)[0m `Trainer.fit` stopped: `max_steps=600.0` reached.


[36m(_train_tune pid=19156)[0m 
[36m(_train_tune pid=19156)[0m Validation DataLoader 0: 100%|██████████| 2/2 [00:00<00:00, 10.84it/s][A
[36m(_train_tune pid=19156)[0m                                                                       [AEpoch 299: 100%|██████████| 2/2 [00:00<00:00,  3.33it/s, v_num=0, train_loss_step=-1.95, train_loss_epoch=-2.03, valid_loss=-1.86]Epoch 299: 100%|██████████| 2/2 [00:00<00:00,  3.31it/s, v_num=0, train_loss_step=-1.95, train_loss_epoch=-1.98, valid_loss=-1.86]Epoch 299: 100%|██████████| 2/2 [00:00<00:00,  3.31it/s, v_num=0, train_loss_step=-1.95, train_loss_epoch=-1.98, valid_loss=-1.86]


[36m(_train_tune pid=19619)[0m /usr/local/lib/python3.10/dist-packages/ray/tune/integration/pytorch_lightning.py:198: `ray.tune.integration.pytorch_lightning.TuneReportCallback` is deprecated. Use `ray.tune.integration.pytorch_lightning.TuneReportCheckpointCallback` instead.
[36m(_train_tune pid=19619)[0m Seed set to 42
[36m(_train_tune pid=19619)[0m GPU available: True (cuda), used: True
[36m(_train_tune pid=19619)[0m TPU available: False, using: 0 TPU cores
[36m(_train_tune pid=19619)[0m HPU available: False, using: 0 HPUs
[36m(_train_tune pid=19619)[0m You are using a CUDA device ('NVIDIA A100-SXM4-40GB') that has Tensor Cores. To properly utilize them, you should set `torch.set_float32_matmul_precision('medium' | 'high')` which will trade-off precision for performance. For more details, read https://pytorch.org/docs/stable/generated/torch.set_float32_matmul_precision.html#torch.set_float32_matmul_precision
[36m(_train_tune pid=19619)[0m 2024-11-12 19:10:48.469062: I t

Sanity Checking: |          | 0/? [00:00<?, ?it/s]
Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]


2024-11-12 19:10:51,903	ERROR tune_controller.py:1331 -- Trial task failed for trial _train_tune_65a60f7c
Traceback (most recent call last):
  File "/usr/local/lib/python3.10/dist-packages/ray/air/execution/_internal/event_manager.py", line 110, in resolve_future
    result = ray.get(future)
  File "/usr/local/lib/python3.10/dist-packages/ray/_private/auto_init_hook.py", line 21, in auto_init_wrapper
    return fn(*args, **kwargs)
  File "/usr/local/lib/python3.10/dist-packages/ray/_private/client_mode_hook.py", line 103, in wrapper
    return func(*args, **kwargs)
  File "/usr/local/lib/python3.10/dist-packages/ray/_private/worker.py", line 2745, in get
    values, debugger_breakpoint = worker.get_objects(object_refs, timeout=timeout)
  File "/usr/local/lib/python3.10/dist-packages/ray/_private/worker.py", line 901, in get_objects
    raise value.as_instanceof_cause()
ray.exceptions.RayTaskError(OutOfMemoryError): [36mray::ImplicitFunc.train()[39m (pid=19619, ip=172.28.0.12, actor_i


Trial _train_tune_65a60f7c errored after 0 iterations at 2024-11-12 19:10:51. Total running time: 16min 12s
Error file: /tmp/ray/session_2024-11-12_18-17-38_352630_2326/artifacts/2024-11-12_18-54-39/_train_tune_2024-11-12_18-54-39/driver_artifacts/_train_tune_65a60f7c_14_batch_size=256,h=20,hist_exog_list=MA_2_9_MA_3_9_MA_1_12_MA_2_12_MA_3_12_MOM_9_MOM_12_RSI_7_RSI_14_EMA_3_9_2024-11-12_19-09-10/error.txt


[36m(_train_tune pid=19723)[0m /usr/local/lib/python3.10/dist-packages/ray/tune/integration/pytorch_lightning.py:198: `ray.tune.integration.pytorch_lightning.TuneReportCallback` is deprecated. Use `ray.tune.integration.pytorch_lightning.TuneReportCheckpointCallback` instead.
[36m(_train_tune pid=19723)[0m Seed set to 42
[36m(_train_tune pid=19723)[0m GPU available: True (cuda), used: True
[36m(_train_tune pid=19723)[0m TPU available: False, using: 0 TPU cores
[36m(_train_tune pid=19723)[0m HPU available: False, using: 0 HPUs
[36m(_train_tune pid=19723)[0m You are using a CUDA device ('NVIDIA A100-SXM4-40GB') that has Tensor Cores. To properly utilize them, you should set `torch.set_float32_matmul_precision('medium' | 'high')` which will trade-off precision for performance. For more details, read https://pytorch.org/docs/stable/generated/torch.set_float32_matmul_precision.html#torch.set_float32_matmul_precision
[36m(_train_tune pid=19723)[0m 2024-11-12 19:10:59.449016: I t

Sanity Checking: |          | 0/? [00:00<?, ?it/s]
Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Epoch 0:   0%|          | 0/4 [00:00<?, ?it/s] 
Epoch 1:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=13.10, train_loss_epoch=11.40]
Epoch 2:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=13.60, train_loss_epoch=6.01e+4]
Epoch 3:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=15.70, train_loss_epoch=15.30]
Epoch 4:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=29.20, train_loss_epoch=28.90]
Epoch 5:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=30.90, train_loss_epoch=30.40]
Epoch 6:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=19.90, train_loss_epoch=24.70]
Epoch 7:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=18.90, train_loss_epoch=19.70]
Epoch 8:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=20.10, train_loss_epoch=20.40]
Epoch 9

2024-11-12 19:12:26,650	INFO tensorboardx.py:308 -- Removed the following hyperparameter values when logging to tensorboard: {'hist_exog_list': ('MA(2,9)', 'MA(3,9)', 'MA(1,12)', 'MA(2,12)', 'MA(3,12)', 'MOM(9)', 'MOM(12)', 'RSI(7)', 'RSI(14)', 'EMA(3,9)', 'EMA(5,9)', 'EMA(5,12)', 'DY', 'PTBV', 'P', 'PO', 'VO', 'PE'), 'loss': ('__ref_ph', 'de895953'), 'n_freq_downsample': (24, 12, 1), 'n_pool_kernel_size': (2, 2, 2), 'valid_loss': ('__ref_ph', '004b9a7a')}
[36m(_train_tune pid=19723)[0m `Trainer.fit` stopped: `max_steps=1100.0` reached.


[36m(_train_tune pid=19723)[0m 
[36m(_train_tune pid=19723)[0m Validation DataLoader 0: 100%|██████████| 4/4 [00:00<00:00, 15.29it/s][A
[36m(_train_tune pid=19723)[0m                                                                       [AEpoch 274: 100%|██████████| 4/4 [00:00<00:00,  6.09it/s, v_num=0, train_loss_step=9.820, train_loss_epoch=9.670, valid_loss=9.150]Epoch 274: 100%|██████████| 4/4 [00:00<00:00,  6.08it/s, v_num=0, train_loss_step=9.820, train_loss_epoch=9.540, valid_loss=9.150]Epoch 274: 100%|██████████| 4/4 [00:00<00:00,  6.07it/s, v_num=0, train_loss_step=9.820, train_loss_epoch=9.540, valid_loss=9.150]


[36m(_train_tune pid=20179)[0m /usr/local/lib/python3.10/dist-packages/ray/tune/integration/pytorch_lightning.py:198: `ray.tune.integration.pytorch_lightning.TuneReportCallback` is deprecated. Use `ray.tune.integration.pytorch_lightning.TuneReportCheckpointCallback` instead.
[36m(_train_tune pid=20179)[0m Seed set to 42
[36m(_train_tune pid=20179)[0m GPU available: True (cuda), used: True
[36m(_train_tune pid=20179)[0m TPU available: False, using: 0 TPU cores
[36m(_train_tune pid=20179)[0m HPU available: False, using: 0 HPUs
[36m(_train_tune pid=20179)[0m You are using a CUDA device ('NVIDIA A100-SXM4-40GB') that has Tensor Cores. To properly utilize them, you should set `torch.set_float32_matmul_precision('medium' | 'high')` which will trade-off precision for performance. For more details, read https://pytorch.org/docs/stable/generated/torch.set_float32_matmul_precision.html#torch.set_float32_matmul_precision
[36m(_train_tune pid=20179)[0m 2024-11-12 19:12:34.467402: I t

Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Epoch 0:   0%|          | 0/13 [00:00<?, ?it/s] 
Epoch 1:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.50, train_loss_epoch=-1.31]
Epoch 2:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.21, train_loss_epoch=-1.57]
Epoch 3:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.95, train_loss_epoch=-1.59]
Epoch 4:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.51, train_loss_epoch=-1.61]
Epoch 5:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.00, train_loss_epoch=-1.67]
Epoch 6:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.59, train_loss_epoch=-1.67]
Epoch 7:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.64, train_loss_epoch=-1.68]
[36m(_train_tune pid=20179)[0m 
Validation: |          | 0/? [00:00<?, ?it/s][A
Validation:   0%|          | 0/13 [00:00<?, ?it/s][A
Validation DataLoa

2024-11-12 19:12:57,559	INFO tensorboardx.py:308 -- Removed the following hyperparameter values when logging to tensorboard: {'hist_exog_list': ('MA(2,9)', 'MA(3,9)', 'MA(1,12)', 'MA(2,12)', 'MA(3,12)', 'MOM(9)', 'MOM(12)', 'RSI(7)', 'RSI(14)', 'EMA(3,9)', 'EMA(5,9)', 'EMA(5,12)', 'DY', 'PTBV', 'P', 'PO', 'VO', 'PE'), 'loss': ('__ref_ph', 'de895953'), 'n_freq_downsample': (168, 24, 1), 'n_pool_kernel_size': (1, 1, 1), 'valid_loss': ('__ref_ph', '004b9a7a')}
[36m(_train_tune pid=20179)[0m `Trainer.fit` stopped: `max_steps=700.0` reached.


[36m(_train_tune pid=20179)[0m 
[36m(_train_tune pid=20179)[0m Validation DataLoader 0: 100%|██████████| 13/13 [00:00<00:00, 45.14it/s][A
[36m(_train_tune pid=20179)[0m                                                                         [AEpoch 53:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.97, train_loss_epoch=-2.01, valid_loss=-1.60]Epoch 53:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.97, train_loss_epoch=-2.00, valid_loss=-1.60]Epoch 53:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.97, train_loss_epoch=-2.00, valid_loss=-1.60]


[36m(_train_tune pid=20368)[0m /usr/local/lib/python3.10/dist-packages/ray/tune/integration/pytorch_lightning.py:198: `ray.tune.integration.pytorch_lightning.TuneReportCallback` is deprecated. Use `ray.tune.integration.pytorch_lightning.TuneReportCheckpointCallback` instead.
[36m(_train_tune pid=20368)[0m Seed set to 42
[36m(_train_tune pid=20368)[0m GPU available: True (cuda), used: True
[36m(_train_tune pid=20368)[0m TPU available: False, using: 0 TPU cores
[36m(_train_tune pid=20368)[0m HPU available: False, using: 0 HPUs
[36m(_train_tune pid=20368)[0m You are using a CUDA device ('NVIDIA A100-SXM4-40GB') that has Tensor Cores. To properly utilize them, you should set `torch.set_float32_matmul_precision('medium' | 'high')` which will trade-off precision for performance. For more details, read https://pytorch.org/docs/stable/generated/torch.set_float32_matmul_precision.html#torch.set_float32_matmul_precision
[36m(_train_tune pid=20368)[0m 2024-11-12 19:13:05.521238: I t

Sanity Checking: |          | 0/? [00:00<?, ?it/s]
Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Epoch 0:   0%|          | 0/2 [00:00<?, ?it/s] 
Epoch 1:   0%|          | 0/2 [00:00<?, ?it/s, v_num=0, train_loss_step=2.720, train_loss_epoch=0.747]
Epoch 2:   0%|          | 0/2 [00:00<?, ?it/s, v_num=0, train_loss_step=4.210, train_loss_epoch=5.440]
Epoch 3:   0%|          | 0/2 [00:00<?, ?it/s, v_num=0, train_loss_step=3.480, train_loss_epoch=4.030]
Epoch 4:   0%|          | 0/2 [00:00<?, ?it/s, v_num=0, train_loss_step=3.650, train_loss_epoch=3.390]
Epoch 5:   0%|          | 0/2 [00:00<?, ?it/s, v_num=0, train_loss_step=3.660, train_loss_epoch=3.730]
Epoch 6:   0%|          | 0/2 [00:00<?, ?it/s, v_num=0, train_loss_step=2.690, train_loss_epoch=2.810]
Epoch 7:   0%|          | 0/2 [00:00<?, ?it/s, v_num=0, train_loss_step=2.430, train_loss_epoch=2.990]
Epoch 8:   0%|          | 0/2 [00:00<?, ?it/s, v_num=0, train_loss_step=3.140, train_loss_epoch=3.110]
Epoch 8: 

[36m(_train_tune pid=20368)[0m `Trainer.fit` stopped: `max_steps=500.0` reached.
2024-11-12 19:14:23,989	INFO tensorboardx.py:308 -- Removed the following hyperparameter values when logging to tensorboard: {'hist_exog_list': ('MA(2,9)', 'MA(3,9)', 'MA(1,12)', 'MA(2,12)', 'MA(3,12)', 'MOM(9)', 'MOM(12)', 'RSI(7)', 'RSI(14)', 'EMA(3,9)', 'EMA(5,9)', 'EMA(5,12)', 'DY', 'PTBV', 'P', 'PO', 'VO', 'PE'), 'loss': ('__ref_ph', 'de895953'), 'n_freq_downsample': (60, 8, 1), 'n_pool_kernel_size': (1, 1, 1), 'valid_loss': ('__ref_ph', '004b9a7a')}


[36m(_train_tune pid=20368)[0m 
[36m(_train_tune pid=20368)[0m Validation DataLoader 0: 100%|██████████| 2/2 [00:00<00:00, 10.24it/s][A
[36m(_train_tune pid=20368)[0m                                                                       [AEpoch 249: 100%|██████████| 2/2 [00:00<00:00,  3.11it/s, v_num=0, train_loss_step=-1.68, train_loss_epoch=-1.64, valid_loss=-1.58]Epoch 249: 100%|██████████| 2/2 [00:00<00:00,  3.09it/s, v_num=0, train_loss_step=-1.68, train_loss_epoch=-1.70, valid_loss=-1.58]Epoch 249: 100%|██████████| 2/2 [00:00<00:00,  3.08it/s, v_num=0, train_loss_step=-1.68, train_loss_epoch=-1.70, valid_loss=-1.58]


[36m(_train_tune pid=20786)[0m /usr/local/lib/python3.10/dist-packages/ray/tune/integration/pytorch_lightning.py:198: `ray.tune.integration.pytorch_lightning.TuneReportCallback` is deprecated. Use `ray.tune.integration.pytorch_lightning.TuneReportCheckpointCallback` instead.
[36m(_train_tune pid=20786)[0m Seed set to 42
[36m(_train_tune pid=20786)[0m GPU available: True (cuda), used: True
[36m(_train_tune pid=20786)[0m TPU available: False, using: 0 TPU cores
[36m(_train_tune pid=20786)[0m HPU available: False, using: 0 HPUs
[36m(_train_tune pid=20786)[0m You are using a CUDA device ('NVIDIA A100-SXM4-40GB') that has Tensor Cores. To properly utilize them, you should set `torch.set_float32_matmul_precision('medium' | 'high')` which will trade-off precision for performance. For more details, read https://pytorch.org/docs/stable/generated/torch.set_float32_matmul_precision.html#torch.set_float32_matmul_precision
[36m(_train_tune pid=20786)[0m 2024-11-12 19:14:32.490515: I t

Sanity Checking: |          | 0/? [00:00<?, ?it/s]
Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Epoch 0:   0%|          | 0/13 [00:00<?, ?it/s] 
Epoch 1:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.38, train_loss_epoch=-1.41]
Epoch 2:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.03, train_loss_epoch=-1.54]
Epoch 3:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.77, train_loss_epoch=-1.59]
Epoch 4:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.42, train_loss_epoch=-1.58]
Epoch 5:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.07, train_loss_epoch=-1.69]
Epoch 6:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.74, train_loss_epoch=-1.71]
Epoch 7:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.05, train_loss_epoch=-1.81]
[36m(_train_tune pid=20786)[0m 
Validation: |          | 0/? [00:00<?, ?it/s][A
Validation:   0%|    

2024-11-12 19:15:44,809	INFO tensorboardx.py:308 -- Removed the following hyperparameter values when logging to tensorboard: {'hist_exog_list': ('MA(2,9)', 'MA(3,9)', 'MA(1,12)', 'MA(2,12)', 'MA(3,12)', 'MOM(9)', 'MOM(12)', 'RSI(7)', 'RSI(14)', 'EMA(3,9)', 'EMA(5,9)', 'EMA(5,12)', 'DY', 'PTBV', 'P', 'PO', 'VO', 'PE'), 'loss': ('__ref_ph', 'de895953'), 'n_freq_downsample': (24, 12, 1), 'n_pool_kernel_size': (16, 8, 1), 'valid_loss': ('__ref_ph', '004b9a7a')}
[36m(_train_tune pid=20786)[0m `Trainer.fit` stopped: `max_steps=1500.0` reached.


[36m(_train_tune pid=20786)[0m 
[36m(_train_tune pid=20786)[0m Validation DataLoader 0: 100%|██████████| 13/13 [00:01<00:00,  7.09it/s][A
[36m(_train_tune pid=20786)[0m                                                                         [AEpoch 115:   0%|          | 0/13 [00:02<?, ?it/s, v_num=0, train_loss_step=-2.03, train_loss_epoch=-1.98, valid_loss=-1.95]Epoch 115:   0%|          | 0/13 [00:02<?, ?it/s, v_num=0, train_loss_step=-2.03, train_loss_epoch=-1.98, valid_loss=-1.95]Epoch 115:   0%|          | 0/13 [00:02<?, ?it/s, v_num=0, train_loss_step=-2.03, train_loss_epoch=-1.98, valid_loss=-1.95]


[36m(_train_tune pid=21180)[0m /usr/local/lib/python3.10/dist-packages/ray/tune/integration/pytorch_lightning.py:198: `ray.tune.integration.pytorch_lightning.TuneReportCallback` is deprecated. Use `ray.tune.integration.pytorch_lightning.TuneReportCheckpointCallback` instead.
[36m(_train_tune pid=21180)[0m Seed set to 42
[36m(_train_tune pid=21180)[0m GPU available: True (cuda), used: True
[36m(_train_tune pid=21180)[0m TPU available: False, using: 0 TPU cores
[36m(_train_tune pid=21180)[0m HPU available: False, using: 0 HPUs
[36m(_train_tune pid=21180)[0m You are using a CUDA device ('NVIDIA A100-SXM4-40GB') that has Tensor Cores. To properly utilize them, you should set `torch.set_float32_matmul_precision('medium' | 'high')` which will trade-off precision for performance. For more details, read https://pytorch.org/docs/stable/generated/torch.set_float32_matmul_precision.html#torch.set_float32_matmul_precision
[36m(_train_tune pid=21180)[0m 2024-11-12 19:15:52.535556: I t

Sanity Checking: |          | 0/? [00:00<?, ?it/s]
Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Epoch 0:   0%|          | 0/7 [00:00<?, ?it/s] 
Epoch 1:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=7.940, train_loss_epoch=10.60]
Epoch 2:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=6.850, train_loss_epoch=7.810]
Epoch 3:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=7.010, train_loss_epoch=7.120]
Epoch 4:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=6.540, train_loss_epoch=6.840]
Epoch 5:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=7.550, train_loss_epoch=7.660]
Epoch 6:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=7.000, train_loss_epoch=7.170]
Epoch 7:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=4.960, train_loss_epoch=6.190]
Epoch 8:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=7.240, train_loss_epoch=7.530]
Epoch 9: 

2024-11-12 19:16:36,799	INFO tensorboardx.py:308 -- Removed the following hyperparameter values when logging to tensorboard: {'hist_exog_list': ('MA(2,9)', 'MA(3,9)', 'MA(1,12)', 'MA(2,12)', 'MA(3,12)', 'MOM(9)', 'MOM(12)', 'RSI(7)', 'RSI(14)', 'EMA(3,9)', 'EMA(5,9)', 'EMA(5,12)', 'DY', 'PTBV', 'P', 'PO', 'VO', 'PE'), 'loss': ('__ref_ph', 'de895953'), 'n_freq_downsample': (24, 12, 1), 'n_pool_kernel_size': (2, 2, 1), 'valid_loss': ('__ref_ph', '004b9a7a')}
[36m(_train_tune pid=21180)[0m `Trainer.fit` stopped: `max_steps=700.0` reached.


[36m(_train_tune pid=21180)[0m 
[36m(_train_tune pid=21180)[0m Validation DataLoader 0: 100%|██████████| 7/7 [00:01<00:00,  3.71it/s][A
[36m(_train_tune pid=21180)[0m                                                                       [AEpoch 99: 100%|██████████| 7/7 [00:02<00:00,  3.20it/s, v_num=0, train_loss_step=-0.152, train_loss_epoch=0.109, valid_loss=-0.0529]Epoch 99: 100%|██████████| 7/7 [00:02<00:00,  3.20it/s, v_num=0, train_loss_step=-0.152, train_loss_epoch=-0.0969, valid_loss=-0.0529]Epoch 99: 100%|██████████| 7/7 [00:02<00:00,  3.20it/s, v_num=0, train_loss_step=-0.152, train_loss_epoch=-0.0969, valid_loss=-0.0529]


[36m(_train_tune pid=21455)[0m /usr/local/lib/python3.10/dist-packages/ray/tune/integration/pytorch_lightning.py:198: `ray.tune.integration.pytorch_lightning.TuneReportCallback` is deprecated. Use `ray.tune.integration.pytorch_lightning.TuneReportCheckpointCallback` instead.
[36m(_train_tune pid=21455)[0m Seed set to 42
[36m(_train_tune pid=21455)[0m GPU available: True (cuda), used: True
[36m(_train_tune pid=21455)[0m TPU available: False, using: 0 TPU cores
[36m(_train_tune pid=21455)[0m HPU available: False, using: 0 HPUs
[36m(_train_tune pid=21455)[0m You are using a CUDA device ('NVIDIA A100-SXM4-40GB') that has Tensor Cores. To properly utilize them, you should set `torch.set_float32_matmul_precision('medium' | 'high')` which will trade-off precision for performance. For more details, read https://pytorch.org/docs/stable/generated/torch.set_float32_matmul_precision.html#torch.set_float32_matmul_precision
[36m(_train_tune pid=21455)[0m 2024-11-12 19:16:44.655474: I t

Sanity Checking: |          | 0/? [00:00<?, ?it/s]
Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Epoch 0:   0%|          | 0/7 [00:00<?, ?it/s] 
Epoch 1:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.16, train_loss_epoch=-1.20]
Epoch 2:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.73, train_loss_epoch=-1.27]
Epoch 3:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.58, train_loss_epoch=-1.23]
Epoch 4:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.10, train_loss_epoch=-1.21]
Epoch 5:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.76, train_loss_epoch=-1.38]
Epoch 6:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.17, train_loss_epoch=-1.19]
Epoch 7:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-0.712, train_loss_epoch=-1.16]
Epoch 8:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.12, train_loss_epoch=-1.30]
Epoch 9:

2024-11-12 19:17:31,417	INFO tensorboardx.py:308 -- Removed the following hyperparameter values when logging to tensorboard: {'hist_exog_list': ('MA(2,9)', 'MA(3,9)', 'MA(1,12)', 'MA(2,12)', 'MA(3,12)', 'MOM(9)', 'MOM(12)', 'RSI(7)', 'RSI(14)', 'EMA(3,9)', 'EMA(5,9)', 'EMA(5,12)', 'DY', 'PTBV', 'P', 'PO', 'VO', 'PE'), 'loss': ('__ref_ph', 'de895953'), 'n_freq_downsample': (40, 20, 1), 'n_pool_kernel_size': (16, 8, 1), 'valid_loss': ('__ref_ph', '004b9a7a')}


[36m(_train_tune pid=21455)[0m 
[36m(_train_tune pid=21455)[0m Validation:   0%|          | 0/7 [00:00<?, ?it/s][A
[36m(_train_tune pid=21455)[0m Validation DataLoader 0:   0%|          | 0/7 [00:00<?, ?it/s][A


[36m(_train_tune pid=21455)[0m `Trainer.fit` stopped: `max_steps=1200.0` reached.


[36m(_train_tune pid=21455)[0m 
[36m(_train_tune pid=21455)[0m Validation DataLoader 0: 100%|██████████| 7/7 [00:00<00:00, 28.08it/s][A
[36m(_train_tune pid=21455)[0m                                                                       [AEpoch 171:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.94, train_loss_epoch=-1.82, valid_loss=-1.68]Epoch 171:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.94, train_loss_epoch=-1.84, valid_loss=-1.68]Epoch 171:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.94, train_loss_epoch=-1.84, valid_loss=-1.68]


[36m(_train_tune pid=21747)[0m /usr/local/lib/python3.10/dist-packages/ray/tune/integration/pytorch_lightning.py:198: `ray.tune.integration.pytorch_lightning.TuneReportCallback` is deprecated. Use `ray.tune.integration.pytorch_lightning.TuneReportCheckpointCallback` instead.
[36m(_train_tune pid=21747)[0m Seed set to 42
[36m(_train_tune pid=21747)[0m GPU available: True (cuda), used: True
[36m(_train_tune pid=21747)[0m TPU available: False, using: 0 TPU cores
[36m(_train_tune pid=21747)[0m HPU available: False, using: 0 HPUs
[36m(_train_tune pid=21747)[0m You are using a CUDA device ('NVIDIA A100-SXM4-40GB') that has Tensor Cores. To properly utilize them, you should set `torch.set_float32_matmul_precision('medium' | 'high')` which will trade-off precision for performance. For more details, read https://pytorch.org/docs/stable/generated/torch.set_float32_matmul_precision.html#torch.set_float32_matmul_precision
[36m(_train_tune pid=21747)[0m 2024-11-12 19:17:39.447980: I t

Sanity Checking: |          | 0/? [00:00<?, ?it/s]
Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Epoch 0:   0%|          | 0/7 [00:00<?, ?it/s] 
Epoch 1:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=8.310, train_loss_epoch=26.40]
Epoch 2:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=5.470, train_loss_epoch=7.060]
Epoch 3:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=6.140, train_loss_epoch=6.310]
Epoch 4:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=5.020, train_loss_epoch=6.080]
Epoch 5:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=5.690, train_loss_epoch=5.820]
Epoch 6:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=6.110, train_loss_epoch=5.780]
Epoch 7:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=4.420, train_loss_epoch=5.600]
Epoch 8:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=5.370, train_loss_epoch=5.750]
Epoch 9: 

2024-11-12 19:18:10,733	INFO tensorboardx.py:308 -- Removed the following hyperparameter values when logging to tensorboard: {'hist_exog_list': ('MA(2,9)', 'MA(3,9)', 'MA(1,12)', 'MA(2,12)', 'MA(3,12)', 'MOM(9)', 'MOM(12)', 'RSI(7)', 'RSI(14)', 'EMA(3,9)', 'EMA(5,9)', 'EMA(5,12)', 'DY', 'PTBV', 'P', 'PO', 'VO', 'PE'), 'loss': ('__ref_ph', 'de895953'), 'n_freq_downsample': (1, 1, 1), 'n_pool_kernel_size': (16, 8, 1), 'valid_loss': ('__ref_ph', '004b9a7a')}
[36m(_train_tune pid=21747)[0m `Trainer.fit` stopped: `max_steps=800.0` reached.


[36m(_train_tune pid=21747)[0m 
[36m(_train_tune pid=21747)[0m Validation DataLoader 0: 100%|██████████| 7/7 [00:00<00:00, 27.00it/s][A
[36m(_train_tune pid=21747)[0m                                                                       [AEpoch 114:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=4.720, train_loss_epoch=4.870, valid_loss=4.680]Epoch 114:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=4.720, train_loss_epoch=4.810, valid_loss=4.680]Epoch 114:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=4.720, train_loss_epoch=4.810, valid_loss=4.680]


[36m(_train_tune pid=21972)[0m /usr/local/lib/python3.10/dist-packages/ray/tune/integration/pytorch_lightning.py:198: `ray.tune.integration.pytorch_lightning.TuneReportCallback` is deprecated. Use `ray.tune.integration.pytorch_lightning.TuneReportCheckpointCallback` instead.
[36m(_train_tune pid=21972)[0m Seed set to 42
[36m(_train_tune pid=21972)[0m GPU available: True (cuda), used: True
[36m(_train_tune pid=21972)[0m TPU available: False, using: 0 TPU cores
[36m(_train_tune pid=21972)[0m HPU available: False, using: 0 HPUs
[36m(_train_tune pid=21972)[0m You are using a CUDA device ('NVIDIA A100-SXM4-40GB') that has Tensor Cores. To properly utilize them, you should set `torch.set_float32_matmul_precision('medium' | 'high')` which will trade-off precision for performance. For more details, read https://pytorch.org/docs/stable/generated/torch.set_float32_matmul_precision.html#torch.set_float32_matmul_precision
[36m(_train_tune pid=21972)[0m 2024-11-12 19:18:18.511203: I t

Sanity Checking: |          | 0/? [00:00<?, ?it/s]
Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Epoch 0:   0%|          | 0/7 [00:00<?, ?it/s] 
Epoch 1:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.47, train_loss_epoch=-1.47]
Epoch 2:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.27, train_loss_epoch=-1.71]
Epoch 3:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.07, train_loss_epoch=-1.75]
Epoch 4:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.60, train_loss_epoch=-1.75]
Epoch 5:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.10, train_loss_epoch=-1.82]
Epoch 6:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.67, train_loss_epoch=-1.78]
Epoch 7:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.94, train_loss_epoch=-1.86]
Epoch 8:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.65, train_loss_epoch=-1.82]
Epoch 9: 

2024-11-12 19:19:24,557	INFO tensorboardx.py:308 -- Removed the following hyperparameter values when logging to tensorboard: {'hist_exog_list': ('MA(2,9)', 'MA(3,9)', 'MA(1,12)', 'MA(2,12)', 'MA(3,12)', 'MOM(9)', 'MOM(12)', 'RSI(7)', 'RSI(14)', 'EMA(3,9)', 'EMA(5,9)', 'EMA(5,12)', 'DY', 'PTBV', 'P', 'PO', 'VO', 'PE'), 'loss': ('__ref_ph', 'de895953'), 'n_freq_downsample': (168, 24, 1), 'n_pool_kernel_size': (16, 8, 1), 'valid_loss': ('__ref_ph', '004b9a7a')}
[36m(_train_tune pid=21972)[0m `Trainer.fit` stopped: `max_steps=900.0` reached.


[36m(_train_tune pid=21972)[0m 
[36m(_train_tune pid=21972)[0m Validation DataLoader 0: 100%|██████████| 7/7 [00:01<00:00,  3.54it/s][A
[36m(_train_tune pid=21972)[0m                                                                       [AEpoch 128:   0%|          | 0/7 [00:02<?, ?it/s, v_num=0, train_loss_step=-2.16, train_loss_epoch=-2.11, valid_loss=-2.05]Epoch 128:   0%|          | 0/7 [00:02<?, ?it/s, v_num=0, train_loss_step=-2.16, train_loss_epoch=-2.14, valid_loss=-2.05]Epoch 128:   0%|          | 0/7 [00:02<?, ?it/s, v_num=0, train_loss_step=-2.16, train_loss_epoch=-2.14, valid_loss=-2.05]


[36m(_train_tune pid=22342)[0m /usr/local/lib/python3.10/dist-packages/ray/tune/integration/pytorch_lightning.py:198: `ray.tune.integration.pytorch_lightning.TuneReportCallback` is deprecated. Use `ray.tune.integration.pytorch_lightning.TuneReportCheckpointCallback` instead.
[36m(_train_tune pid=22342)[0m Seed set to 42
[36m(_train_tune pid=22342)[0m GPU available: True (cuda), used: True
[36m(_train_tune pid=22342)[0m TPU available: False, using: 0 TPU cores
[36m(_train_tune pid=22342)[0m HPU available: False, using: 0 HPUs
[36m(_train_tune pid=22342)[0m You are using a CUDA device ('NVIDIA A100-SXM4-40GB') that has Tensor Cores. To properly utilize them, you should set `torch.set_float32_matmul_precision('medium' | 'high')` which will trade-off precision for performance. For more details, read https://pytorch.org/docs/stable/generated/torch.set_float32_matmul_precision.html#torch.set_float32_matmul_precision
[36m(_train_tune pid=22342)[0m 2024-11-12 19:19:32.667907: I t

Sanity Checking: |          | 0/? [00:00<?, ?it/s]
Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Epoch 0:   0%|          | 0/4 [00:00<?, ?it/s] 
Epoch 1:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=8.370, train_loss_epoch=79.80]
Epoch 2:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=8.810, train_loss_epoch=9.050]
Epoch 3:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=9.940, train_loss_epoch=9.930]
Epoch 4:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=9.200, train_loss_epoch=9.850]
Epoch 5:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=9.630, train_loss_epoch=9.920]
Epoch 6:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=9.650, train_loss_epoch=9.600]
Epoch 7:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=8.470, train_loss_epoch=9.300]
Epoch 8:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=9.680, train_loss_epoch=9.890]
Epoch 9: 

[36m(_train_tune pid=22342)[0m `Trainer.fit` stopped: `max_steps=1100.0` reached.
2024-11-12 19:21:36,429	INFO tensorboardx.py:308 -- Removed the following hyperparameter values when logging to tensorboard: {'hist_exog_list': ('MA(2,9)', 'MA(3,9)', 'MA(1,12)', 'MA(2,12)', 'MA(3,12)', 'MOM(9)', 'MOM(12)', 'RSI(7)', 'RSI(14)', 'EMA(3,9)', 'EMA(5,9)', 'EMA(5,12)', 'DY', 'PTBV', 'P', 'PO', 'VO', 'PE'), 'loss': ('__ref_ph', 'de895953'), 'n_freq_downsample': (40, 20, 1), 'n_pool_kernel_size': (4, 4, 4), 'valid_loss': ('__ref_ph', '004b9a7a')}


[36m(_train_tune pid=22342)[0m 
[36m(_train_tune pid=22342)[0m Validation DataLoader 0: 100%|██████████| 4/4 [00:01<00:00,  2.01it/s][A
[36m(_train_tune pid=22342)[0m                                                                       [AEpoch 274: 100%|██████████| 4/4 [00:02<00:00,  1.64it/s, v_num=0, train_loss_step=6.860, train_loss_epoch=6.620, valid_loss=6.160]Epoch 274: 100%|██████████| 4/4 [00:02<00:00,  1.64it/s, v_num=0, train_loss_step=6.860, train_loss_epoch=6.350, valid_loss=6.160]Epoch 274: 100%|██████████| 4/4 [00:02<00:00,  1.64it/s, v_num=0, train_loss_step=6.860, train_loss_epoch=6.350, valid_loss=6.160]


[36m(_train_tune pid=22951)[0m /usr/local/lib/python3.10/dist-packages/ray/tune/integration/pytorch_lightning.py:198: `ray.tune.integration.pytorch_lightning.TuneReportCallback` is deprecated. Use `ray.tune.integration.pytorch_lightning.TuneReportCheckpointCallback` instead.
[36m(_train_tune pid=22951)[0m Seed set to 42
[36m(_train_tune pid=22951)[0m GPU available: True (cuda), used: True
[36m(_train_tune pid=22951)[0m TPU available: False, using: 0 TPU cores
[36m(_train_tune pid=22951)[0m HPU available: False, using: 0 HPUs
[36m(_train_tune pid=22951)[0m You are using a CUDA device ('NVIDIA A100-SXM4-40GB') that has Tensor Cores. To properly utilize them, you should set `torch.set_float32_matmul_precision('medium' | 'high')` which will trade-off precision for performance. For more details, read https://pytorch.org/docs/stable/generated/torch.set_float32_matmul_precision.html#torch.set_float32_matmul_precision
[36m(_train_tune pid=22951)[0m 2024-11-12 19:21:44.560690: I t

Sanity Checking: |          | 0/? [00:00<?, ?it/s]
Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Epoch 0:   0%|          | 0/4 [00:00<?, ?it/s] 
Epoch 1:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.38, train_loss_epoch=-1.43]
Epoch 1: 100%|██████████| 4/4 [00:00<00:00, 12.02it/s, v_num=0, train_loss_step=-1.96, train_loss_epoch=-1.43]
Epoch 2:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.96, train_loss_epoch=-1.55]
Epoch 3:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.79, train_loss_epoch=-1.51]
Epoch 4:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.29, train_loss_epoch=-1.36]
Epoch 5:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.82, train_loss_epoch=-1.52]
Epoch 6:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.24, train_loss_epoch=-1.43]
Epoch 7:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.55, train_loss_epoch=-1.47]
E

2024-11-12 19:23:25,087	INFO tensorboardx.py:308 -- Removed the following hyperparameter values when logging to tensorboard: {'hist_exog_list': ('MA(2,9)', 'MA(3,9)', 'MA(1,12)', 'MA(2,12)', 'MA(3,12)', 'MOM(9)', 'MOM(12)', 'RSI(7)', 'RSI(14)', 'EMA(3,9)', 'EMA(5,9)', 'EMA(5,12)', 'DY', 'PTBV', 'P', 'PO', 'VO', 'PE'), 'loss': ('__ref_ph', 'de895953'), 'n_freq_downsample': (168, 24, 1), 'n_pool_kernel_size': (8, 4, 1), 'valid_loss': ('__ref_ph', '004b9a7a')}
[36m(_train_tune pid=22951)[0m `Trainer.fit` stopped: `max_steps=900.0` reached.


[36m(_train_tune pid=22951)[0m 
[36m(_train_tune pid=22951)[0m Validation DataLoader 0: 100%|██████████| 4/4 [00:02<00:00,  1.98it/s][A
[36m(_train_tune pid=22951)[0m                                                                       [AEpoch 224: 100%|██████████| 4/4 [00:02<00:00,  1.64it/s, v_num=0, train_loss_step=-0.956, train_loss_epoch=-1.84, valid_loss=-1.84]Epoch 224: 100%|██████████| 4/4 [00:02<00:00,  1.64it/s, v_num=0, train_loss_step=-0.956, train_loss_epoch=-1.60, valid_loss=-1.84]Epoch 224: 100%|██████████| 4/4 [00:02<00:00,  1.64it/s, v_num=0, train_loss_step=-0.956, train_loss_epoch=-1.60, valid_loss=-1.84]


[36m(_train_tune pid=23466)[0m /usr/local/lib/python3.10/dist-packages/ray/tune/integration/pytorch_lightning.py:198: `ray.tune.integration.pytorch_lightning.TuneReportCallback` is deprecated. Use `ray.tune.integration.pytorch_lightning.TuneReportCheckpointCallback` instead.
[36m(_train_tune pid=23466)[0m Seed set to 42
[36m(_train_tune pid=23466)[0m GPU available: True (cuda), used: True
[36m(_train_tune pid=23466)[0m TPU available: False, using: 0 TPU cores
[36m(_train_tune pid=23466)[0m HPU available: False, using: 0 HPUs
[36m(_train_tune pid=23466)[0m You are using a CUDA device ('NVIDIA A100-SXM4-40GB') that has Tensor Cores. To properly utilize them, you should set `torch.set_float32_matmul_precision('medium' | 'high')` which will trade-off precision for performance. For more details, read https://pytorch.org/docs/stable/generated/torch.set_float32_matmul_precision.html#torch.set_float32_matmul_precision
[36m(_train_tune pid=23466)[0m 2024-11-12 19:23:33.745100: I t

Sanity Checking: |          | 0/? [00:00<?, ?it/s]
Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]


2024-11-12 19:23:37,994	ERROR tune_controller.py:1331 -- Trial task failed for trial _train_tune_64a1c5ae
Traceback (most recent call last):
  File "/usr/local/lib/python3.10/dist-packages/ray/air/execution/_internal/event_manager.py", line 110, in resolve_future
    result = ray.get(future)
  File "/usr/local/lib/python3.10/dist-packages/ray/_private/auto_init_hook.py", line 21, in auto_init_wrapper
    return fn(*args, **kwargs)
  File "/usr/local/lib/python3.10/dist-packages/ray/_private/client_mode_hook.py", line 103, in wrapper
    return func(*args, **kwargs)
  File "/usr/local/lib/python3.10/dist-packages/ray/_private/worker.py", line 2745, in get
    values, debugger_breakpoint = worker.get_objects(object_refs, timeout=timeout)
  File "/usr/local/lib/python3.10/dist-packages/ray/_private/worker.py", line 901, in get_objects
    raise value.as_instanceof_cause()
ray.exceptions.RayTaskError(OutOfMemoryError): [36mray::ImplicitFunc.train()[39m (pid=23466, ip=172.28.0.12, actor_i


Trial _train_tune_64a1c5ae errored after 0 iterations at 2024-11-12 19:23:37. Total running time: 28min 58s
Error file: /tmp/ray/session_2024-11-12_18-17-38_352630_2326/artifacts/2024-11-12_18-54-39/_train_tune_2024-11-12_18-54-39/driver_artifacts/_train_tune_64a1c5ae_25_batch_size=256,h=20,hist_exog_list=MA_2_9_MA_3_9_MA_1_12_MA_2_12_MA_3_12_MOM_9_MOM_12_RSI_7_RSI_14_EMA_3_9_2024-11-12_19-21-43/error.txt


[36m(_train_tune pid=23574)[0m /usr/local/lib/python3.10/dist-packages/ray/tune/integration/pytorch_lightning.py:198: `ray.tune.integration.pytorch_lightning.TuneReportCallback` is deprecated. Use `ray.tune.integration.pytorch_lightning.TuneReportCheckpointCallback` instead.
[36m(_train_tune pid=23574)[0m Seed set to 42
[36m(_train_tune pid=23574)[0m GPU available: True (cuda), used: True
[36m(_train_tune pid=23574)[0m TPU available: False, using: 0 TPU cores
[36m(_train_tune pid=23574)[0m HPU available: False, using: 0 HPUs
[36m(_train_tune pid=23574)[0m You are using a CUDA device ('NVIDIA A100-SXM4-40GB') that has Tensor Cores. To properly utilize them, you should set `torch.set_float32_matmul_precision('medium' | 'high')` which will trade-off precision for performance. For more details, read https://pytorch.org/docs/stable/generated/torch.set_float32_matmul_precision.html#torch.set_float32_matmul_precision
[36m(_train_tune pid=23574)[0m 2024-11-12 19:23:45.640258: I t

Sanity Checking: |          | 0/? [00:00<?, ?it/s]
Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Epoch 0:   0%|          | 0/7 [00:00<?, ?it/s] 
Epoch 1:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.47, train_loss_epoch=-1.47]
Epoch 2:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.27, train_loss_epoch=-1.71]
Epoch 3:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.07, train_loss_epoch=-1.75]
Epoch 4:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.60, train_loss_epoch=-1.75]
Epoch 5:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.10, train_loss_epoch=-1.82]
Epoch 6:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.67, train_loss_epoch=-1.78]
Epoch 7:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.94, train_loss_epoch=-1.86]
Epoch 8:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.65, train_loss_epoch=-1.82]
Epoch 9: 

[36m(_train_tune pid=23574)[0m `Trainer.fit` stopped: `max_steps=900.0` reached.
2024-11-12 19:24:47,616	INFO tensorboardx.py:308 -- Removed the following hyperparameter values when logging to tensorboard: {'hist_exog_list': ('MA(2,9)', 'MA(3,9)', 'MA(1,12)', 'MA(2,12)', 'MA(3,12)', 'MOM(9)', 'MOM(12)', 'RSI(7)', 'RSI(14)', 'EMA(3,9)', 'EMA(5,9)', 'EMA(5,12)', 'DY', 'PTBV', 'P', 'PO', 'VO', 'PE'), 'loss': ('__ref_ph', 'de895953'), 'n_freq_downsample': (168, 24, 1), 'n_pool_kernel_size': (16, 8, 1), 'valid_loss': ('__ref_ph', '004b9a7a')}


[36m(_train_tune pid=23574)[0m 
[36m(_train_tune pid=23574)[0m Validation DataLoader 0: 100%|██████████| 7/7 [00:01<00:00,  3.54it/s][A
[36m(_train_tune pid=23574)[0m                                                                       [AEpoch 128:   0%|          | 0/7 [00:02<?, ?it/s, v_num=0, train_loss_step=-2.16, train_loss_epoch=-2.11, valid_loss=-2.05]Epoch 128:   0%|          | 0/7 [00:02<?, ?it/s, v_num=0, train_loss_step=-2.16, train_loss_epoch=-2.14, valid_loss=-2.05]Epoch 128:   0%|          | 0/7 [00:02<?, ?it/s, v_num=0, train_loss_step=-2.16, train_loss_epoch=-2.14, valid_loss=-2.05]


[36m(_train_tune pid=23926)[0m /usr/local/lib/python3.10/dist-packages/ray/tune/integration/pytorch_lightning.py:198: `ray.tune.integration.pytorch_lightning.TuneReportCallback` is deprecated. Use `ray.tune.integration.pytorch_lightning.TuneReportCheckpointCallback` instead.
[36m(_train_tune pid=23926)[0m Seed set to 42
[36m(_train_tune pid=23926)[0m GPU available: True (cuda), used: True
[36m(_train_tune pid=23926)[0m TPU available: False, using: 0 TPU cores
[36m(_train_tune pid=23926)[0m HPU available: False, using: 0 HPUs
[36m(_train_tune pid=23926)[0m You are using a CUDA device ('NVIDIA A100-SXM4-40GB') that has Tensor Cores. To properly utilize them, you should set `torch.set_float32_matmul_precision('medium' | 'high')` which will trade-off precision for performance. For more details, read https://pytorch.org/docs/stable/generated/torch.set_float32_matmul_precision.html#torch.set_float32_matmul_precision
[36m(_train_tune pid=23926)[0m 2024-11-12 19:24:55.659728: I t

Sanity Checking: |          | 0/? [00:00<?, ?it/s]
Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]


2024-11-12 19:24:59,907	ERROR tune_controller.py:1331 -- Trial task failed for trial _train_tune_d1d0fb02
Traceback (most recent call last):
  File "/usr/local/lib/python3.10/dist-packages/ray/air/execution/_internal/event_manager.py", line 110, in resolve_future
    result = ray.get(future)
  File "/usr/local/lib/python3.10/dist-packages/ray/_private/auto_init_hook.py", line 21, in auto_init_wrapper
    return fn(*args, **kwargs)
  File "/usr/local/lib/python3.10/dist-packages/ray/_private/client_mode_hook.py", line 103, in wrapper
    return func(*args, **kwargs)
  File "/usr/local/lib/python3.10/dist-packages/ray/_private/worker.py", line 2745, in get
    values, debugger_breakpoint = worker.get_objects(object_refs, timeout=timeout)
  File "/usr/local/lib/python3.10/dist-packages/ray/_private/worker.py", line 901, in get_objects
    raise value.as_instanceof_cause()
ray.exceptions.RayTaskError(OutOfMemoryError): [36mray::ImplicitFunc.train()[39m (pid=23926, ip=172.28.0.12, actor_i


Trial _train_tune_d1d0fb02 errored after 0 iterations at 2024-11-12 19:24:59. Total running time: 30min 20s
Error file: /tmp/ray/session_2024-11-12_18-17-38_352630_2326/artifacts/2024-11-12_18-54-39/_train_tune_2024-11-12_18-54-39/driver_artifacts/_train_tune_d1d0fb02_27_batch_size=256,h=20,hist_exog_list=MA_2_9_MA_3_9_MA_1_12_MA_2_12_MA_3_12_MOM_9_MOM_12_RSI_7_RSI_14_EMA_3_9_2024-11-12_19-23-45/error.txt


[36m(_train_tune pid=24034)[0m /usr/local/lib/python3.10/dist-packages/ray/tune/integration/pytorch_lightning.py:198: `ray.tune.integration.pytorch_lightning.TuneReportCallback` is deprecated. Use `ray.tune.integration.pytorch_lightning.TuneReportCheckpointCallback` instead.
[36m(_train_tune pid=24034)[0m Seed set to 42
[36m(_train_tune pid=24034)[0m GPU available: True (cuda), used: True
[36m(_train_tune pid=24034)[0m TPU available: False, using: 0 TPU cores
[36m(_train_tune pid=24034)[0m HPU available: False, using: 0 HPUs
[36m(_train_tune pid=24034)[0m You are using a CUDA device ('NVIDIA A100-SXM4-40GB') that has Tensor Cores. To properly utilize them, you should set `torch.set_float32_matmul_precision('medium' | 'high')` which will trade-off precision for performance. For more details, read https://pytorch.org/docs/stable/generated/torch.set_float32_matmul_precision.html#torch.set_float32_matmul_precision
[36m(_train_tune pid=24034)[0m 2024-11-12 19:25:07.632481: I t

Sanity Checking: |          | 0/? [00:00<?, ?it/s]
Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Epoch 0:   0%|          | 0/7 [00:00<?, ?it/s] 
Epoch 1:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.47, train_loss_epoch=-1.47]
Epoch 2:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.27, train_loss_epoch=-1.71]
Epoch 3:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.07, train_loss_epoch=-1.75]
Epoch 3: 100%|██████████| 7/7 [00:00<00:00, 20.52it/s, v_num=0, train_loss_step=-1.60, train_loss_epoch=-1.75]
Epoch 4:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.60, train_loss_epoch=-1.75]
Epoch 5:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.10, train_loss_epoch=-1.82]
Epoch 6:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.67, train_loss_epoch=-1.78]
Epoch 7:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.94, train_loss_epoch=-1.86]
E

2024-11-12 19:26:11,970	INFO tensorboardx.py:308 -- Removed the following hyperparameter values when logging to tensorboard: {'hist_exog_list': ('MA(2,9)', 'MA(3,9)', 'MA(1,12)', 'MA(2,12)', 'MA(3,12)', 'MOM(9)', 'MOM(12)', 'RSI(7)', 'RSI(14)', 'EMA(3,9)', 'EMA(5,9)', 'EMA(5,12)', 'DY', 'PTBV', 'P', 'PO', 'VO', 'PE'), 'loss': ('__ref_ph', 'de895953'), 'n_freq_downsample': (168, 24, 1), 'n_pool_kernel_size': (16, 8, 1), 'valid_loss': ('__ref_ph', '004b9a7a')}
[36m(_train_tune pid=24034)[0m `Trainer.fit` stopped: `max_steps=900.0` reached.


[36m(_train_tune pid=24034)[0m 
[36m(_train_tune pid=24034)[0m Validation DataLoader 0: 100%|██████████| 7/7 [00:01<00:00,  3.52it/s][A
[36m(_train_tune pid=24034)[0m                                                                       [AEpoch 128:   0%|          | 0/7 [00:02<?, ?it/s, v_num=0, train_loss_step=-2.16, train_loss_epoch=-2.11, valid_loss=-2.05]Epoch 128:   0%|          | 0/7 [00:02<?, ?it/s, v_num=0, train_loss_step=-2.16, train_loss_epoch=-2.14, valid_loss=-2.05]Epoch 128:   0%|          | 0/7 [00:02<?, ?it/s, v_num=0, train_loss_step=-2.16, train_loss_epoch=-2.14, valid_loss=-2.05]


[36m(_train_tune pid=24395)[0m /usr/local/lib/python3.10/dist-packages/ray/tune/integration/pytorch_lightning.py:198: `ray.tune.integration.pytorch_lightning.TuneReportCallback` is deprecated. Use `ray.tune.integration.pytorch_lightning.TuneReportCheckpointCallback` instead.
[36m(_train_tune pid=24395)[0m Seed set to 42
[36m(_train_tune pid=24395)[0m GPU available: True (cuda), used: True
[36m(_train_tune pid=24395)[0m TPU available: False, using: 0 TPU cores
[36m(_train_tune pid=24395)[0m HPU available: False, using: 0 HPUs
[36m(_train_tune pid=24395)[0m You are using a CUDA device ('NVIDIA A100-SXM4-40GB') that has Tensor Cores. To properly utilize them, you should set `torch.set_float32_matmul_precision('medium' | 'high')` which will trade-off precision for performance. For more details, read https://pytorch.org/docs/stable/generated/torch.set_float32_matmul_precision.html#torch.set_float32_matmul_precision
[36m(_train_tune pid=24395)[0m 2024-11-12 19:26:19.572183: I t

Sanity Checking: |          | 0/? [00:00<?, ?it/s]
Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
                                                                           
Epoch 0:   0%|          | 0/7 [00:00<?, ?it/s] 
Epoch 1:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.47, train_loss_epoch=-1.47]
Epoch 2:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.27, train_loss_epoch=-1.71]
Epoch 3:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.07, train_loss_epoch=-1.75]
Epoch 4:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.60, train_loss_epoch=-1.75]
Epoch 5:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.10, train_loss_epoch=-1.82]
Epoch 6:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.67, train_loss_epoch=-1.78]
Epoch 7:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.94, train_loss_epoch=-1.86]
Epoch 8:   0%|          | 0/7 [00:00

2024-11-12 19:27:25,452	INFO tensorboardx.py:308 -- Removed the following hyperparameter values when logging to tensorboard: {'hist_exog_list': ('MA(2,9)', 'MA(3,9)', 'MA(1,12)', 'MA(2,12)', 'MA(3,12)', 'MOM(9)', 'MOM(12)', 'RSI(7)', 'RSI(14)', 'EMA(3,9)', 'EMA(5,9)', 'EMA(5,12)', 'DY', 'PTBV', 'P', 'PO', 'VO', 'PE'), 'loss': ('__ref_ph', 'de895953'), 'n_freq_downsample': (168, 24, 1), 'n_pool_kernel_size': (16, 8, 1), 'valid_loss': ('__ref_ph', '004b9a7a')}
[36m(_train_tune pid=24395)[0m `Trainer.fit` stopped: `max_steps=900.0` reached.


[36m(_train_tune pid=24395)[0m 
[36m(_train_tune pid=24395)[0m Validation DataLoader 0: 100%|██████████| 7/7 [00:01<00:00,  3.51it/s][A
[36m(_train_tune pid=24395)[0m                                                                       [AEpoch 128:   0%|          | 0/7 [00:02<?, ?it/s, v_num=0, train_loss_step=-2.16, train_loss_epoch=-2.11, valid_loss=-2.05]Epoch 128:   0%|          | 0/7 [00:02<?, ?it/s, v_num=0, train_loss_step=-2.16, train_loss_epoch=-2.14, valid_loss=-2.05]Epoch 128:   0%|          | 0/7 [00:02<?, ?it/s, v_num=0, train_loss_step=-2.16, train_loss_epoch=-2.14, valid_loss=-2.05]


[36m(_train_tune pid=24764)[0m /usr/local/lib/python3.10/dist-packages/ray/tune/integration/pytorch_lightning.py:198: `ray.tune.integration.pytorch_lightning.TuneReportCallback` is deprecated. Use `ray.tune.integration.pytorch_lightning.TuneReportCheckpointCallback` instead.
[36m(_train_tune pid=24764)[0m Seed set to 42
[36m(_train_tune pid=24764)[0m GPU available: True (cuda), used: True
[36m(_train_tune pid=24764)[0m TPU available: False, using: 0 TPU cores
[36m(_train_tune pid=24764)[0m HPU available: False, using: 0 HPUs
[36m(_train_tune pid=24764)[0m You are using a CUDA device ('NVIDIA A100-SXM4-40GB') that has Tensor Cores. To properly utilize them, you should set `torch.set_float32_matmul_precision('medium' | 'high')` which will trade-off precision for performance. For more details, read https://pytorch.org/docs/stable/generated/torch.set_float32_matmul_precision.html#torch.set_float32_matmul_precision
[36m(_train_tune pid=24764)[0m 2024-11-12 19:27:33.670144: I t

Sanity Checking: |          | 0/? [00:00<?, ?it/s]
Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Epoch 0:   0%|          | 0/7 [00:00<?, ?it/s] 
Epoch 1:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.47, train_loss_epoch=-1.47]
Epoch 2:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.27, train_loss_epoch=-1.71]
Epoch 3:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.07, train_loss_epoch=-1.75]
Epoch 4:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.60, train_loss_epoch=-1.75]
Epoch 5:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.10, train_loss_epoch=-1.82]
Epoch 6:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.67, train_loss_epoch=-1.78]
Epoch 7:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.94, train_loss_epoch=-1.86]
Epoch 8:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.65, train_loss_epoch=-1.82]
Epoch 9: 

[36m(_train_tune pid=24764)[0m `Trainer.fit` stopped: `max_steps=800.0` reached.
2024-11-12 19:28:33,676	INFO tensorboardx.py:308 -- Removed the following hyperparameter values when logging to tensorboard: {'hist_exog_list': ('MA(2,9)', 'MA(3,9)', 'MA(1,12)', 'MA(2,12)', 'MA(3,12)', 'MOM(9)', 'MOM(12)', 'RSI(7)', 'RSI(14)', 'EMA(3,9)', 'EMA(5,9)', 'EMA(5,12)', 'DY', 'PTBV', 'P', 'PO', 'VO', 'PE'), 'loss': ('__ref_ph', 'de895953'), 'n_freq_downsample': (168, 24, 1), 'n_pool_kernel_size': (16, 8, 1), 'valid_loss': ('__ref_ph', '004b9a7a')}
2024-11-12 19:28:33,700	INFO tune.py:1009 -- Wrote the latest version of all result files and experiment state to '/root/ray_results/_train_tune_2024-11-12_18-54-39' in 0.0206s.
2024-11-12 19:28:33,702	ERROR tune.py:1037 -- Trials did not complete: [_train_tune_be5546d3, _train_tune_e2f48f06, _train_tune_65a60f7c, _train_tune_64a1c5ae, _train_tune_d1d0fb02]
INFO:lightning_fabric.utilities.seed:Seed set to 42
INFO:pytorch_lightning.utilities.rank_zero

[36m(_train_tune pid=24764)[0m 
[36m(_train_tune pid=24764)[0m Validation DataLoader 0: 100%|██████████| 7/7 [00:01<00:00,  3.55it/s][A
[36m(_train_tune pid=24764)[0m                                                                       [AEpoch 114:   0%|          | 0/7 [00:02<?, ?it/s, v_num=0, train_loss_step=-2.06, train_loss_epoch=-2.21, valid_loss=-2.04]Epoch 114:   0%|          | 0/7 [00:02<?, ?it/s, v_num=0, train_loss_step=-2.06, train_loss_epoch=-2.11, valid_loss=-2.04]Epoch 114:   0%|          | 0/7 [00:02<?, ?it/s, v_num=0, train_loss_step=-2.06, train_loss_epoch=-2.11, valid_loss=-2.04]



INFO:pytorch_lightning.accelerators.cuda:LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
INFO:pytorch_lightning.callbacks.model_summary:
  | Name         | Type             | Params | Mode 
----------------------------------------------------------
0 | loss         | DistributionLoss | 3      | eval 
1 | padder_train | ConstantPad1d    | 0      | train
2 | scaler       | TemporalNorm     | 0      | train
3 | blocks       | ModuleList       | 3.7 M  | train
----------------------------------------------------------
3.7 M     Trainable params
3         Non-trainable params
3.7 M     Total params
14.882    Total estimated model params size (MB)
33        Modules in train mode
1         Modules in eval mode


Sanity Checking: |          | 0/? [00:00<?, ?it/s]

Training: |          | 0/? [00:00<?, ?it/s]

Validation: |          | 0/? [00:00<?, ?it/s]

Validation: |          | 0/? [00:00<?, ?it/s]

Validation: |          | 0/? [00:00<?, ?it/s]

Validation: |          | 0/? [00:00<?, ?it/s]

Validation: |          | 0/? [00:00<?, ?it/s]

Validation: |          | 0/? [00:00<?, ?it/s]

Validation: |          | 0/? [00:00<?, ?it/s]

Validation: |          | 0/? [00:00<?, ?it/s]

Validation: |          | 0/? [00:00<?, ?it/s]

INFO:pytorch_lightning.utilities.rank_zero:`Trainer.fit` stopped: `max_steps=900.0` reached.
INFO:pytorch_lightning.utilities.rank_zero:GPU available: True (cuda), used: True
INFO:pytorch_lightning.utilities.rank_zero:TPU available: False, using: 0 TPU cores
INFO:pytorch_lightning.utilities.rank_zero:HPU available: False, using: 0 HPUs
INFO:pytorch_lightning.accelerators.cuda:LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]


Predicting: |          | 0/? [00:00<?, ?it/s]

Horizon 20 CV Minutes: 73.07346337238947


# Modelling half (12 years total, 6 train, 2 val, 4 test)

In [None]:
from neuralforecast.core import NeuralForecast
from ray import tune
from ray.tune.search.hyperopt import HyperOptSearch
from neuralforecast.losses.pytorch import DistributionLoss
from neuralforecast.auto import  AutoNHITS

In [None]:
# Load the S&P 500 panel, parse the timestamp column, halve the width of the
# 64-bit numeric columns to save memory, and expose the target column as 'y'.
df = (
    pd.read_csv('Data/S&P500/3ProSP500.csv')
    .assign(ds=lambda frame: pd.to_datetime(frame['ds']))
    .pipe(lambda frame: frame.astype({
        **dict.fromkeys(frame.select_dtypes('int64').columns, 'int32'),
        **dict.fromkeys(frame.select_dtypes('float64').columns, 'float32'),
    }))
    .rename(columns={'840E': 'y'})
)
df.info()

<class 'pandas.core.frame.DataFrame'>
RangeIndex: 2008545 entries, 0 to 2008544
Data columns (total 21 columns):
 #   Column     Dtype         
---  ------     -----         
 0   unique_id  object        
 1   ds         datetime64[ns]
 2   y          float32       
 3   MA(2,9)    int32         
 4   MA(3,9)    int32         
 5   MA(1,12)   int32         
 6   MA(2,12)   int32         
 7   MA(3,12)   int32         
 8   MOM(9)     int32         
 9   MOM(12)    int32         
 10  RSI(7)     int32         
 11  RSI(14)    int32         
 12  EMA(3,9)   int32         
 13  EMA(5,9)   int32         
 14  EMA(5,12)  int32         
 15  DY         float32       
 16  PTBV       float32       
 17  P          float32       
 18  PO         float32       
 19  VO         float32       
 20  PE         float32       
dtypes: datetime64[ns](1), float32(7), int32(12), object(1)
memory usage: 176.2+ MB


In [None]:
# First and last calendar year present in the data, then the inclusive span.
first_year, last_year = df['ds'].min().year, df['ds'].max().year
print(first_year, last_year)
print(last_year - first_year + 1)

2004 2023
20


In [None]:
# Shift the first observed date forward by 8 calendar years (same month and day)
# and keep only the rows on or after it.
# NOTE: `df` is overwritten, so re-running this cell trims a further 8 years.
first_day = df['ds'].min()
starting_year = first_day.year + 8
new_start_date = pd.Timestamp(year=starting_year, month=first_day.month, day=first_day.day)
df = df[df['ds'] >= new_start_date]

# Sanity check: remaining year range and its inclusive length.
first_year, last_year = df['ds'].min().year, df['ds'].max().year
print(first_year, last_year)
print(last_year - first_year + 1)

2012 2023
12


In [None]:
# Inclusive calendar bounds of the two hold-out windows.
start_2020_2023, end_2020_2023 = '2020-01-01', '2023-12-31'
start_2018_2019, end_2018_2019 = '2018-01-01', '2019-12-31'

# Distinct calendar days observed inside each window.
in_2020_2023 = df['ds'].between(start_2020_2023, end_2020_2023)
in_2018_2019 = df['ds'].between(start_2018_2019, end_2018_2019)
unique_days_2020_2023 = df.loc[in_2020_2023, 'ds'].dt.date.unique()
unique_days_2018_2019 = df.loc[in_2018_2019, 'ds'].dt.date.unique()

count_unique_days_2020_2023 = len(unique_days_2020_2023)
count_unique_days_2018_2019 = len(unique_days_2018_2019)

# Small table summarising the day count of each window.
summary_counts = pd.DataFrame(
    [
        ('2020-2023', count_unique_days_2020_2023),
        ('2018-2019', count_unique_days_2018_2019),
    ],
    columns=['Period', 'Unique Days Covered'],
)
summary_counts

Unnamed: 0,Period,Unique Days Covered
0,2020-2023,1043
1,2018-2019,522


In [None]:
# Every column except the id, timestamp and target is an exogenous feature.
exog_list = df.columns.tolist()
for non_feature in ('ds', 'y', 'unique_id'):
    exog_list.remove(non_feature)

# Run configuration handed to the trainer below.
horizons = [1, 5, 10, 20]   # forecast horizons, one tuning run each
levels = [90]               # level passed to the distribution loss
val_size, test_size = count_unique_days_2018_2019, count_unique_days_2020_2023

In [None]:
import os
from time import time

class AutoNHITSTrainer:
    """Tune, cross-validate and persist two AutoNHITS models per horizon ('8TY' run).

    For every horizon two AutoNHITS models are tuned: model 0 on the target
    history alone and model 1 with ``exog_list`` as historical exogenous
    inputs. Both are cross-validated together and the fitted models, the
    hyperparameter-search tables and the predictions are written to disk.
    All paths are relative to the current working directory.

    Args:
        horizons: Iterable of forecast horizons to train, one run each.
        levels: Levels passed to ``DistributionLoss(level=...)``.
        exog_list: Column names used as ``hist_exog_list`` for model 1.
        df: Long-format frame handed to ``NeuralForecast.cross_validation``.
        val_size: ``val_size`` argument of ``cross_validation``.
        test_size: ``test_size`` argument of ``cross_validation``.
    """

    def __init__(self, horizons, levels, exog_list, df, val_size, test_size):
        self.horizons = horizons
        self.levels = levels
        self.exog_list = exog_list
        self.df = df
        self.val_size = val_size
        self.test_size = test_size

    def _artifact_paths(self, horizon):
        """Return ``(model_dir, predictions_csv)`` for ``horizon``.

        Single source of truth shared by the existence check and the save
        step, so the two can never look at different locations.
        """
        model_path = f'Trained Models/AutoNHITS/8TYhorizon_{horizon}/'
        output_csv = f'Data/Test/horizon_{horizon}/8TYnhits_model0_1_horizon_{horizon}.csv'
        return model_path, output_csv

    def check_existing_files(self, horizon):
        """Return True when both the model directory and the predictions CSV exist."""
        model_path, output_csv = self._artifact_paths(horizon)
        return os.path.exists(model_path) and os.path.exists(output_csv)

    def save_results(self, nf, horizon, Y_hat_df):
        """Persist the HPO tables, the fitted models and the predictions.

        Args:
            nf: Fitted ``NeuralForecast`` object; each entry of ``nf.models``
                must expose ``results.get_dataframe()``.
            horizon: Horizon the artefacts belong to (part of every path).
            Y_hat_df: Cross-validation predictions. Its float32 columns are
                cast to float16 IN PLACE before writing to shrink the CSV.
        """
        model_path, output_csv = self._artifact_paths(horizon)

        # Create every target directory up front so a missing folder cannot
        # abort the save after a long tuning run.
        os.makedirs(model_path, exist_ok=True)
        os.makedirs(os.path.dirname(output_csv), exist_ok=True)

        # One hyperparameter-search table per tuned model.
        for idx, model in enumerate(nf.models):
            hpo = f'HPO/horizon_{horizon}/8TYnhits_model{idx}_horizon_{horizon}_hpo.csv'
            os.makedirs(os.path.dirname(hpo), exist_ok=True)
            results = model.results.get_dataframe()
            results.to_csv(hpo, index=False)

        nf.save(path=model_path, model_index=None, overwrite=True, save_dataset=False)

        # float16 keeps only about three significant digits; accepted here to
        # keep the prediction file small.
        for col in Y_hat_df.select_dtypes(include='float32').columns:
            Y_hat_df[col] = Y_hat_df[col].astype('float16')

        Y_hat_df.to_csv(output_csv, index=False)

    def configure_models(self, horizon):
        """Build the two AutoNHITS models for ``horizon``.

        Returns:
            Tuple ``(nhits_model0, nhits_model1)``: model 0 uses the default
            search space, model 1 additionally sets ``hist_exog_list``.
        """
        # Each rate appears exactly once so that no value is over-weighted
        # when the search samples from the list.
        learning_rates = [0.01, 0.005, 0.001, 0.0005, 0.0001, 0.00005, 0.00001]

        # Model 0 Configuration: target history only.
        nhits_config0 = AutoNHITS.get_default_config(h=horizon, backend="ray")
        nhits_config0['random_seed'] = 42
        nhits_config0['learning_rate'] = tune.choice(learning_rates)

        # Model 1 Configuration: same search space plus historical exogenous features.
        nhits_config1 = AutoNHITS.get_default_config(h=horizon, backend="ray")
        nhits_config1['hist_exog_list'] = self.exog_list
        nhits_config1['random_seed'] = 42
        nhits_config1['learning_rate'] = tune.choice(learning_rates)

        # Instantiate the models
        nhits_model0 = AutoNHITS(h=horizon,
                                 config=nhits_config0,
                                 search_alg=HyperOptSearch(), num_samples=30,
                                 backend='ray',
                                 loss=DistributionLoss(distribution='StudentT', level=self.levels),
                                 cpus=12, gpus=1)

        nhits_model1 = AutoNHITS(h=horizon,
                                 config=nhits_config1,
                                 search_alg=HyperOptSearch(), num_samples=30,
                                 backend='ray',
                                 loss=DistributionLoss(distribution='StudentT', level=self.levels),
                                 cpus=12, gpus=1)

        return nhits_model0, nhits_model1

    def run_training(self):
        """Tune, cross-validate and save every horizon that has no saved artefacts yet."""
        for horizon in self.horizons:
            if self.check_existing_files(horizon):
                print(f"Horizon {horizon}: Model and CSV already exist. Skipping this run.")
                continue

            # Configure the models
            nhits_model0, nhits_model1 = self.configure_models(horizon)

            # Start training and cross-validation
            init = time()
            nf = NeuralForecast(models=[nhits_model0, nhits_model1], freq='B')
            Y_hat_df = nf.cross_validation(df=self.df,
                                           val_size=self.val_size,
                                           test_size=self.test_size,
                                           n_windows=None)

            # Save results
            self.save_results(nf, horizon, Y_hat_df)

            # Log the time taken (includes the time spent saving)
            end = time()
            print(f'Horizon {horizon} CV Minutes: {(end - init) / 60}')

In [None]:
# Build the trainer from the configuration cells above and run every horizon.
trainer = AutoNHITSTrainer(
    horizons=horizons,
    levels=levels,
    exog_list=exog_list,
    df=df,
    val_size=val_size,
    test_size=test_size,
)
trainer.run_training()

+--------------------------------------------------------------------+
| Configuration for experiment     _train_tune_2024-11-13_20-14-28   |
+--------------------------------------------------------------------+
| Search algorithm                 SearchGenerator                   |
| Scheduler                        FIFOScheduler                     |
| Number of trials                 30                                |
+--------------------------------------------------------------------+

View detailed results here: /root/ray_results/_train_tune_2024-11-13_20-14-28
To visualize your results with TensorBoard, run: `tensorboard --logdir /tmp/ray/session_2024-11-13_11-38-37_188179_3696/artifacts/2024-11-13_20-14-28/_train_tune_2024-11-13_20-14-28/driver_artifacts`


[36m(_train_tune pid=159411)[0m /usr/local/lib/python3.10/dist-packages/ray/tune/integration/pytorch_lightning.py:198: `ray.tune.integration.pytorch_lightning.TuneReportCallback` is deprecated. Use `ray.tune.integration.pytorch_lightning.TuneReportCheckpointCallback` instead.
[36m(_train_tune pid=159411)[0m Seed set to 42
[36m(_train_tune pid=159411)[0m GPU available: True (cuda), used: True
[36m(_train_tune pid=159411)[0m TPU available: False, using: 0 TPU cores
[36m(_train_tune pid=159411)[0m HPU available: False, using: 0 HPUs
[36m(_train_tune pid=159411)[0m You are using a CUDA device ('NVIDIA A100-SXM4-40GB') that has Tensor Cores. To properly utilize them, you should set `torch.set_float32_matmul_precision('medium' | 'high')` which will trade-off precision for performance. For more details, read https://pytorch.org/docs/stable/generated/torch.set_float32_matmul_precision.html#torch.set_float32_matmul_precision
[36m(_train_tune pid=159411)[0m 2024-11-13 20:14:35.8197

Sanity Checking: |          | 0/? [00:00<?, ?it/s]
Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Epoch 0:   0%|          | 0/2 [00:00<?, ?it/s] 
Epoch 0: 100%|██████████| 2/2 [00:00<00:00,  6.62it/s, v_num=0, train_loss_step=0.874]
Epoch 1:   0%|          | 0/2 [00:00<?, ?it/s, v_num=0, train_loss_step=0.874, train_loss_epoch=0.919]
Epoch 2:   0%|          | 0/2 [00:00<?, ?it/s, v_num=0, train_loss_step=0.680, train_loss_epoch=0.732]
Epoch 3:   0%|          | 0/2 [00:00<?, ?it/s, v_num=0, train_loss_step=0.497, train_loss_epoch=0.555]
Epoch 4:   0%|          | 0/2 [00:00<?, ?it/s, v_num=0, train_loss_step=0.299, train_loss_epoch=0.352]
Epoch 5:   0%|          | 0/2 [00:00<?, ?it/s, v_num=0, train_loss_step=0.0705, train_loss_epoch=0.133]
Epoch 6:   0%|          | 0/2 [00:00<?, ?it/s, v_num=0, train_loss_step=-0.195, train_loss_epoch=-0.128]
Epoch 7:   0%|          | 0/2 [00:00<?, ?it/s, v_num=0, train_loss_step=-0.494, train_loss_epoch=-0.417]
Epoch 8:   0%|      

2024-11-13 20:14:51,607	INFO tune.py:1009 -- Wrote the latest version of all result files and experiment state to '/root/ray_results/_train_tune_2024-11-13_20-14-28' in 0.0098s.


Epoch 68:   0%|          | 0/2 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.34, train_loss_epoch=-1.34, valid_loss=-1.33]
Epoch 69:   0%|          | 0/2 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.32, train_loss_epoch=-1.33, valid_loss=-1.33]
Epoch 70:   0%|          | 0/2 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.34, train_loss_epoch=-1.32, valid_loss=-1.33]
Epoch 71:   0%|          | 0/2 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.34, train_loss_epoch=-1.34, valid_loss=-1.33]
Epoch 72:   0%|          | 0/2 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.34, train_loss_epoch=-1.34, valid_loss=-1.33]
Epoch 73:   0%|          | 0/2 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.34, train_loss_epoch=-1.34, valid_loss=-1.33]
Epoch 74:   0%|          | 0/2 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.35, train_loss_epoch=-1.34, valid_loss=-1.33]
Epoch 75:   0%|          | 0/2 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.32, train_loss_epoch=-1.32, valid_loss=-1.33]
Epoch 76:   0%|         

Resume experiment with: Tuner.restore(path="/root/ray_results/_train_tune_2024-11-13_20-14-28", trainable=...)
- _train_tune_d6792489: FileNotFoundError('Could not fetch metrics for _train_tune_d6792489: both result.json and progress.csv were not found at /root/ray_results/_train_tune_2024-11-13_20-14-28/_train_tune_d6792489_2_batch_size=128,h=1,input_size=2,learning_rate=0.0005,loss=ref_ph_de895953,max_steps=600.0000,n_freq_downsam_2024-11-13_20-14-35')
INFO:lightning_fabric.utilities.seed:Seed set to 42
INFO:pytorch_lightning.utilities.rank_zero:GPU available: True (cuda), used: True
INFO:pytorch_lightning.utilities.rank_zero:TPU available: False, using: 0 TPU cores
INFO:pytorch_lightning.utilities.rank_zero:HPU available: False, using: 0 HPUs



[36m(_train_tune pid=159411)[0m 
[36m(_train_tune pid=159411)[0m Validation DataLoader 0: 100%|██████████| 2/2 [00:00<00:00,  5.21it/s][A


INFO:pytorch_lightning.accelerators.cuda:LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
INFO:pytorch_lightning.callbacks.model_summary:
  | Name         | Type             | Params | Mode 
----------------------------------------------------------
0 | loss         | DistributionLoss | 3      | eval 
1 | padder_train | ConstantPad1d    | 0      | train
2 | scaler       | TemporalNorm     | 0      | train
3 | blocks       | ModuleList       | 2.4 M  | train
----------------------------------------------------------
2.4 M     Trainable params
3         Non-trainable params
2.4 M     Total params
9.493     Total estimated model params size (MB)
33        Modules in train mode
1         Modules in eval mode


Sanity Checking: |          | 0/? [00:00<?, ?it/s]

Training: |          | 0/? [00:00<?, ?it/s]

# Modelling Technical Indicators (20 years total, 14 train, 2 val, 4 test)

In [None]:
from neuralforecast.core import NeuralForecast
from ray import tune
from ray.tune.search.hyperopt import HyperOptSearch
from neuralforecast.losses.pytorch import DistributionLoss
from neuralforecast.auto import AutoNHITS

In [None]:
# Identifier, timestamp, target and the technical-indicator columns only.
selected_columns = [
    'unique_id', 'ds', 'y', 'MA(2,9)', 'MA(3,9)', 'MA(1,12)',
    'MA(2,12)', 'MA(3,12)', 'MOM(9)', 'MOM(12)', 'RSI(7)',
    'RSI(14)', 'EMA(3,9)', 'EMA(5,9)', 'EMA(5,12)'
]

# Load the panel, parse timestamps, halve the width of 64-bit numeric columns,
# expose the target as 'y', then keep the selected columns.
df = (
    pd.read_csv('Data/S&P500/3ProSP500.csv')
    .assign(ds=lambda frame: pd.to_datetime(frame['ds']))
    .pipe(lambda frame: frame.astype({
        **dict.fromkeys(frame.select_dtypes('int64').columns, 'int32'),
        **dict.fromkeys(frame.select_dtypes('float64').columns, 'float32'),
    }))
    .rename(columns={'840E': 'y'})
    .loc[:, selected_columns]
)

df.info()

<class 'pandas.core.frame.DataFrame'>
RangeIndex: 2008545 entries, 0 to 2008544
Data columns (total 15 columns):
 #   Column     Dtype         
---  ------     -----         
 0   unique_id  object        
 1   ds         datetime64[ns]
 2   y          float32       
 3   MA(2,9)    int32         
 4   MA(3,9)    int32         
 5   MA(1,12)   int32         
 6   MA(2,12)   int32         
 7   MA(3,12)   int32         
 8   MOM(9)     int32         
 9   MOM(12)    int32         
 10  RSI(7)     int32         
 11  RSI(14)    int32         
 12  EMA(3,9)   int32         
 13  EMA(5,9)   int32         
 14  EMA(5,12)  int32         
dtypes: datetime64[ns](1), float32(1), int32(12), object(1)
memory usage: 130.3+ MB


In [None]:
# Inclusive calendar bounds of the two hold-out windows.
start_2020_2023, end_2020_2023 = '2020-01-01', '2023-12-31'
start_2018_2019, end_2018_2019 = '2018-01-01', '2019-12-31'

# Distinct calendar days observed inside each window.
in_2020_2023 = df['ds'].between(start_2020_2023, end_2020_2023)
in_2018_2019 = df['ds'].between(start_2018_2019, end_2018_2019)
unique_days_2020_2023 = df.loc[in_2020_2023, 'ds'].dt.date.unique()
unique_days_2018_2019 = df.loc[in_2018_2019, 'ds'].dt.date.unique()

count_unique_days_2020_2023 = len(unique_days_2020_2023)
count_unique_days_2018_2019 = len(unique_days_2018_2019)

# Small table summarising the day count of each window.
summary_counts = pd.DataFrame(
    [
        ('2020-2023', count_unique_days_2020_2023),
        ('2018-2019', count_unique_days_2018_2019),
    ],
    columns=['Period', 'Unique Days Covered'],
)
summary_counts

Unnamed: 0,Period,Unique Days Covered
0,2020-2023,1043
1,2018-2019,522


In [None]:
# Every column except the id, timestamp and target is an exogenous feature.
exog_list = df.columns.tolist()
for non_feature in ('ds', 'y', 'unique_id'):
    exog_list.remove(non_feature)
exog_list

['MA(2,9)',
 'MA(3,9)',
 'MA(1,12)',
 'MA(2,12)',
 'MA(3,12)',
 'MOM(9)',
 'MOM(12)',
 'RSI(7)',
 'RSI(14)',
 'EMA(3,9)',
 'EMA(5,9)',
 'EMA(5,12)']

In [None]:
# Run configuration handed to the trainer below.
horizons = [1, 5, 10, 20]   # forecast horizons, one tuning run each
levels = [90]               # level passed to the distribution loss
val_size, test_size = count_unique_days_2018_2019, count_unique_days_2020_2023

In [None]:
import os
from time import time

class AutoNHITSTrainer:
    """Tune, cross-validate and persist one AutoNHITS model per horizon ('TECH' run).

    The model uses ``exog_list`` as historical exogenous inputs. For every
    horizon the fitted model, its hyperparameter-search table and the
    cross-validation predictions are written to disk. All paths are relative
    to the current working directory.

    Args:
        horizons: Iterable of forecast horizons to train, one run each.
        levels: Levels passed to ``DistributionLoss(level=...)``.
        exog_list: Column names used as ``hist_exog_list``.
        df: Long-format frame handed to ``NeuralForecast.cross_validation``.
        val_size: ``val_size`` argument of ``cross_validation``.
        test_size: ``test_size`` argument of ``cross_validation``.
    """

    def __init__(self, horizons, levels, exog_list, df, val_size, test_size):
        self.horizons = horizons
        self.levels = levels
        self.exog_list = exog_list
        self.df = df
        self.val_size = val_size
        self.test_size = test_size

    def check_existing_files(self, horizon):
        """Return True when both the model directory and the predictions CSV exist."""
        model_path = f'Trained Models/AutoNHITS/TECHhorizon_{horizon}/'
        output_csv = f'Data/Test/horizon_{horizon}/TECHnhits_model1_horizon_{horizon}.csv'
        return os.path.exists(model_path) and os.path.exists(output_csv)

    def save_results(self, nf, horizon, Y_hat_df):
        """Persist the HPO table, the fitted model and the predictions.

        Args:
            nf: Fitted ``NeuralForecast`` object; ``nf.models[0]`` must expose
                ``results.get_dataframe()``.
            horizon: Horizon the artefacts belong to (part of every path).
            Y_hat_df: Cross-validation predictions. Its float32 columns are
                cast to float16 IN PLACE before writing to shrink the CSV.
        """
        model_path = f'Trained Models/AutoNHITS/TECHhorizon_{horizon}/'
        output_csv = f'Data/Test/horizon_{horizon}/TECHnhits_model1_horizon_{horizon}.csv'
        hpo = f'HPO/horizon_{horizon}/TECHnhits_model1_horizon_{horizon}_hpo.csv'

        # Create every target directory up front so a missing folder cannot
        # abort the save after a long tuning run.
        for target_dir in (model_path, os.path.dirname(output_csv), os.path.dirname(hpo)):
            os.makedirs(target_dir, exist_ok=True)

        # Save the model, predictions and hyperparameter search
        results = nf.models[0].results.get_dataframe()
        results.to_csv(hpo, index=False)

        nf.save(path=model_path, model_index=None, overwrite=True, save_dataset=False)

        # float16 keeps only about three significant digits; accepted here to
        # keep the prediction file small.
        for col in Y_hat_df.select_dtypes(include='float32').columns:
            Y_hat_df[col] = Y_hat_df[col].astype('float16')

        Y_hat_df.to_csv(output_csv, index=False)

    def configure_model(self, horizon):
        """Build the AutoNHITS model (with historical exogenous inputs) for ``horizon``."""
        nhits_config = AutoNHITS.get_default_config(h=horizon, backend="ray")
        nhits_config['hist_exog_list'] = self.exog_list
        nhits_config['random_seed'] = 42
        nhits_config['learning_rate'] = tune.choice([0.01, 0.005, 0.001, 0.0005, 0.0001, 0.00005, 0.00001])

        # Instantiate the model
        nhits_model = AutoNHITS(h=horizon,
                                config=nhits_config,
                                search_alg=HyperOptSearch(), num_samples=30,
                                backend='ray',
                                loss=DistributionLoss(distribution='StudentT', level=self.levels),
                                cpus=12, gpus=1)

        return nhits_model

    def run_training(self):
        """Tune, cross-validate and save every horizon that has no saved artefacts yet."""
        for horizon in self.horizons:
            if self.check_existing_files(horizon):
                print(f"Horizon {horizon}: Model and CSV already exist. Skipping this run.")
                continue

            # Configure the model
            nhits_model = self.configure_model(horizon)

            # Start training and cross-validation
            init = time()
            nf = NeuralForecast(models=[nhits_model], freq='B')
            Y_hat_df = nf.cross_validation(df=self.df,
                                           val_size=self.val_size,
                                           test_size=self.test_size,
                                           n_windows=None)

            # Save results
            self.save_results(nf, horizon, Y_hat_df)

            # Log the time taken (includes the time spent saving)
            end = time()
            print(f'Horizon {horizon} CV Minutes: {(end - init) / 60}')

In [None]:
# Build the trainer from the configuration cells above and run every horizon.
trainer = AutoNHITSTrainer(
    horizons=horizons,
    levels=levels,
    exog_list=exog_list,
    df=df,
    val_size=val_size,
    test_size=test_size,
)
trainer.run_training()

Output hidden; open in https://colab.research.google.com to view.

# Modelling Firm Indicators (20 years total, 14 train, 2 val, 4 test)

In [3]:
from neuralforecast.core import NeuralForecast
from ray import tune
from ray.tune.search.hyperopt import HyperOptSearch
from neuralforecast.losses.pytorch import DistributionLoss
from neuralforecast.auto import AutoNHITS

In [4]:
# Identifier, timestamp, target and the firm-level indicator columns only.
selected_columns = ['unique_id', 'ds', 'y', 'DY',  'PTBV',  'P',  'PO',  'VO',  'PE']

# Load the panel, parse timestamps, halve the width of 64-bit numeric columns,
# expose the target as 'y', then keep the selected columns.
df = (
    pd.read_csv('Data/S&P500/3ProSP500.csv')
    .assign(ds=lambda frame: pd.to_datetime(frame['ds']))
    .pipe(lambda frame: frame.astype({
        **dict.fromkeys(frame.select_dtypes('int64').columns, 'int32'),
        **dict.fromkeys(frame.select_dtypes('float64').columns, 'float32'),
    }))
    .rename(columns={'840E': 'y'})
    .loc[:, selected_columns]
)

df.info()

<class 'pandas.core.frame.DataFrame'>
RangeIndex: 2008545 entries, 0 to 2008544
Data columns (total 9 columns):
 #   Column     Dtype         
---  ------     -----         
 0   unique_id  object        
 1   ds         datetime64[ns]
 2   y          float32       
 3   DY         float32       
 4   PTBV       float32       
 5   P          float32       
 6   PO         float32       
 7   VO         float32       
 8   PE         float32       
dtypes: datetime64[ns](1), float32(7), object(1)
memory usage: 84.3+ MB


In [5]:
# First and last calendar year present in the data, then the inclusive span.
first_year, last_year = df['ds'].min().year, df['ds'].max().year
print(first_year, last_year)
print(last_year - first_year + 1)

2004 2023
20


In [6]:
# Inclusive calendar bounds of the two hold-out windows.
start_2020_2023, end_2020_2023 = '2020-01-01', '2023-12-31'
start_2018_2019, end_2018_2019 = '2018-01-01', '2019-12-31'

# Distinct calendar days observed inside each window.
in_2020_2023 = df['ds'].between(start_2020_2023, end_2020_2023)
in_2018_2019 = df['ds'].between(start_2018_2019, end_2018_2019)
unique_days_2020_2023 = df.loc[in_2020_2023, 'ds'].dt.date.unique()
unique_days_2018_2019 = df.loc[in_2018_2019, 'ds'].dt.date.unique()

count_unique_days_2020_2023 = len(unique_days_2020_2023)
count_unique_days_2018_2019 = len(unique_days_2018_2019)

# Small table summarising the day count of each window.
summary_counts = pd.DataFrame(
    [
        ('2020-2023', count_unique_days_2020_2023),
        ('2018-2019', count_unique_days_2018_2019),
    ],
    columns=['Period', 'Unique Days Covered'],
)
summary_counts

Unnamed: 0,Period,Unique Days Covered
0,2020-2023,1043
1,2018-2019,522


In [7]:
# Every column except the id, timestamp and target is an exogenous feature.
exog_list = df.columns.tolist()
for non_feature in ('ds', 'y', 'unique_id'):
    exog_list.remove(non_feature)
exog_list

['DY', 'PTBV', 'P', 'PO', 'VO', 'PE']

In [8]:
# Run configuration handed to the trainer below.
horizons = [1, 5, 10, 20]   # forecast horizons, one tuning run each
levels = [90]               # level passed to the distribution loss
val_size, test_size = count_unique_days_2018_2019, count_unique_days_2020_2023

In [9]:
import os
from time import time

class AutoNHITSTrainer:
    """Tune, cross-validate and persist one AutoNHITS model per horizon ('FIRM' run).

    The model uses ``exog_list`` as historical exogenous inputs. For every
    horizon the fitted model, its hyperparameter-search table and the
    cross-validation predictions are written to disk. All paths are relative
    to the current working directory.

    Args:
        horizons: Iterable of forecast horizons to train, one run each.
        levels: Levels passed to ``DistributionLoss(level=...)``.
        exog_list: Column names used as ``hist_exog_list``.
        df: Long-format frame handed to ``NeuralForecast.cross_validation``.
        val_size: ``val_size`` argument of ``cross_validation``.
        test_size: ``test_size`` argument of ``cross_validation``.
    """

    def __init__(self, horizons, levels, exog_list, df, val_size, test_size):
        self.horizons = horizons
        self.levels = levels
        self.exog_list = exog_list
        self.df = df
        self.val_size = val_size
        self.test_size = test_size

    def check_existing_files(self, horizon):
        """Return True when both the model directory and the predictions CSV exist."""
        model_path = f'Trained Models/AutoNHITS/FIRMhorizon_{horizon}/'
        output_csv = f'Data/Test/horizon_{horizon}/FIRMnhits_model1_horizon_{horizon}.csv'
        return os.path.exists(model_path) and os.path.exists(output_csv)

    def save_results(self, nf, horizon, Y_hat_df):
        """Persist the HPO table, the fitted model and the predictions.

        Args:
            nf: Fitted ``NeuralForecast`` object; ``nf.models[0]`` must expose
                ``results.get_dataframe()``.
            horizon: Horizon the artefacts belong to (part of every path).
            Y_hat_df: Cross-validation predictions. Its float32 columns are
                cast to float16 IN PLACE before writing to shrink the CSV.
        """
        model_path = f'Trained Models/AutoNHITS/FIRMhorizon_{horizon}/'
        output_csv = f'Data/Test/horizon_{horizon}/FIRMnhits_model1_horizon_{horizon}.csv'
        hpo = f'HPO/horizon_{horizon}/FIRMnhits_model1_horizon_{horizon}_hpo.csv'

        # Create every target directory up front so a missing folder cannot
        # abort the save after a long tuning run.
        for target_dir in (model_path, os.path.dirname(output_csv), os.path.dirname(hpo)):
            os.makedirs(target_dir, exist_ok=True)

        # Save the model, predictions and hyperparameter search
        results = nf.models[0].results.get_dataframe()
        results.to_csv(hpo, index=False)

        nf.save(path=model_path, model_index=None, overwrite=True, save_dataset=False)

        # float16 keeps only about three significant digits; accepted here to
        # keep the prediction file small.
        for col in Y_hat_df.select_dtypes(include='float32').columns:
            Y_hat_df[col] = Y_hat_df[col].astype('float16')

        Y_hat_df.to_csv(output_csv, index=False)

    def configure_model(self, horizon):
        """Build the AutoNHITS model (with historical exogenous inputs) for ``horizon``."""
        nhits_config = AutoNHITS.get_default_config(h=horizon, backend="ray")
        nhits_config['hist_exog_list'] = self.exog_list
        nhits_config['random_seed'] = 42
        nhits_config['learning_rate'] = tune.choice([0.01, 0.005, 0.001, 0.0005, 0.0001, 0.00005, 0.00001])

        # Instantiate the model
        nhits_model = AutoNHITS(h=horizon,
                                config=nhits_config,
                                search_alg=HyperOptSearch(), num_samples=30,
                                backend='ray',
                                loss=DistributionLoss(distribution='StudentT', level=self.levels),
                                cpus=12, gpus=1)

        return nhits_model

    def run_training(self):
        """Tune, cross-validate and save every horizon that has no saved artefacts yet."""
        for horizon in self.horizons:
            if self.check_existing_files(horizon):
                print(f"Horizon {horizon}: Model and CSV already exist. Skipping this run.")
                continue

            # Configure the model
            nhits_model = self.configure_model(horizon)

            # Start training and cross-validation
            init = time()
            nf = NeuralForecast(models=[nhits_model], freq='B')
            Y_hat_df = nf.cross_validation(df=self.df,
                                           val_size=self.val_size,
                                           test_size=self.test_size,
                                           n_windows=None)

            # Save results
            self.save_results(nf, horizon, Y_hat_df)

            # Log the time taken (includes the time spent saving)
            end = time()
            print(f'Horizon {horizon} CV Minutes: {(end - init) / 60}')

In [None]:
# Build the trainer from the configuration cells above and run every horizon.
trainer = AutoNHITSTrainer(
    horizons=horizons,
    levels=levels,
    exog_list=exog_list,
    df=df,
    val_size=val_size,
    test_size=test_size,
)
trainer.run_training()

Horizon 1: Model and CSV already exist. Skipping this run.
Horizon 5: Model and CSV already exist. Skipping this run.
Horizon 10: Model and CSV already exist. Skipping this run.


2024-11-18 13:03:36,165	INFO worker.py:1819 -- Started a local Ray instance.
2024-11-18 13:03:37,350	INFO tune.py:253 -- Initializing Ray automatically. For cluster usage or custom Ray initialization, call `ray.init(...)` before `Tuner(...)`.


+--------------------------------------------------------------------+
| Configuration for experiment     _train_tune_2024-11-18_13-03-34   |
+--------------------------------------------------------------------+
| Search algorithm                 SearchGenerator                   |
| Scheduler                        FIFOScheduler                     |
| Number of trials                 30                                |
+--------------------------------------------------------------------+

View detailed results here: /root/ray_results/_train_tune_2024-11-18_13-03-34
To visualize your results with TensorBoard, run: `tensorboard --logdir /tmp/ray/session_2024-11-18_13-03-34_336407_4396/artifacts/2024-11-18_13-03-37/_train_tune_2024-11-18_13-03-34/driver_artifacts`


[36m(_train_tune pid=5856)[0m /usr/local/lib/python3.10/dist-packages/ray/tune/integration/pytorch_lightning.py:198: `ray.tune.integration.pytorch_lightning.TuneReportCallback` is deprecated. Use `ray.tune.integration.pytorch_lightning.TuneReportCheckpointCallback` instead.
[36m(_train_tune pid=5856)[0m Seed set to 42
[36m(_train_tune pid=5856)[0m GPU available: True (cuda), used: True
[36m(_train_tune pid=5856)[0m TPU available: False, using: 0 TPU cores
[36m(_train_tune pid=5856)[0m HPU available: False, using: 0 HPUs
[36m(_train_tune pid=5856)[0m You are using a CUDA device ('NVIDIA A100-SXM4-40GB') that has Tensor Cores. To properly utilize them, you should set `torch.set_float32_matmul_precision('medium' | 'high')` which will trade-off precision for performance. For more details, read https://pytorch.org/docs/stable/generated/torch.set_float32_matmul_precision.html#torch.set_float32_matmul_precision
[36m(_train_tune pid=5856)[0m 2024-11-18 13:03:45.302446: I tensorfl

Sanity Checking: |          | 0/? [00:00<?, ?it/s]
Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Epoch 0:   0%|          | 0/13 [00:00<?, ?it/s] 
Epoch 1:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.10, train_loss_epoch=-0.888]
Epoch 2:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.67, train_loss_epoch=-1.16]
Epoch 3:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.35, train_loss_epoch=-1.13]
Epoch 4:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-0.984, train_loss_epoch=-1.17]
Epoch 5:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.50, train_loss_epoch=-1.21]
Epoch 6:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.06, train_loss_epoch=-1.17]
Epoch 7:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-0.842, train_loss_epoch=-1.15]
[36m(_train_tune pid=5856)[0m 
Validation: |          | 0/? [00:00<?, ?it/s][A
Validation:   0%|  

2024-11-18 13:04:07,151	INFO tensorboardx.py:308 -- Removed the following hyperparameter values when logging to tensorboard: {'hist_exog_list': ('DY', 'PTBV', 'P', 'PO', 'VO', 'PE'), 'loss': ('__ref_ph', 'de895953'), 'n_freq_downsample': (40, 20, 1), 'n_pool_kernel_size': (2, 2, 2), 'valid_loss': ('__ref_ph', '004b9a7a')}


[36m(_train_tune pid=5856)[0m 
[36m(_train_tune pid=5856)[0m Validation: |          | 0/? [00:00<?, ?it/s][A
[36m(_train_tune pid=5856)[0m Validation:   0%|          | 0/13 [00:00<?, ?it/s][A
[36m(_train_tune pid=5856)[0m Validation DataLoader 0:   0%|          | 0/13 [00:00<?, ?it/s][A


[36m(_train_tune pid=5856)[0m `Trainer.fit` stopped: `max_steps=800.0` reached.


[36m(_train_tune pid=5856)[0m 
[36m(_train_tune pid=5856)[0m Validation DataLoader 0: 100%|██████████| 13/13 [00:00<00:00, 62.68it/s][A
[36m(_train_tune pid=5856)[0m                                                                         [AEpoch 61:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.22, train_loss_epoch=-1.26, valid_loss=-1.22]Epoch 61:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.22, train_loss_epoch=-1.28, valid_loss=-1.22]Epoch 61:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.22, train_loss_epoch=-1.28, valid_loss=-1.22]


[36m(_train_tune pid=6074)[0m /usr/local/lib/python3.10/dist-packages/ray/tune/integration/pytorch_lightning.py:198: `ray.tune.integration.pytorch_lightning.TuneReportCallback` is deprecated. Use `ray.tune.integration.pytorch_lightning.TuneReportCheckpointCallback` instead.
[36m(_train_tune pid=6074)[0m Seed set to 42
[36m(_train_tune pid=6074)[0m GPU available: True (cuda), used: True
[36m(_train_tune pid=6074)[0m TPU available: False, using: 0 TPU cores
[36m(_train_tune pid=6074)[0m HPU available: False, using: 0 HPUs
[36m(_train_tune pid=6074)[0m You are using a CUDA device ('NVIDIA A100-SXM4-40GB') that has Tensor Cores. To properly utilize them, you should set `torch.set_float32_matmul_precision('medium' | 'high')` which will trade-off precision for performance. For more details, read https://pytorch.org/docs/stable/generated/torch.set_float32_matmul_precision.html#torch.set_float32_matmul_precision
[36m(_train_tune pid=6074)[0m 2024-11-18 13:04:14.733451: I tensorfl

Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Epoch 0:   0%|          | 0/7 [00:00<?, ?it/s] 
Epoch 1:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=2.290, train_loss_epoch=11.70]
Epoch 2:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-0.986, train_loss_epoch=1.150]
Epoch 3:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-0.867, train_loss_epoch=-0.156]
Epoch 4:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-0.779, train_loss_epoch=-0.675]
Epoch 5:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.83, train_loss_epoch=-1.40]
Epoch 6:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-0.608, train_loss_epoch=-0.966]
Epoch 7:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=0.376, train_loss_epoch=0.266]
Epoch 8:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-0.127, train_loss_epoch=0.676]
Epoch 9:   0%|          | 0/7 [00:00<?, ?it/s, v_num

[36m(_train_tune pid=6074)[0m `Trainer.fit` stopped: `max_steps=1100.0` reached.
2024-11-18 13:05:10,031	INFO tensorboardx.py:308 -- Removed the following hyperparameter values when logging to tensorboard: {'hist_exog_list': ('DY', 'PTBV', 'P', 'PO', 'VO', 'PE'), 'loss': ('__ref_ph', 'de895953'), 'n_freq_downsample': (180, 60, 1), 'n_pool_kernel_size': (2, 2, 1), 'valid_loss': ('__ref_ph', '004b9a7a')}


[36m(_train_tune pid=6074)[0m 
[36m(_train_tune pid=6074)[0m Validation DataLoader 0: 100%|██████████| 7/7 [00:01<00:00,  3.73it/s][A
[36m(_train_tune pid=6074)[0m                                                                       [AEpoch 157:   0%|          | 0/7 [00:01<?, ?it/s, v_num=0, train_loss_step=-1.66, train_loss_epoch=-1.66, valid_loss=-1.64]Epoch 157:   0%|          | 0/7 [00:01<?, ?it/s, v_num=0, train_loss_step=-1.66, train_loss_epoch=-1.66, valid_loss=-1.64]Epoch 157:   0%|          | 0/7 [00:01<?, ?it/s, v_num=0, train_loss_step=-1.66, train_loss_epoch=-1.66, valid_loss=-1.64]


[36m(_train_tune pid=6417)[0m /usr/local/lib/python3.10/dist-packages/ray/tune/integration/pytorch_lightning.py:198: `ray.tune.integration.pytorch_lightning.TuneReportCallback` is deprecated. Use `ray.tune.integration.pytorch_lightning.TuneReportCheckpointCallback` instead.
[36m(_train_tune pid=6417)[0m Seed set to 42
[36m(_train_tune pid=6417)[0m GPU available: True (cuda), used: True
[36m(_train_tune pid=6417)[0m TPU available: False, using: 0 TPU cores
[36m(_train_tune pid=6417)[0m HPU available: False, using: 0 HPUs
[36m(_train_tune pid=6417)[0m You are using a CUDA device ('NVIDIA A100-SXM4-40GB') that has Tensor Cores. To properly utilize them, you should set `torch.set_float32_matmul_precision('medium' | 'high')` which will trade-off precision for performance. For more details, read https://pytorch.org/docs/stable/generated/torch.set_float32_matmul_precision.html#torch.set_float32_matmul_precision
[36m(_train_tune pid=6417)[0m 2024-11-18 13:05:17.701488: I tensorfl

Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Epoch 0:   0%|          | 0/7 [00:00<?, ?it/s] 
Epoch 1:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-0.86, train_loss_epoch=-0.785]
Epoch 2:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.44, train_loss_epoch=-0.922]
Epoch 3:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.11, train_loss_epoch=-0.877]
Epoch 4:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-0.712, train_loss_epoch=-0.878]
Epoch 5:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.42, train_loss_epoch=-1.01]
Epoch 6:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-0.767, train_loss_epoch=-0.942]
Epoch 7:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-0.466, train_loss_epoch=-0.902]
Epoch 8:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-0.621, train_loss_epoch=-0.945]
Epoch 9:   0%|          | 0/7 [00:00<?, ?it/s, v_

[36m(_train_tune pid=6417)[0m `Trainer.fit` stopped: `max_steps=600.0` reached.
2024-11-18 13:05:49,685	INFO tensorboardx.py:308 -- Removed the following hyperparameter values when logging to tensorboard: {'hist_exog_list': ('DY', 'PTBV', 'P', 'PO', 'VO', 'PE'), 'loss': ('__ref_ph', 'de895953'), 'n_freq_downsample': (168, 24, 1), 'n_pool_kernel_size': (4, 4, 4), 'valid_loss': ('__ref_ph', '004b9a7a')}


[36m(_train_tune pid=6417)[0m 
[36m(_train_tune pid=6417)[0m Validation DataLoader 0: 100%|██████████| 7/7 [00:01<00:00,  3.81it/s][A
[36m(_train_tune pid=6417)[0m                                                                       [AEpoch 85:   0%|          | 0/7 [00:02<?, ?it/s, v_num=0, train_loss_step=-1.59, train_loss_epoch=-1.64, valid_loss=-1.60]Epoch 85:   0%|          | 0/7 [00:02<?, ?it/s, v_num=0, train_loss_step=-1.59, train_loss_epoch=-1.66, valid_loss=-1.60]Epoch 85:   0%|          | 0/7 [00:02<?, ?it/s, v_num=0, train_loss_step=-1.59, train_loss_epoch=-1.66, valid_loss=-1.60]


[36m(_train_tune pid=6651)[0m /usr/local/lib/python3.10/dist-packages/ray/tune/integration/pytorch_lightning.py:198: `ray.tune.integration.pytorch_lightning.TuneReportCallback` is deprecated. Use `ray.tune.integration.pytorch_lightning.TuneReportCheckpointCallback` instead.
[36m(_train_tune pid=6651)[0m Seed set to 42
[36m(_train_tune pid=6651)[0m GPU available: True (cuda), used: True
[36m(_train_tune pid=6651)[0m TPU available: False, using: 0 TPU cores
[36m(_train_tune pid=6651)[0m HPU available: False, using: 0 HPUs
[36m(_train_tune pid=6651)[0m You are using a CUDA device ('NVIDIA A100-SXM4-40GB') that has Tensor Cores. To properly utilize them, you should set `torch.set_float32_matmul_precision('medium' | 'high')` which will trade-off precision for performance. For more details, read https://pytorch.org/docs/stable/generated/torch.set_float32_matmul_precision.html#torch.set_float32_matmul_precision
[36m(_train_tune pid=6651)[0m 2024-11-18 13:05:57.762211: I tensorfl

Sanity Checking: |          | 0/? [00:00<?, ?it/s]
Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Epoch 0:   0%|          | 0/2 [00:00<?, ?it/s] 
Epoch 1:   0%|          | 0/2 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.18, train_loss_epoch=-1.25]
Epoch 2:   0%|          | 0/2 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.36, train_loss_epoch=-1.37]
Epoch 3:   0%|          | 0/2 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.42, train_loss_epoch=-1.33]
Epoch 4:   0%|          | 0/2 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.59, train_loss_epoch=-1.55]
Epoch 5:   0%|          | 0/2 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.42, train_loss_epoch=-1.40]
Epoch 6:   0%|          | 0/2 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.44, train_loss_epoch=-1.42]
Epoch 7:   0%|          | 0/2 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.35, train_loss_epoch=-1.41]
Epoch 8:   0%|          | 0/2 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.59, train_loss_epoch=-1.54]
Epoch 9: 

2024-11-18 13:06:40,647	INFO tensorboardx.py:308 -- Removed the following hyperparameter values when logging to tensorboard: {'hist_exog_list': ('DY', 'PTBV', 'P', 'PO', 'VO', 'PE'), 'loss': ('__ref_ph', 'de895953'), 'n_freq_downsample': (24, 12, 1), 'n_pool_kernel_size': (2, 2, 1), 'valid_loss': ('__ref_ph', '004b9a7a')}


[36m(_train_tune pid=6651)[0m 
[36m(_train_tune pid=6651)[0m Validation DataLoader 0: 100%|██████████| 2/2 [00:00<00:00, 15.87it/s][A
[36m(_train_tune pid=6651)[0m 
[36m(_train_tune pid=6651)[0m                                                                       [AEpoch 349: 100%|██████████| 2/2 [00:00<00:00,  6.77it/s, v_num=0, train_loss_step=-1.68, train_loss_epoch=-1.59, valid_loss=-1.66]Epoch 349: 100%|██████████| 2/2 [00:00<00:00,  6.67it/s, v_num=0, train_loss_step=-1.68, train_loss_epoch=-1.63, valid_loss=-1.66]Epoch 349: 100%|██████████| 2/2 [00:00<00:00,  6.65it/s, v_num=0, train_loss_step=-1.68, train_loss_epoch=-1.63, valid_loss=-1.66]


[36m(_train_tune pid=6651)[0m `Trainer.fit` stopped: `max_steps=700.0` reached.
[36m(_train_tune pid=6937)[0m /usr/local/lib/python3.10/dist-packages/ray/tune/integration/pytorch_lightning.py:198: `ray.tune.integration.pytorch_lightning.TuneReportCallback` is deprecated. Use `ray.tune.integration.pytorch_lightning.TuneReportCheckpointCallback` instead.
[36m(_train_tune pid=6937)[0m Seed set to 42
[36m(_train_tune pid=6937)[0m GPU available: True (cuda), used: True
[36m(_train_tune pid=6937)[0m TPU available: False, using: 0 TPU cores
[36m(_train_tune pid=6937)[0m HPU available: False, using: 0 HPUs
[36m(_train_tune pid=6937)[0m You are using a CUDA device ('NVIDIA A100-SXM4-40GB') that has Tensor Cores. To properly utilize them, you should set `torch.set_float32_matmul_precision('medium' | 'high')` which will trade-off precision for performance. For more details, read https://pytorch.org/docs/stable/generated/torch.set_float32_matmul_precision.html#torch.set_float32_matmu

Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Epoch 0:   0%|          | 0/4 [00:00<?, ?it/s] 
Epoch 1:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=2.930, train_loss_epoch=3.040]
Epoch 2:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.32, train_loss_epoch=-0.41]
Epoch 3:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.38, train_loss_epoch=-1.11]
Epoch 4:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.11, train_loss_epoch=-1.21]
Epoch 4: 100%|██████████| 4/4 [00:00<00:00, 26.58it/s, v_num=0, train_loss_step=-1.11, train_loss_epoch=-1.21]
Epoch 4: 100%|██████████| 4/4 [00:00<00:00, 26.39it/s, v_num=0, train_loss_step=-1.59, train_loss_epoch=-1.33]
Epoch 5:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.59, train_loss_epoch=-1.33]
Epoch 6:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.08, train_loss_epoch=-1.18]
Epoch 7:   0%|          | 0/4 [00:00<?, ?it/

[36m(_train_tune pid=6937)[0m `Trainer.fit` stopped: `max_steps=1100.0` reached.
2024-11-18 13:07:59,100	INFO tensorboardx.py:308 -- Removed the following hyperparameter values when logging to tensorboard: {'hist_exog_list': ('DY', 'PTBV', 'P', 'PO', 'VO', 'PE'), 'loss': ('__ref_ph', 'de895953'), 'n_freq_downsample': (40, 20, 1), 'n_pool_kernel_size': (2, 2, 2), 'valid_loss': ('__ref_ph', '004b9a7a')}


[36m(_train_tune pid=6937)[0m 
[36m(_train_tune pid=6937)[0m Validation DataLoader 0: 100%|██████████| 4/4 [00:01<00:00,  2.06it/s][A
[36m(_train_tune pid=6937)[0m                                                                       [AEpoch 274: 100%|██████████| 4/4 [00:02<00:00,  1.88it/s, v_num=0, train_loss_step=-0.845, train_loss_epoch=-1.34, valid_loss=-1.44]Epoch 274: 100%|██████████| 4/4 [00:02<00:00,  1.88it/s, v_num=0, train_loss_step=-0.845, train_loss_epoch=-1.31, valid_loss=-1.44]Epoch 274: 100%|██████████| 4/4 [00:02<00:00,  1.88it/s, v_num=0, train_loss_step=-0.845, train_loss_epoch=-1.31, valid_loss=-1.44]


[36m(_train_tune pid=7339)[0m /usr/local/lib/python3.10/dist-packages/ray/tune/integration/pytorch_lightning.py:198: `ray.tune.integration.pytorch_lightning.TuneReportCallback` is deprecated. Use `ray.tune.integration.pytorch_lightning.TuneReportCheckpointCallback` instead.
[36m(_train_tune pid=7339)[0m Seed set to 42
[36m(_train_tune pid=7339)[0m GPU available: True (cuda), used: True
[36m(_train_tune pid=7339)[0m TPU available: False, using: 0 TPU cores
[36m(_train_tune pid=7339)[0m HPU available: False, using: 0 HPUs
[36m(_train_tune pid=7339)[0m You are using a CUDA device ('NVIDIA A100-SXM4-40GB') that has Tensor Cores. To properly utilize them, you should set `torch.set_float32_matmul_precision('medium' | 'high')` which will trade-off precision for performance. For more details, read https://pytorch.org/docs/stable/generated/torch.set_float32_matmul_precision.html#torch.set_float32_matmul_precision
[36m(_train_tune pid=7339)[0m 2024-11-18 13:08:06.863852: I tensorfl

Sanity Checking: |          | 0/? [00:00<?, ?it/s]
Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Epoch 0:   0%|          | 0/13 [00:00<?, ?it/s] 
Epoch 1:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.32, train_loss_epoch=1.060]
Epoch 2:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.10, train_loss_epoch=-1.56]
Epoch 3:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.00, train_loss_epoch=-1.65]
Epoch 4:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.61, train_loss_epoch=-1.65]
Epoch 5:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.03, train_loss_epoch=-1.69]
Epoch 6:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.67, train_loss_epoch=-1.73]
Epoch 7:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.68, train_loss_epoch=-1.76]
[36m(_train_tune pid=7339)[0m 
Validation: |          | 0/? [00:00<?, ?it/s][A
Validation:   0%|     

2024-11-18 13:08:25,351	INFO tensorboardx.py:308 -- Removed the following hyperparameter values when logging to tensorboard: {'hist_exog_list': ('DY', 'PTBV', 'P', 'PO', 'VO', 'PE'), 'loss': ('__ref_ph', 'de895953'), 'n_freq_downsample': (60, 8, 1), 'n_pool_kernel_size': (8, 4, 1), 'valid_loss': ('__ref_ph', '004b9a7a')}
[36m(_train_tune pid=7339)[0m `Trainer.fit` stopped: `max_steps=800.0` reached.


[36m(_train_tune pid=7339)[0m 
[36m(_train_tune pid=7339)[0m Validation DataLoader 0: 100%|██████████| 13/13 [00:00<00:00, 63.68it/s][A
[36m(_train_tune pid=7339)[0m                                                                         [AEpoch 61:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.90, train_loss_epoch=-1.91, valid_loss=-1.89]Epoch 61:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.90, train_loss_epoch=-1.93, valid_loss=-1.89]Epoch 61:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.90, train_loss_epoch=-1.93, valid_loss=-1.89]


[36m(_train_tune pid=7513)[0m /usr/local/lib/python3.10/dist-packages/ray/tune/integration/pytorch_lightning.py:198: `ray.tune.integration.pytorch_lightning.TuneReportCallback` is deprecated. Use `ray.tune.integration.pytorch_lightning.TuneReportCheckpointCallback` instead.
[36m(_train_tune pid=7513)[0m Seed set to 42
[36m(_train_tune pid=7513)[0m GPU available: True (cuda), used: True
[36m(_train_tune pid=7513)[0m TPU available: False, using: 0 TPU cores
[36m(_train_tune pid=7513)[0m HPU available: False, using: 0 HPUs
[36m(_train_tune pid=7513)[0m You are using a CUDA device ('NVIDIA A100-SXM4-40GB') that has Tensor Cores. To properly utilize them, you should set `torch.set_float32_matmul_precision('medium' | 'high')` which will trade-off precision for performance. For more details, read https://pytorch.org/docs/stable/generated/torch.set_float32_matmul_precision.html#torch.set_float32_matmul_precision
[36m(_train_tune pid=7513)[0m 2024-11-18 13:08:32.764791: I tensorfl

Sanity Checking: |          | 0/? [00:00<?, ?it/s]
Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Epoch 0:   0%|          | 0/2 [00:00<?, ?it/s] 
Epoch 1:   0%|          | 0/2 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.16, train_loss_epoch=-0.865]
Epoch 2:   0%|          | 0/2 [00:00<?, ?it/s, v_num=0, train_loss_step=-0.921, train_loss_epoch=-0.919]
Epoch 3:   0%|          | 0/2 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.21, train_loss_epoch=-1.14]
Epoch 4:   0%|          | 0/2 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.00, train_loss_epoch=-1.06]
Epoch 5:   0%|          | 0/2 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.01, train_loss_epoch=-1.01]
Epoch 6:   0%|          | 0/2 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.19, train_loss_epoch=-1.06]
Epoch 7:   0%|          | 0/2 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.03, train_loss_epoch=-1.05]
Epoch 8:   0%|          | 0/2 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.10, train_loss_epoch=-1.06]
Epoch 

2024-11-18 13:09:51,493	INFO tensorboardx.py:308 -- Removed the following hyperparameter values when logging to tensorboard: {'hist_exog_list': ('DY', 'PTBV', 'P', 'PO', 'VO', 'PE'), 'loss': ('__ref_ph', 'de895953'), 'n_freq_downsample': (168, 24, 1), 'n_pool_kernel_size': (16, 8, 1), 'valid_loss': ('__ref_ph', '004b9a7a')}
[36m(_train_tune pid=7513)[0m `Trainer.fit` stopped: `max_steps=1300.0` reached.


[36m(_train_tune pid=7513)[0m 
[36m(_train_tune pid=7513)[0m Validation DataLoader 0: 100%|██████████| 2/2 [00:00<00:00, 15.13it/s][A
[36m(_train_tune pid=7513)[0m                                                                       [AEpoch 649: 100%|██████████| 2/2 [00:00<00:00,  6.46it/s, v_num=0, train_loss_step=-1.70, train_loss_epoch=-1.84, valid_loss=-1.69]Epoch 649: 100%|██████████| 2/2 [00:00<00:00,  6.44it/s, v_num=0, train_loss_step=-1.70, train_loss_epoch=-1.72, valid_loss=-1.69]Epoch 649: 100%|██████████| 2/2 [00:00<00:00,  6.42it/s, v_num=0, train_loss_step=-1.70, train_loss_epoch=-1.72, valid_loss=-1.69]


[36m(_train_tune pid=7948)[0m /usr/local/lib/python3.10/dist-packages/ray/tune/integration/pytorch_lightning.py:198: `ray.tune.integration.pytorch_lightning.TuneReportCallback` is deprecated. Use `ray.tune.integration.pytorch_lightning.TuneReportCheckpointCallback` instead.
[36m(_train_tune pid=7948)[0m Seed set to 42
[36m(_train_tune pid=7948)[0m GPU available: True (cuda), used: True
[36m(_train_tune pid=7948)[0m TPU available: False, using: 0 TPU cores
[36m(_train_tune pid=7948)[0m HPU available: False, using: 0 HPUs
[36m(_train_tune pid=7948)[0m You are using a CUDA device ('NVIDIA A100-SXM4-40GB') that has Tensor Cores. To properly utilize them, you should set `torch.set_float32_matmul_precision('medium' | 'high')` which will trade-off precision for performance. For more details, read https://pytorch.org/docs/stable/generated/torch.set_float32_matmul_precision.html#torch.set_float32_matmul_precision
[36m(_train_tune pid=7948)[0m 2024-11-18 13:09:59.664865: I tensorfl

[36m(_train_tune pid=7948)[0m Sanity Checking: |          | 0/? [00:00<?, ?it/s]
[36m(_train_tune pid=7948)[0m Sanity Checking:   0%|          | 0/2 [00:00<?, ?it/s]Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]


2024-11-18 13:10:03,687	ERROR tune_controller.py:1331 -- Trial task failed for trial _train_tune_a76ac303
Traceback (most recent call last):
  File "/usr/local/lib/python3.10/dist-packages/ray/air/execution/_internal/event_manager.py", line 110, in resolve_future
    result = ray.get(future)
  File "/usr/local/lib/python3.10/dist-packages/ray/_private/auto_init_hook.py", line 21, in auto_init_wrapper
    return fn(*args, **kwargs)
  File "/usr/local/lib/python3.10/dist-packages/ray/_private/client_mode_hook.py", line 103, in wrapper
    return func(*args, **kwargs)
  File "/usr/local/lib/python3.10/dist-packages/ray/_private/worker.py", line 2753, in get
    values, debugger_breakpoint = worker.get_objects(object_refs, timeout=timeout)
  File "/usr/local/lib/python3.10/dist-packages/ray/_private/worker.py", line 904, in get_objects
    raise value.as_instanceof_cause()
ray.exceptions.RayTaskError(OutOfMemoryError): [36mray::ImplicitFunc.train()[39m (pid=7948, ip=172.28.0.12, actor_id


Trial _train_tune_a76ac303 errored after 0 iterations at 2024-11-18 13:10:03. Total running time: 6min 26s
Error file: /tmp/ray/session_2024-11-18_13-03-34_336407_4396/artifacts/2024-11-18_13-03-37/_train_tune_2024-11-18_13-03-34/driver_artifacts/_train_tune_a76ac303_8_batch_size=256,h=20,hist_exog_list=DY_PTBV_P_PO_VO_PE,input_size=40,learning_rate=0.0050,loss=ref_ph_de8959_2024-11-18_13-08-32/error.txt


[36m(_train_tune pid=8058)[0m /usr/local/lib/python3.10/dist-packages/ray/tune/integration/pytorch_lightning.py:198: `ray.tune.integration.pytorch_lightning.TuneReportCallback` is deprecated. Use `ray.tune.integration.pytorch_lightning.TuneReportCheckpointCallback` instead.
[36m(_train_tune pid=8058)[0m Seed set to 42
[36m(_train_tune pid=8058)[0m GPU available: True (cuda), used: True
[36m(_train_tune pid=8058)[0m TPU available: False, using: 0 TPU cores
[36m(_train_tune pid=8058)[0m HPU available: False, using: 0 HPUs
[36m(_train_tune pid=8058)[0m You are using a CUDA device ('NVIDIA A100-SXM4-40GB') that has Tensor Cores. To properly utilize them, you should set `torch.set_float32_matmul_precision('medium' | 'high')` which will trade-off precision for performance. For more details, read https://pytorch.org/docs/stable/generated/torch.set_float32_matmul_precision.html#torch.set_float32_matmul_precision
[36m(_train_tune pid=8058)[0m 2024-11-18 13:10:11.811976: I tensorfl

Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Epoch 0:   0%|          | 0/7 [00:00<?, ?it/s] 
Epoch 1:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=1.600, train_loss_epoch=5.900]
Epoch 2:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.73, train_loss_epoch=-0.261]
Epoch 3:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-0.811, train_loss_epoch=-1.24]
Epoch 4:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.45, train_loss_epoch=-1.43]
Epoch 4: 100%|██████████| 7/7 [00:00<00:00, 40.06it/s, v_num=0, train_loss_step=-1.80, train_loss_epoch=-1.43]
Epoch 5:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.80, train_loss_epoch=-1.51]
Epoch 6:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.46, train_loss_epoch=-1.48]
Epoch 7:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.67, train_loss_epoch=-1.63]
Epoch 8:   0%|          | 0/7 [00:00<?, ?it/s, v_n

[36m(_train_tune pid=8058)[0m `Trainer.fit` stopped: `max_steps=900.0` reached.
2024-11-18 13:10:36,410	INFO tensorboardx.py:308 -- Removed the following hyperparameter values when logging to tensorboard: {'hist_exog_list': ('DY', 'PTBV', 'P', 'PO', 'VO', 'PE'), 'loss': ('__ref_ph', 'de895953'), 'n_freq_downsample': (180, 60, 1), 'n_pool_kernel_size': (2, 2, 1), 'valid_loss': ('__ref_ph', '004b9a7a')}


[36m(_train_tune pid=8058)[0m 
[36m(_train_tune pid=8058)[0m Validation DataLoader 0: 100%|██████████| 7/7 [00:00<00:00, 38.63it/s][A
[36m(_train_tune pid=8058)[0m                                                                       [AEpoch 128:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.85, train_loss_epoch=-1.90, valid_loss=-1.84]Epoch 128:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.85, train_loss_epoch=-1.88, valid_loss=-1.84]Epoch 128:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.85, train_loss_epoch=-1.88, valid_loss=-1.84]


[36m(_train_tune pid=8248)[0m /usr/local/lib/python3.10/dist-packages/ray/tune/integration/pytorch_lightning.py:198: `ray.tune.integration.pytorch_lightning.TuneReportCallback` is deprecated. Use `ray.tune.integration.pytorch_lightning.TuneReportCheckpointCallback` instead.
[36m(_train_tune pid=8248)[0m Seed set to 42
[36m(_train_tune pid=8248)[0m GPU available: True (cuda), used: True
[36m(_train_tune pid=8248)[0m TPU available: False, using: 0 TPU cores
[36m(_train_tune pid=8248)[0m HPU available: False, using: 0 HPUs
[36m(_train_tune pid=8248)[0m You are using a CUDA device ('NVIDIA A100-SXM4-40GB') that has Tensor Cores. To properly utilize them, you should set `torch.set_float32_matmul_precision('medium' | 'high')` which will trade-off precision for performance. For more details, read https://pytorch.org/docs/stable/generated/torch.set_float32_matmul_precision.html#torch.set_float32_matmul_precision
[36m(_train_tune pid=8248)[0m 2024-11-18 13:10:43.787535: I tensorfl

Sanity Checking: |          | 0/? [00:00<?, ?it/s]
Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Epoch 0:   0%|          | 0/13 [00:00<?, ?it/s] 
Epoch 1:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=7.810, train_loss_epoch=12.60]
Epoch 2:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=7.240, train_loss_epoch=7.900]
Epoch 3:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=7.790, train_loss_epoch=7.930]
Epoch 4:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=7.110, train_loss_epoch=7.770]
Epoch 5:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=7.140, train_loss_epoch=7.470]
Epoch 6:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=6.440, train_loss_epoch=6.760]
Epoch 7:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=5.270, train_loss_epoch=6.070]
[36m(_train_tune pid=8248)[0m 
Validation: |          | 0/? [00:00<?, ?it/s][A
Validation:   0%|     

[36m(_train_tune pid=8248)[0m `Trainer.fit` stopped: `max_steps=600.0` reached.
2024-11-18 13:10:58,591	INFO tensorboardx.py:308 -- Removed the following hyperparameter values when logging to tensorboard: {'hist_exog_list': ('DY', 'PTBV', 'P', 'PO', 'VO', 'PE'), 'loss': ('__ref_ph', 'de895953'), 'n_freq_downsample': (168, 24, 1), 'n_pool_kernel_size': (2, 2, 1), 'valid_loss': ('__ref_ph', '004b9a7a')}


[36m(_train_tune pid=8248)[0m 
[36m(_train_tune pid=8248)[0m Validation DataLoader 0: 100%|██████████| 13/13 [00:00<00:00, 71.15it/s][A
[36m(_train_tune pid=8248)[0m                                                                         [AEpoch 46:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=4.110, train_loss_epoch=4.070, valid_loss=4.170]Epoch 46:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=4.110, train_loss_epoch=4.090, valid_loss=4.170]Epoch 46:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=4.110, train_loss_epoch=4.090, valid_loss=4.170]


[36m(_train_tune pid=8405)[0m /usr/local/lib/python3.10/dist-packages/ray/tune/integration/pytorch_lightning.py:198: `ray.tune.integration.pytorch_lightning.TuneReportCallback` is deprecated. Use `ray.tune.integration.pytorch_lightning.TuneReportCheckpointCallback` instead.
[36m(_train_tune pid=8405)[0m Seed set to 42
[36m(_train_tune pid=8405)[0m GPU available: True (cuda), used: True
[36m(_train_tune pid=8405)[0m TPU available: False, using: 0 TPU cores
[36m(_train_tune pid=8405)[0m HPU available: False, using: 0 HPUs
[36m(_train_tune pid=8405)[0m You are using a CUDA device ('NVIDIA A100-SXM4-40GB') that has Tensor Cores. To properly utilize them, you should set `torch.set_float32_matmul_precision('medium' | 'high')` which will trade-off precision for performance. For more details, read https://pytorch.org/docs/stable/generated/torch.set_float32_matmul_precision.html#torch.set_float32_matmul_precision
[36m(_train_tune pid=8405)[0m 2024-11-18 13:11:06.712635: I tensorfl

Sanity Checking: |          | 0/? [00:00<?, ?it/s]
Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Epoch 0:   0%|          | 0/4 [00:00<?, ?it/s] 
Epoch 0:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.19, train_loss_epoch=-0.807]        
Epoch 1:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.19, train_loss_epoch=-0.807]
Epoch 2:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.08, train_loss_epoch=-1.53]
Epoch 3:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.62, train_loss_epoch=-1.38]
Epoch 4:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.29, train_loss_epoch=-1.38]
Epoch 5:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.86, train_loss_epoch=-1.60]
Epoch 6:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.27, train_loss_epoch=-1.43]
Epoch 7:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.46, train_loss_epoch=-1.44]

2024-11-18 13:11:53,851	INFO tensorboardx.py:308 -- Removed the following hyperparameter values when logging to tensorboard: {'hist_exog_list': ('DY', 'PTBV', 'P', 'PO', 'VO', 'PE'), 'loss': ('__ref_ph', 'de895953'), 'n_freq_downsample': (1, 1, 1), 'n_pool_kernel_size': (2, 2, 2), 'valid_loss': ('__ref_ph', '004b9a7a')}
[36m(_train_tune pid=8405)[0m `Trainer.fit` stopped: `max_steps=1500.0` reached.


[36m(_train_tune pid=8405)[0m 
[36m(_train_tune pid=8405)[0m Validation DataLoader 0: 100%|██████████| 4/4 [00:00<00:00, 23.36it/s][A
[36m(_train_tune pid=8405)[0m                                                                       [AEpoch 374: 100%|██████████| 4/4 [00:00<00:00, 13.23it/s, v_num=0, train_loss_step=-1.95, train_loss_epoch=-1.85, valid_loss=-1.75]Epoch 374: 100%|██████████| 4/4 [00:00<00:00, 13.20it/s, v_num=0, train_loss_step=-1.95, train_loss_epoch=-1.86, valid_loss=-1.75]Epoch 374: 100%|██████████| 4/4 [00:00<00:00, 13.15it/s, v_num=0, train_loss_step=-1.95, train_loss_epoch=-1.86, valid_loss=-1.75]


[36m(_train_tune pid=8693)[0m /usr/local/lib/python3.10/dist-packages/ray/tune/integration/pytorch_lightning.py:198: `ray.tune.integration.pytorch_lightning.TuneReportCallback` is deprecated. Use `ray.tune.integration.pytorch_lightning.TuneReportCheckpointCallback` instead.
[36m(_train_tune pid=8693)[0m Seed set to 42
[36m(_train_tune pid=8693)[0m GPU available: True (cuda), used: True
[36m(_train_tune pid=8693)[0m TPU available: False, using: 0 TPU cores
[36m(_train_tune pid=8693)[0m HPU available: False, using: 0 HPUs
[36m(_train_tune pid=8693)[0m You are using a CUDA device ('NVIDIA A100-SXM4-40GB') that has Tensor Cores. To properly utilize them, you should set `torch.set_float32_matmul_precision('medium' | 'high')` which will trade-off precision for performance. For more details, read https://pytorch.org/docs/stable/generated/torch.set_float32_matmul_precision.html#torch.set_float32_matmul_precision
[36m(_train_tune pid=8693)[0m 2024-11-18 13:12:01.803575: I tensorfl

Sanity Checking: |          | 0/? [00:00<?, ?it/s]
Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Sanity Checking DataLoader 0: 100%|██████████| 2/2 [00:00<00:00,  2.23it/s]
                                                                           
Epoch 0:   0%|          | 0/4 [00:00<?, ?it/s] 
Epoch 1:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=7.260, train_loss_epoch=20.70]
Epoch 2:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=7.000, train_loss_epoch=7.420]
Epoch 3:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=7.860, train_loss_epoch=7.810]
Epoch 4:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=7.170, train_loss_epoch=7.710]
Epoch 5:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=7.950, train_loss_epoch=8.040]
Epoch 6:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=8.300, train_loss_epoch=8.140]
Epoch 7:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_l

2024-11-18 13:12:39,643	INFO tensorboardx.py:308 -- Removed the following hyperparameter values when logging to tensorboard: {'hist_exog_list': ('DY', 'PTBV', 'P', 'PO', 'VO', 'PE'), 'loss': ('__ref_ph', 'de895953'), 'n_freq_downsample': (24, 12, 1), 'n_pool_kernel_size': (1, 1, 1), 'valid_loss': ('__ref_ph', '004b9a7a')}
[36m(_train_tune pid=8693)[0m `Trainer.fit` stopped: `max_steps=1200.0` reached.


[36m(_train_tune pid=8693)[0m 
[36m(_train_tune pid=8693)[0m Validation DataLoader 0: 100%|██████████| 4/4 [00:00<00:00, 27.33it/s][A
[36m(_train_tune pid=8693)[0m                                                                       [AEpoch 299: 100%|██████████| 4/4 [00:00<00:00, 14.37it/s, v_num=0, train_loss_step=3.380, train_loss_epoch=4.220, valid_loss=4.060]Epoch 299: 100%|██████████| 4/4 [00:00<00:00, 14.32it/s, v_num=0, train_loss_step=3.380, train_loss_epoch=3.820, valid_loss=4.060]Epoch 299: 100%|██████████| 4/4 [00:00<00:00, 14.27it/s, v_num=0, train_loss_step=3.380, train_loss_epoch=3.820, valid_loss=4.060]


[36m(_train_tune pid=8945)[0m /usr/local/lib/python3.10/dist-packages/ray/tune/integration/pytorch_lightning.py:198: `ray.tune.integration.pytorch_lightning.TuneReportCallback` is deprecated. Use `ray.tune.integration.pytorch_lightning.TuneReportCheckpointCallback` instead.
[36m(_train_tune pid=8945)[0m Seed set to 42
[36m(_train_tune pid=8945)[0m GPU available: True (cuda), used: True
[36m(_train_tune pid=8945)[0m TPU available: False, using: 0 TPU cores
[36m(_train_tune pid=8945)[0m HPU available: False, using: 0 HPUs
[36m(_train_tune pid=8945)[0m You are using a CUDA device ('NVIDIA A100-SXM4-40GB') that has Tensor Cores. To properly utilize them, you should set `torch.set_float32_matmul_precision('medium' | 'high')` which will trade-off precision for performance. For more details, read https://pytorch.org/docs/stable/generated/torch.set_float32_matmul_precision.html#torch.set_float32_matmul_precision
[36m(_train_tune pid=8945)[0m 2024-11-18 13:12:47.825916: I tensorfl

Sanity Checking: |          | 0/? [00:00<?, ?it/s]
Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Epoch 0:   0%|          | 0/7 [00:00<?, ?it/s] 
Epoch 1:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=7.050, train_loss_epoch=73.70]
Epoch 2:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=6.660, train_loss_epoch=7.130]
Epoch 3:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=7.260, train_loss_epoch=7.320]
Epoch 4:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=6.800, train_loss_epoch=7.340]
Epoch 5:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=7.350, train_loss_epoch=7.420]
Epoch 6:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=7.610, train_loss_epoch=7.490]
Epoch 7:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=6.510, train_loss_epoch=7.310]
Epoch 8:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=7.130, train_loss_epoch=7.370]
Epoch 9: 

2024-11-18 13:13:53,226	INFO tensorboardx.py:308 -- Removed the following hyperparameter values when logging to tensorboard: {'hist_exog_list': ('DY', 'PTBV', 'P', 'PO', 'VO', 'PE'), 'loss': ('__ref_ph', 'de895953'), 'n_freq_downsample': (40, 20, 1), 'n_pool_kernel_size': (4, 4, 4), 'valid_loss': ('__ref_ph', '004b9a7a')}
[36m(_train_tune pid=8945)[0m `Trainer.fit` stopped: `max_steps=1400.0` reached.


[36m(_train_tune pid=8945)[0m 
[36m(_train_tune pid=8945)[0m Validation DataLoader 0: 100%|██████████| 7/7 [00:01<00:00,  3.84it/s][A
[36m(_train_tune pid=8945)[0m                                                                       [AEpoch 199: 100%|██████████| 7/7 [00:02<00:00,  3.47it/s, v_num=0, train_loss_step=4.100, train_loss_epoch=4.250, valid_loss=4.150]Epoch 199: 100%|██████████| 7/7 [00:02<00:00,  3.47it/s, v_num=0, train_loss_step=4.100, train_loss_epoch=4.230, valid_loss=4.150]Epoch 199: 100%|██████████| 7/7 [00:02<00:00,  3.46it/s, v_num=0, train_loss_step=4.100, train_loss_epoch=4.230, valid_loss=4.150]


[36m(_train_tune pid=9309)[0m /usr/local/lib/python3.10/dist-packages/ray/tune/integration/pytorch_lightning.py:198: `ray.tune.integration.pytorch_lightning.TuneReportCallback` is deprecated. Use `ray.tune.integration.pytorch_lightning.TuneReportCheckpointCallback` instead.
[36m(_train_tune pid=9309)[0m Seed set to 42
[36m(_train_tune pid=9309)[0m GPU available: True (cuda), used: True
[36m(_train_tune pid=9309)[0m TPU available: False, using: 0 TPU cores
[36m(_train_tune pid=9309)[0m HPU available: False, using: 0 HPUs
[36m(_train_tune pid=9309)[0m You are using a CUDA device ('NVIDIA A100-SXM4-40GB') that has Tensor Cores. To properly utilize them, you should set `torch.set_float32_matmul_precision('medium' | 'high')` which will trade-off precision for performance. For more details, read https://pytorch.org/docs/stable/generated/torch.set_float32_matmul_precision.html#torch.set_float32_matmul_precision
[36m(_train_tune pid=9309)[0m 2024-11-18 13:14:00.867880: I tensorfl

Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Epoch 0:   0%|          | 0/7 [00:00<?, ?it/s] 
Epoch 1:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.38, train_loss_epoch=-1.18]
Epoch 2:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.15, train_loss_epoch=-1.54]
Epoch 3:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.75, train_loss_epoch=-1.52]
Epoch 4:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.37, train_loss_epoch=-1.50]
Epoch 5:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.92, train_loss_epoch=-1.60]
Epoch 6:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.29, train_loss_epoch=-1.57]
Epoch 7:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.71, train_loss_epoch=-1.64]
Epoch 8:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.34, train_loss_epoch=-1.59]
Epoch 9:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, trai

2024-11-18 13:14:27,911	INFO tensorboardx.py:308 -- Removed the following hyperparameter values when logging to tensorboard: {'hist_exog_list': ('DY', 'PTBV', 'P', 'PO', 'VO', 'PE'), 'loss': ('__ref_ph', 'de895953'), 'n_freq_downsample': (1, 1, 1), 'n_pool_kernel_size': (8, 4, 1), 'valid_loss': ('__ref_ph', '004b9a7a')}
[36m(_train_tune pid=9309)[0m `Trainer.fit` stopped: `max_steps=500.0` reached.


[36m(_train_tune pid=9309)[0m 
[36m(_train_tune pid=9309)[0m Validation DataLoader 0: 100%|██████████| 7/7 [00:02<00:00,  3.46it/s][A
[36m(_train_tune pid=9309)[0m                                                                       [AEpoch 71:   0%|          | 0/7 [00:02<?, ?it/s, v_num=0, train_loss_step=-1.71, train_loss_epoch=-1.62, valid_loss=-1.73] Epoch 71:   0%|          | 0/7 [00:02<?, ?it/s, v_num=0, train_loss_step=-1.71, train_loss_epoch=-1.66, valid_loss=-1.73]Epoch 71:   0%|          | 0/7 [00:02<?, ?it/s, v_num=0, train_loss_step=-1.71, train_loss_epoch=-1.66, valid_loss=-1.73]


[36m(_train_tune pid=9517)[0m /usr/local/lib/python3.10/dist-packages/ray/tune/integration/pytorch_lightning.py:198: `ray.tune.integration.pytorch_lightning.TuneReportCallback` is deprecated. Use `ray.tune.integration.pytorch_lightning.TuneReportCheckpointCallback` instead.
[36m(_train_tune pid=9517)[0m Seed set to 42
[36m(_train_tune pid=9517)[0m GPU available: True (cuda), used: True
[36m(_train_tune pid=9517)[0m TPU available: False, using: 0 TPU cores
[36m(_train_tune pid=9517)[0m HPU available: False, using: 0 HPUs
[36m(_train_tune pid=9517)[0m You are using a CUDA device ('NVIDIA A100-SXM4-40GB') that has Tensor Cores. To properly utilize them, you should set `torch.set_float32_matmul_precision('medium' | 'high')` which will trade-off precision for performance. For more details, read https://pytorch.org/docs/stable/generated/torch.set_float32_matmul_precision.html#torch.set_float32_matmul_precision
[36m(_train_tune pid=9517)[0m 2024-11-18 13:14:35.854054: I tensorfl

Sanity Checking: |          | 0/? [00:00<?, ?it/s]
Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Epoch 0:   0%|          | 0/7 [00:00<?, ?it/s] 
Epoch 1:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-0.786, train_loss_epoch=-0.273]
Epoch 2:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.45, train_loss_epoch=-1.01]
Epoch 3:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.52, train_loss_epoch=-1.17]
Epoch 4:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-0.869, train_loss_epoch=-1.16]
Epoch 5:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.58, train_loss_epoch=-1.33]
Epoch 6:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.19, train_loss_epoch=-1.34]
Epoch 7:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.27, train_loss_epoch=-1.38]
Epoch 8:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-0.951, train_loss_epoch=-1.26]
Epoch

[36m(_train_tune pid=9517)[0m `Trainer.fit` stopped: `max_steps=600.0` reached.
2024-11-18 13:15:08,097	INFO tensorboardx.py:308 -- Removed the following hyperparameter values when logging to tensorboard: {'hist_exog_list': ('DY', 'PTBV', 'P', 'PO', 'VO', 'PE'), 'loss': ('__ref_ph', 'de895953'), 'n_freq_downsample': (1, 1, 1), 'n_pool_kernel_size': (16, 8, 1), 'valid_loss': ('__ref_ph', '004b9a7a')}


[36m(_train_tune pid=9517)[0m 
[36m(_train_tune pid=9517)[0m Validation DataLoader 0: 100%|██████████| 7/7 [00:02<00:00,  3.39it/s][A
[36m(_train_tune pid=9517)[0m                                                                       [AEpoch 85:   0%|          | 0/7 [00:02<?, ?it/s, v_num=0, train_loss_step=-1.57, train_loss_epoch=-1.67, valid_loss=-1.64]Epoch 85:   0%|          | 0/7 [00:02<?, ?it/s, v_num=0, train_loss_step=-1.57, train_loss_epoch=-1.70, valid_loss=-1.64]Epoch 85:   0%|          | 0/7 [00:02<?, ?it/s, v_num=0, train_loss_step=-1.57, train_loss_epoch=-1.70, valid_loss=-1.64]


[36m(_train_tune pid=9743)[0m /usr/local/lib/python3.10/dist-packages/ray/tune/integration/pytorch_lightning.py:198: `ray.tune.integration.pytorch_lightning.TuneReportCallback` is deprecated. Use `ray.tune.integration.pytorch_lightning.TuneReportCheckpointCallback` instead.
[36m(_train_tune pid=9743)[0m Seed set to 42
[36m(_train_tune pid=9743)[0m GPU available: True (cuda), used: True
[36m(_train_tune pid=9743)[0m TPU available: False, using: 0 TPU cores
[36m(_train_tune pid=9743)[0m HPU available: False, using: 0 HPUs
[36m(_train_tune pid=9743)[0m You are using a CUDA device ('NVIDIA A100-SXM4-40GB') that has Tensor Cores. To properly utilize them, you should set `torch.set_float32_matmul_precision('medium' | 'high')` which will trade-off precision for performance. For more details, read https://pytorch.org/docs/stable/generated/torch.set_float32_matmul_precision.html#torch.set_float32_matmul_precision
[36m(_train_tune pid=9743)[0m 2024-11-18 13:15:15.871451: I tensorfl

Sanity Checking: |          | 0/? [00:00<?, ?it/s]
Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Epoch 0:   0%|          | 0/7 [00:00<?, ?it/s] 
Epoch 1:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.06, train_loss_epoch=1.490]
Epoch 2:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.05, train_loss_epoch=-1.54]
Epoch 3:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.82, train_loss_epoch=-1.55]
Epoch 4:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.60, train_loss_epoch=-1.59]
Epoch 5:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.17, train_loss_epoch=-1.68]
Epoch 6:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.61, train_loss_epoch=-1.67]
Epoch 7:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.70, train_loss_epoch=-1.67]
Epoch 8:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.47, train_loss_epoch=-1.66]
Epoch 9: 

[36m(_train_tune pid=9743)[0m `Trainer.fit` stopped: `max_steps=1200.0` reached.
2024-11-18 13:15:46,166	INFO tensorboardx.py:308 -- Removed the following hyperparameter values when logging to tensorboard: {'hist_exog_list': ('DY', 'PTBV', 'P', 'PO', 'VO', 'PE'), 'loss': ('__ref_ph', 'de895953'), 'n_freq_downsample': (180, 60, 1), 'n_pool_kernel_size': (4, 4, 4), 'valid_loss': ('__ref_ph', '004b9a7a')}


[36m(_train_tune pid=9743)[0m 
[36m(_train_tune pid=9743)[0m Validation DataLoader 0: 100%|██████████| 7/7 [00:00<00:00, 38.67it/s][A
[36m(_train_tune pid=9743)[0m                                                                       [AEpoch 171:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.95, train_loss_epoch=-1.97, valid_loss=-1.94]Epoch 171:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.95, train_loss_epoch=-1.95, valid_loss=-1.94]Epoch 171:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.95, train_loss_epoch=-1.95, valid_loss=-1.94]


[36m(_train_tune pid=9957)[0m /usr/local/lib/python3.10/dist-packages/ray/tune/integration/pytorch_lightning.py:198: `ray.tune.integration.pytorch_lightning.TuneReportCallback` is deprecated. Use `ray.tune.integration.pytorch_lightning.TuneReportCheckpointCallback` instead.
[36m(_train_tune pid=9957)[0m Seed set to 42
[36m(_train_tune pid=9957)[0m GPU available: True (cuda), used: True
[36m(_train_tune pid=9957)[0m TPU available: False, using: 0 TPU cores
[36m(_train_tune pid=9957)[0m HPU available: False, using: 0 HPUs
[36m(_train_tune pid=9957)[0m You are using a CUDA device ('NVIDIA A100-SXM4-40GB') that has Tensor Cores. To properly utilize them, you should set `torch.set_float32_matmul_precision('medium' | 'high')` which will trade-off precision for performance. For more details, read https://pytorch.org/docs/stable/generated/torch.set_float32_matmul_precision.html#torch.set_float32_matmul_precision
[36m(_train_tune pid=9957)[0m 2024-11-18 13:15:53.820142: I tensorfl

Sanity Checking: |          | 0/? [00:00<?, ?it/s]
Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Epoch 0:   0%|          | 0/4 [00:00<?, ?it/s] 
Epoch 1:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=14.20, train_loss_epoch=40.50]
Epoch 2:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=14.80, train_loss_epoch=15.30]
Epoch 3:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=16.50, train_loss_epoch=16.10]
Epoch 4:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=15.10, train_loss_epoch=15.90]
Epoch 5:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=16.30, train_loss_epoch=16.50]
Epoch 6:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=15.90, train_loss_epoch=15.80]
Epoch 7:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=32.50, train_loss_epoch=19.50]
Epoch 8:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=15.30, train_loss_epoch=15.80]
Epoch 9: 

2024-11-18 13:16:23,435	INFO tensorboardx.py:308 -- Removed the following hyperparameter values when logging to tensorboard: {'hist_exog_list': ('DY', 'PTBV', 'P', 'PO', 'VO', 'PE'), 'loss': ('__ref_ph', 'de895953'), 'n_freq_downsample': (180, 60, 1), 'n_pool_kernel_size': (2, 2, 2), 'valid_loss': ('__ref_ph', '004b9a7a')}
[36m(_train_tune pid=9957)[0m `Trainer.fit` stopped: `max_steps=900.0` reached.


[36m(_train_tune pid=9957)[0m 
[36m(_train_tune pid=9957)[0m Validation DataLoader 0: 100%|██████████| 4/4 [00:00<00:00, 27.65it/s][A
[36m(_train_tune pid=9957)[0m                                                                       [AEpoch 224: 100%|██████████| 4/4 [00:00<00:00, 14.61it/s, v_num=0, train_loss_step=9.380, train_loss_epoch=9.450, valid_loss=9.300]Epoch 224: 100%|██████████| 4/4 [00:00<00:00, 14.56it/s, v_num=0, train_loss_step=9.380, train_loss_epoch=9.600, valid_loss=9.300]Epoch 224: 100%|██████████| 4/4 [00:00<00:00, 14.51it/s, v_num=0, train_loss_step=9.380, train_loss_epoch=9.600, valid_loss=9.300]


[36m(_train_tune pid=10171)[0m /usr/local/lib/python3.10/dist-packages/ray/tune/integration/pytorch_lightning.py:198: `ray.tune.integration.pytorch_lightning.TuneReportCallback` is deprecated. Use `ray.tune.integration.pytorch_lightning.TuneReportCheckpointCallback` instead.
[36m(_train_tune pid=10171)[0m Seed set to 42
[36m(_train_tune pid=10171)[0m GPU available: True (cuda), used: True
[36m(_train_tune pid=10171)[0m TPU available: False, using: 0 TPU cores
[36m(_train_tune pid=10171)[0m HPU available: False, using: 0 HPUs
[36m(_train_tune pid=10171)[0m You are using a CUDA device ('NVIDIA A100-SXM4-40GB') that has Tensor Cores. To properly utilize them, you should set `torch.set_float32_matmul_precision('medium' | 'high')` which will trade-off precision for performance. For more details, read https://pytorch.org/docs/stable/generated/torch.set_float32_matmul_precision.html#torch.set_float32_matmul_precision
[36m(_train_tune pid=10171)[0m 2024-11-18 13:16:30.876847: I t

Sanity Checking: |          | 0/? [00:00<?, ?it/s]
Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Sanity Checking DataLoader 0: 100%|██████████| 2/2 [00:00<00:00,  2.25it/s]
                                                                           
Epoch 0:   0%|          | 0/4 [00:00<?, ?it/s] 
Epoch 1:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=18.50, train_loss_epoch=103.0]
Epoch 2:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=8.950, train_loss_epoch=11.20]
Epoch 3:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=8.080, train_loss_epoch=8.820]
Epoch 4:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=7.540, train_loss_epoch=8.050]
Epoch 5:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=7.290, train_loss_epoch=7.520]
Epoch 6:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=7.100, train_loss_epoch=7.160]
Epoch 7:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_l

2024-11-18 13:17:25,485	INFO tensorboardx.py:308 -- Removed the following hyperparameter values when logging to tensorboard: {'hist_exog_list': ('DY', 'PTBV', 'P', 'PO', 'VO', 'PE'), 'loss': ('__ref_ph', 'de895953'), 'n_freq_downsample': (1, 1, 1), 'n_pool_kernel_size': (1, 1, 1), 'valid_loss': ('__ref_ph', '004b9a7a')}


[36m(_train_tune pid=10171)[0m Epoch 374: 100%|██████████| 4/4 [00:00<00:00, 35.51it/s, v_num=0, train_loss_step=5.550, train_loss_epoch=5.150, valid_loss=5.320]Epoch 374: 100%|██████████| 4/4 [00:00<00:00, 35.18it/s, v_num=0, train_loss_step=5.300, train_loss_epoch=5.150, valid_loss=5.320]
[36m(_train_tune pid=10171)[0m Validation: |          | 0/? [00:00<?, ?it/s][A
[36m(_train_tune pid=10171)[0m Validation:   0%|          | 0/4 [00:00<?, ?it/s][A
[36m(_train_tune pid=10171)[0m Validation DataLoader 0:   0%|          | 0/4 [00:00<?, ?it/s][A


[36m(_train_tune pid=10171)[0m `Trainer.fit` stopped: `max_steps=1500.0` reached.


[36m(_train_tune pid=10171)[0m 
[36m(_train_tune pid=10171)[0m Validation DataLoader 0: 100%|██████████| 4/4 [00:00<00:00, 28.17it/s][A
[36m(_train_tune pid=10171)[0m                                                                       [AEpoch 374: 100%|██████████| 4/4 [00:00<00:00, 14.12it/s, v_num=0, train_loss_step=5.300, train_loss_epoch=5.150, valid_loss=5.280]Epoch 374: 100%|██████████| 4/4 [00:00<00:00, 14.07it/s, v_num=0, train_loss_step=5.300, train_loss_epoch=5.110, valid_loss=5.280]Epoch 374: 100%|██████████| 4/4 [00:00<00:00, 14.03it/s, v_num=0, train_loss_step=5.300, train_loss_epoch=5.110, valid_loss=5.280]


[36m(_train_tune pid=10489)[0m /usr/local/lib/python3.10/dist-packages/ray/tune/integration/pytorch_lightning.py:198: `ray.tune.integration.pytorch_lightning.TuneReportCallback` is deprecated. Use `ray.tune.integration.pytorch_lightning.TuneReportCheckpointCallback` instead.
[36m(_train_tune pid=10489)[0m Seed set to 42
[36m(_train_tune pid=10489)[0m GPU available: True (cuda), used: True
[36m(_train_tune pid=10489)[0m TPU available: False, using: 0 TPU cores
[36m(_train_tune pid=10489)[0m HPU available: False, using: 0 HPUs
[36m(_train_tune pid=10489)[0m You are using a CUDA device ('NVIDIA A100-SXM4-40GB') that has Tensor Cores. To properly utilize them, you should set `torch.set_float32_matmul_precision('medium' | 'high')` which will trade-off precision for performance. For more details, read https://pytorch.org/docs/stable/generated/torch.set_float32_matmul_precision.html#torch.set_float32_matmul_precision
[36m(_train_tune pid=10489)[0m 2024-11-18 13:17:32.768005: I t

[36m(_train_tune pid=10489)[0m Sanity Checking: |          | 0/? [00:00<?, ?it/s]
[36m(_train_tune pid=10489)[0m Sanity Checking:   0%|          | 0/2 [00:00<?, ?it/s]Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]


2024-11-18 13:17:36,812	ERROR tune_controller.py:1331 -- Trial task failed for trial _train_tune_423843ea
Traceback (most recent call last):
  File "/usr/local/lib/python3.10/dist-packages/ray/air/execution/_internal/event_manager.py", line 110, in resolve_future
    result = ray.get(future)
  File "/usr/local/lib/python3.10/dist-packages/ray/_private/auto_init_hook.py", line 21, in auto_init_wrapper
    return fn(*args, **kwargs)
  File "/usr/local/lib/python3.10/dist-packages/ray/_private/client_mode_hook.py", line 103, in wrapper
    return func(*args, **kwargs)
  File "/usr/local/lib/python3.10/dist-packages/ray/_private/worker.py", line 2753, in get
    values, debugger_breakpoint = worker.get_objects(object_refs, timeout=timeout)
  File "/usr/local/lib/python3.10/dist-packages/ray/_private/worker.py", line 904, in get_objects
    raise value.as_instanceof_cause()
ray.exceptions.RayTaskError(OutOfMemoryError): [36mray::ImplicitFunc.train()[39m (pid=10489, ip=172.28.0.12, actor_i


Trial _train_tune_423843ea errored after 0 iterations at 2024-11-18 13:17:36. Total running time: 13min 59s
Error file: /tmp/ray/session_2024-11-18_13-03-34_336407_4396/artifacts/2024-11-18_13-03-37/_train_tune_2024-11-18_13-03-34/driver_artifacts/_train_tune_423843ea_19_batch_size=256,h=20,hist_exog_list=DY_PTBV_P_PO_VO_PE,input_size=80,learning_rate=0.0000,loss=ref_ph_de895_2024-11-18_13-16-30/error.txt


[36m(_train_tune pid=10599)[0m /usr/local/lib/python3.10/dist-packages/ray/tune/integration/pytorch_lightning.py:198: `ray.tune.integration.pytorch_lightning.TuneReportCallback` is deprecated. Use `ray.tune.integration.pytorch_lightning.TuneReportCheckpointCallback` instead.
[36m(_train_tune pid=10599)[0m Seed set to 42
[36m(_train_tune pid=10599)[0m GPU available: True (cuda), used: True
[36m(_train_tune pid=10599)[0m TPU available: False, using: 0 TPU cores
[36m(_train_tune pid=10599)[0m HPU available: False, using: 0 HPUs
[36m(_train_tune pid=10599)[0m You are using a CUDA device ('NVIDIA A100-SXM4-40GB') that has Tensor Cores. To properly utilize them, you should set `torch.set_float32_matmul_precision('medium' | 'high')` which will trade-off precision for performance. For more details, read https://pytorch.org/docs/stable/generated/torch.set_float32_matmul_precision.html#torch.set_float32_matmul_precision
[36m(_train_tune pid=10599)[0m 2024-11-18 13:17:44.772396: I t

Sanity Checking: |          | 0/? [00:00<?, ?it/s]
Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Epoch 0:   0%|          | 0/7 [00:00<?, ?it/s] 
Epoch 1:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=9.320, train_loss_epoch=37.80]
Epoch 2:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=9.140, train_loss_epoch=9.960]
Epoch 3:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=10.10, train_loss_epoch=10.20]
Epoch 4:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=9.240, train_loss_epoch=9.970]
Epoch 5:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=9.880, train_loss_epoch=10.20]
Epoch 6:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=10.10, train_loss_epoch=10.00]
Epoch 7:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=9.820, train_loss_epoch=9.960]
Epoch 8:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=9.520, train_loss_epoch=9.890]
Epoch 9: 

2024-11-18 13:18:15,044	INFO tensorboardx.py:308 -- Removed the following hyperparameter values when logging to tensorboard: {'hist_exog_list': ('DY', 'PTBV', 'P', 'PO', 'VO', 'PE'), 'loss': ('__ref_ph', 'de895953'), 'n_freq_downsample': (1, 1, 1), 'n_pool_kernel_size': (2, 2, 1), 'valid_loss': ('__ref_ph', '004b9a7a')}
[36m(_train_tune pid=10599)[0m `Trainer.fit` stopped: `max_steps=1200.0` reached.


[36m(_train_tune pid=10599)[0m 
[36m(_train_tune pid=10599)[0m Validation DataLoader 0: 100%|██████████| 7/7 [00:00<00:00, 40.46it/s][A
[36m(_train_tune pid=10599)[0m                                                                       [AEpoch 171:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.09, train_loss_epoch=-1.11, valid_loss=-1.18]Epoch 171:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.09, train_loss_epoch=-1.14, valid_loss=-1.18]Epoch 171:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.09, train_loss_epoch=-1.14, valid_loss=-1.18]


[36m(_train_tune pid=10819)[0m /usr/local/lib/python3.10/dist-packages/ray/tune/integration/pytorch_lightning.py:198: `ray.tune.integration.pytorch_lightning.TuneReportCallback` is deprecated. Use `ray.tune.integration.pytorch_lightning.TuneReportCheckpointCallback` instead.
[36m(_train_tune pid=10819)[0m Seed set to 42
[36m(_train_tune pid=10819)[0m GPU available: True (cuda), used: True
[36m(_train_tune pid=10819)[0m TPU available: False, using: 0 TPU cores
[36m(_train_tune pid=10819)[0m HPU available: False, using: 0 HPUs
[36m(_train_tune pid=10819)[0m You are using a CUDA device ('NVIDIA A100-SXM4-40GB') that has Tensor Cores. To properly utilize them, you should set `torch.set_float32_matmul_precision('medium' | 'high')` which will trade-off precision for performance. For more details, read https://pytorch.org/docs/stable/generated/torch.set_float32_matmul_precision.html#torch.set_float32_matmul_precision
[36m(_train_tune pid=10819)[0m 2024-11-18 13:18:22.866769: I t

Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Epoch 0:   0%|          | 0/7 [00:00<?, ?it/s] 
Epoch 1:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.27, train_loss_epoch=-1.36]
Epoch 2:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.94, train_loss_epoch=-1.43]
Epoch 3:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.58, train_loss_epoch=-1.37]
Epoch 4:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.30, train_loss_epoch=-1.38]
Epoch 5:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.75, train_loss_epoch=-1.44]
Epoch 6:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.23, train_loss_epoch=-1.37]
Epoch 7:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.45, train_loss_epoch=-1.37]
Epoch 8:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.22, train_loss_epoch=-1.39]
Epoch 9:   0%|          | 0/7 [00:00<?, ?it/s, v_num=0, trai

[36m(_train_tune pid=10819)[0m `Trainer.fit` stopped: `max_steps=1400.0` reached.
2024-11-18 13:19:33,249	INFO tensorboardx.py:308 -- Removed the following hyperparameter values when logging to tensorboard: {'hist_exog_list': ('DY', 'PTBV', 'P', 'PO', 'VO', 'PE'), 'loss': ('__ref_ph', 'de895953'), 'n_freq_downsample': (1, 1, 1), 'n_pool_kernel_size': (2, 2, 2), 'valid_loss': ('__ref_ph', '004b9a7a')}


[36m(_train_tune pid=10819)[0m 
[36m(_train_tune pid=10819)[0m Validation DataLoader 0: 100%|██████████| 7/7 [00:02<00:00,  3.43it/s][A
[36m(_train_tune pid=10819)[0m                                                                       [AEpoch 199: 100%|██████████| 7/7 [00:02<00:00,  3.12it/s, v_num=0, train_loss_step=-1.72, train_loss_epoch=-1.94, valid_loss=-1.88]Epoch 199: 100%|██████████| 7/7 [00:02<00:00,  3.12it/s, v_num=0, train_loss_step=-1.72, train_loss_epoch=-1.85, valid_loss=-1.88]Epoch 199: 100%|██████████| 7/7 [00:02<00:00,  3.12it/s, v_num=0, train_loss_step=-1.72, train_loss_epoch=-1.85, valid_loss=-1.88]


[36m(_train_tune pid=11207)[0m /usr/local/lib/python3.10/dist-packages/ray/tune/integration/pytorch_lightning.py:198: `ray.tune.integration.pytorch_lightning.TuneReportCallback` is deprecated. Use `ray.tune.integration.pytorch_lightning.TuneReportCheckpointCallback` instead.
[36m(_train_tune pid=11207)[0m Seed set to 42
[36m(_train_tune pid=11207)[0m GPU available: True (cuda), used: True
[36m(_train_tune pid=11207)[0m TPU available: False, using: 0 TPU cores
[36m(_train_tune pid=11207)[0m HPU available: False, using: 0 HPUs
[36m(_train_tune pid=11207)[0m You are using a CUDA device ('NVIDIA A100-SXM4-40GB') that has Tensor Cores. To properly utilize them, you should set `torch.set_float32_matmul_precision('medium' | 'high')` which will trade-off precision for performance. For more details, read https://pytorch.org/docs/stable/generated/torch.set_float32_matmul_precision.html#torch.set_float32_matmul_precision
[36m(_train_tune pid=11207)[0m 2024-11-18 13:19:40.817861: I t

Sanity Checking: |          | 0/? [00:00<?, ?it/s]
Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Epoch 0:   0%|          | 0/4 [00:00<?, ?it/s] 
Epoch 1:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.10, train_loss_epoch=-0.753]
Epoch 2:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.98, train_loss_epoch=-1.36]
Epoch 3:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.67, train_loss_epoch=-1.47]
Epoch 4:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.36, train_loss_epoch=-1.46]
Epoch 5:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.84, train_loss_epoch=-1.58]
Epoch 6:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.34, train_loss_epoch=-1.48]
Epoch 7:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.70, train_loss_epoch=-1.63]
Epoch 8:   0%|          | 0/4 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.28, train_loss_epoch=-1.51]
Epoch 9:

2024-11-18 13:20:53,011	INFO tensorboardx.py:308 -- Removed the following hyperparameter values when logging to tensorboard: {'hist_exog_list': ('DY', 'PTBV', 'P', 'PO', 'VO', 'PE'), 'loss': ('__ref_ph', 'de895953'), 'n_freq_downsample': (24, 12, 1), 'n_pool_kernel_size': (16, 8, 1), 'valid_loss': ('__ref_ph', '004b9a7a')}
[36m(_train_tune pid=11207)[0m `Trainer.fit` stopped: `max_steps=1200.0` reached.


[36m(_train_tune pid=11207)[0m 
[36m(_train_tune pid=11207)[0m Validation DataLoader 0: 100%|██████████| 4/4 [00:01<00:00,  2.14it/s][A
[36m(_train_tune pid=11207)[0m                                                                       [AEpoch 299: 100%|██████████| 4/4 [00:02<00:00,  1.96it/s, v_num=0, train_loss_step=-1.80, train_loss_epoch=-1.74, valid_loss=-1.76]Epoch 299: 100%|██████████| 4/4 [00:02<00:00,  1.96it/s, v_num=0, train_loss_step=-1.80, train_loss_epoch=-1.80, valid_loss=-1.76]Epoch 299: 100%|██████████| 4/4 [00:02<00:00,  1.96it/s, v_num=0, train_loss_step=-1.80, train_loss_epoch=-1.80, valid_loss=-1.76]


[36m(_train_tune pid=11597)[0m /usr/local/lib/python3.10/dist-packages/ray/tune/integration/pytorch_lightning.py:198: `ray.tune.integration.pytorch_lightning.TuneReportCallback` is deprecated. Use `ray.tune.integration.pytorch_lightning.TuneReportCheckpointCallback` instead.
[36m(_train_tune pid=11597)[0m Seed set to 42
[36m(_train_tune pid=11597)[0m GPU available: True (cuda), used: True
[36m(_train_tune pid=11597)[0m TPU available: False, using: 0 TPU cores
[36m(_train_tune pid=11597)[0m HPU available: False, using: 0 HPUs
[36m(_train_tune pid=11597)[0m You are using a CUDA device ('NVIDIA A100-SXM4-40GB') that has Tensor Cores. To properly utilize them, you should set `torch.set_float32_matmul_precision('medium' | 'high')` which will trade-off precision for performance. For more details, read https://pytorch.org/docs/stable/generated/torch.set_float32_matmul_precision.html#torch.set_float32_matmul_precision
[36m(_train_tune pid=11597)[0m 2024-11-18 13:21:00.835196: I t

Sanity Checking: |          | 0/? [00:00<?, ?it/s]
Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Epoch 0:   0%|          | 0/13 [00:00<?, ?it/s] 
Epoch 1:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.47, train_loss_epoch=4.020]
Epoch 2:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.12, train_loss_epoch=-1.59]
Epoch 3:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.96, train_loss_epoch=-1.66]
Epoch 4:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.57, train_loss_epoch=-1.69]
Epoch 5:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.01, train_loss_epoch=-1.75]
Epoch 6:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.65, train_loss_epoch=-1.75]
Epoch 7:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.86, train_loss_epoch=-1.78]
[36m(_train_tune pid=11597)[0m 
Validation: |          | 0/? [00:00<?, ?it/s][A
Validation:   0%|    

2024-11-18 13:21:23,201	INFO tensorboardx.py:308 -- Removed the following hyperparameter values when logging to tensorboard: {'hist_exog_list': ('DY', 'PTBV', 'P', 'PO', 'VO', 'PE'), 'loss': ('__ref_ph', 'de895953'), 'n_freq_downsample': (60, 8, 1), 'n_pool_kernel_size': (8, 4, 1), 'valid_loss': ('__ref_ph', '004b9a7a')}


[36m(_train_tune pid=11597)[0m 
[36m(_train_tune pid=11597)[0m Validation: |          | 0/? [00:00<?, ?it/s][A
[36m(_train_tune pid=11597)[0m Validation:   0%|          | 0/13 [00:00<?, ?it/s][A
[36m(_train_tune pid=11597)[0m Validation DataLoader 0:   0%|          | 0/13 [00:00<?, ?it/s][A


[36m(_train_tune pid=11597)[0m `Trainer.fit` stopped: `max_steps=1000.0` reached.


[36m(_train_tune pid=11597)[0m 
[36m(_train_tune pid=11597)[0m Validation DataLoader 0: 100%|██████████| 13/13 [00:00<00:00, 66.99it/s][A
[36m(_train_tune pid=11597)[0m                                                                         [AEpoch 76:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.93, train_loss_epoch=-1.85, valid_loss=-1.82]Epoch 76:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.93, train_loss_epoch=-1.84, valid_loss=-1.82]Epoch 76:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.93, train_loss_epoch=-1.84, valid_loss=-1.82]


[36m(_train_tune pid=11782)[0m /usr/local/lib/python3.10/dist-packages/ray/tune/integration/pytorch_lightning.py:198: `ray.tune.integration.pytorch_lightning.TuneReportCallback` is deprecated. Use `ray.tune.integration.pytorch_lightning.TuneReportCheckpointCallback` instead.
[36m(_train_tune pid=11782)[0m Seed set to 42
[36m(_train_tune pid=11782)[0m GPU available: True (cuda), used: True
[36m(_train_tune pid=11782)[0m TPU available: False, using: 0 TPU cores
[36m(_train_tune pid=11782)[0m HPU available: False, using: 0 HPUs
[36m(_train_tune pid=11782)[0m You are using a CUDA device ('NVIDIA A100-SXM4-40GB') that has Tensor Cores. To properly utilize them, you should set `torch.set_float32_matmul_precision('medium' | 'high')` which will trade-off precision for performance. For more details, read https://pytorch.org/docs/stable/generated/torch.set_float32_matmul_precision.html#torch.set_float32_matmul_precision
[36m(_train_tune pid=11782)[0m 2024-11-18 13:21:30.829160: I t

Sanity Checking: |          | 0/? [00:00<?, ?it/s]
Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
                                                                           
Epoch 0:   0%|          | 0/13 [00:00<?, ?it/s] 
Epoch 1:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-0.663, train_loss_epoch=0.338]
Epoch 2:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.13, train_loss_epoch=-1.28]
Epoch 3:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.91, train_loss_epoch=-1.53]
Epoch 4:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.57, train_loss_epoch=-1.68]
Epoch 5:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.98, train_loss_epoch=-1.74]
Epoch 6:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.64, train_loss_epoch=-1.72]
Epoch 7:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.89, train_loss_epoch=-1.81]
[36m(_train_tune pid=11782

2024-11-18 13:21:49,511	INFO tensorboardx.py:308 -- Removed the following hyperparameter values when logging to tensorboard: {'hist_exog_list': ('DY', 'PTBV', 'P', 'PO', 'VO', 'PE'), 'loss': ('__ref_ph', 'de895953'), 'n_freq_downsample': (60, 8, 1), 'n_pool_kernel_size': (4, 4, 4), 'valid_loss': ('__ref_ph', '004b9a7a')}
[36m(_train_tune pid=11782)[0m `Trainer.fit` stopped: `max_steps=800.0` reached.


[36m(_train_tune pid=11782)[0m 
[36m(_train_tune pid=11782)[0m Validation DataLoader 0: 100%|██████████| 13/13 [00:00<00:00, 65.98it/s][A
[36m(_train_tune pid=11782)[0m                                                                         [AEpoch 61:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.00, train_loss_epoch=-2.01, valid_loss=-1.92]Epoch 61:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.00, train_loss_epoch=-2.01, valid_loss=-1.92]Epoch 61:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.00, train_loss_epoch=-2.01, valid_loss=-1.92]


[36m(_train_tune pid=11951)[0m /usr/local/lib/python3.10/dist-packages/ray/tune/integration/pytorch_lightning.py:198: `ray.tune.integration.pytorch_lightning.TuneReportCallback` is deprecated. Use `ray.tune.integration.pytorch_lightning.TuneReportCheckpointCallback` instead.
[36m(_train_tune pid=11951)[0m Seed set to 42
[36m(_train_tune pid=11951)[0m GPU available: True (cuda), used: True
[36m(_train_tune pid=11951)[0m TPU available: False, using: 0 TPU cores
[36m(_train_tune pid=11951)[0m HPU available: False, using: 0 HPUs
[36m(_train_tune pid=11951)[0m You are using a CUDA device ('NVIDIA A100-SXM4-40GB') that has Tensor Cores. To properly utilize them, you should set `torch.set_float32_matmul_precision('medium' | 'high')` which will trade-off precision for performance. For more details, read https://pytorch.org/docs/stable/generated/torch.set_float32_matmul_precision.html#torch.set_float32_matmul_precision
[36m(_train_tune pid=11951)[0m 2024-11-18 13:21:56.858499: I t

Sanity Checking: |          | 0/? [00:00<?, ?it/s]
Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Epoch 0:   0%|          | 0/13 [00:00<?, ?it/s] 
Epoch 1:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.47, train_loss_epoch=2.500]
Epoch 2:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.15, train_loss_epoch=-1.62]
Epoch 3:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.84, train_loss_epoch=-1.63]
Epoch 4:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.65, train_loss_epoch=-1.64]
Epoch 5:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.06, train_loss_epoch=-1.68]
Epoch 6:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.68, train_loss_epoch=-1.66]
Epoch 7:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.73, train_loss_epoch=-1.68]
[36m(_train_tune pid=11951)[0m 
Validation: |          | 0/? [00:00<?, ?it/s][A
Validation:   0%|    

[36m(_train_tune pid=11951)[0m `Trainer.fit` stopped: `max_steps=1000.0` reached.
2024-11-18 13:22:18,863	INFO tensorboardx.py:308 -- Removed the following hyperparameter values when logging to tensorboard: {'hist_exog_list': ('DY', 'PTBV', 'P', 'PO', 'VO', 'PE'), 'loss': ('__ref_ph', 'de895953'), 'n_freq_downsample': (60, 8, 1), 'n_pool_kernel_size': (8, 4, 1), 'valid_loss': ('__ref_ph', '004b9a7a')}


[36m(_train_tune pid=11951)[0m 
[36m(_train_tune pid=11951)[0m Validation: |          | 0/? [00:00<?, ?it/s][A
[36m(_train_tune pid=11951)[0m Validation:   0%|          | 0/13 [00:00<?, ?it/s][A
[36m(_train_tune pid=11951)[0m Validation DataLoader 0:   0%|          | 0/13 [00:00<?, ?it/s][A
[36m(_train_tune pid=11951)[0m 
[36m(_train_tune pid=11951)[0m Validation DataLoader 0: 100%|██████████| 13/13 [00:00<00:00, 67.19it/s][A
[36m(_train_tune pid=11951)[0m 
[36m(_train_tune pid=11951)[0m                                                                         [AEpoch 76:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.78, train_loss_epoch=-1.88, valid_loss=-1.82]Epoch 76:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.78, train_loss_epoch=-1.83, valid_loss=-1.82]
[36m(_train_tune pid=11951)[0m Epoch 76:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.78, train_loss_epoch=-1.83, valid_loss=-1.82]


[36m(_train_tune pid=12136)[0m /usr/local/lib/python3.10/dist-packages/ray/tune/integration/pytorch_lightning.py:198: `ray.tune.integration.pytorch_lightning.TuneReportCallback` is deprecated. Use `ray.tune.integration.pytorch_lightning.TuneReportCheckpointCallback` instead.
[36m(_train_tune pid=12136)[0m Seed set to 42
[36m(_train_tune pid=12136)[0m GPU available: True (cuda), used: True
[36m(_train_tune pid=12136)[0m TPU available: False, using: 0 TPU cores
[36m(_train_tune pid=12136)[0m HPU available: False, using: 0 HPUs
[36m(_train_tune pid=12136)[0m You are using a CUDA device ('NVIDIA A100-SXM4-40GB') that has Tensor Cores. To properly utilize them, you should set `torch.set_float32_matmul_precision('medium' | 'high')` which will trade-off precision for performance. For more details, read https://pytorch.org/docs/stable/generated/torch.set_float32_matmul_precision.html#torch.set_float32_matmul_precision
[36m(_train_tune pid=12136)[0m 2024-11-18 13:22:26.952896: I t

Sanity Checking: |          | 0/? [00:00<?, ?it/s]
Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Epoch 0:   0%|          | 0/2 [00:00<?, ?it/s] 
Epoch 1:   0%|          | 0/2 [00:00<?, ?it/s, v_num=0, train_loss_step=2.310, train_loss_epoch=0.496]
Epoch 2:   0%|          | 0/2 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.14, train_loss_epoch=-0.557]
Epoch 3:   0%|          | 0/2 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.10, train_loss_epoch=-1.20]
Epoch 4:   0%|          | 0/2 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.43, train_loss_epoch=-1.35]
Epoch 5:   0%|          | 0/2 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.40, train_loss_epoch=-1.34]
Epoch 6:   0%|          | 0/2 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.50, train_loss_epoch=-1.46]
Epoch 7:   0%|          | 0/2 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.51, train_loss_epoch=-1.52]
Epoch 8:   0%|          | 0/2 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.63, train_loss_epoch=-1.56]
Epoch 9:

2024-11-18 13:23:20,719	INFO tensorboardx.py:308 -- Removed the following hyperparameter values when logging to tensorboard: {'hist_exog_list': ('DY', 'PTBV', 'P', 'PO', 'VO', 'PE'), 'loss': ('__ref_ph', 'de895953'), 'n_freq_downsample': (180, 60, 1), 'n_pool_kernel_size': (4, 4, 4), 'valid_loss': ('__ref_ph', '004b9a7a')}


[36m(_train_tune pid=12136)[0m Epoch 449: 100%|██████████| 2/2 [00:00<00:00, 19.09it/s, v_num=0, train_loss_step=-2.06, train_loss_epoch=-2.04, valid_loss=-1.89]Epoch 449: 100%|██████████| 2/2 [00:00<00:00, 19.01it/s, v_num=0, train_loss_step=-2.05, train_loss_epoch=-2.04, valid_loss=-1.89]
[36m(_train_tune pid=12136)[0m Validation: |          | 0/? [00:00<?, ?it/s][A
[36m(_train_tune pid=12136)[0m Validation:   0%|          | 0/2 [00:00<?, ?it/s][A
[36m(_train_tune pid=12136)[0m Validation DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s][A
[36m(_train_tune pid=12136)[0m 
[36m(_train_tune pid=12136)[0m Validation DataLoader 0: 100%|██████████| 2/2 [00:00<00:00, 15.89it/s][A


[36m(_train_tune pid=12136)[0m `Trainer.fit` stopped: `max_steps=900.0` reached.


[36m(_train_tune pid=12136)[0m 
[36m(_train_tune pid=12136)[0m                                                                       [AEpoch 449: 100%|██████████| 2/2 [00:00<00:00,  6.77it/s, v_num=0, train_loss_step=-2.05, train_loss_epoch=-2.04, valid_loss=-1.90]Epoch 449: 100%|██████████| 2/2 [00:00<00:00,  6.74it/s, v_num=0, train_loss_step=-2.05, train_loss_epoch=-2.00, valid_loss=-1.90]Epoch 449: 100%|██████████| 2/2 [00:00<00:00,  6.72it/s, v_num=0, train_loss_step=-2.05, train_loss_epoch=-2.00, valid_loss=-1.90]


[36m(_train_tune pid=12455)[0m /usr/local/lib/python3.10/dist-packages/ray/tune/integration/pytorch_lightning.py:198: `ray.tune.integration.pytorch_lightning.TuneReportCallback` is deprecated. Use `ray.tune.integration.pytorch_lightning.TuneReportCheckpointCallback` instead.
[36m(_train_tune pid=12455)[0m Seed set to 42
[36m(_train_tune pid=12455)[0m GPU available: True (cuda), used: True
[36m(_train_tune pid=12455)[0m TPU available: False, using: 0 TPU cores
[36m(_train_tune pid=12455)[0m HPU available: False, using: 0 HPUs
[36m(_train_tune pid=12455)[0m You are using a CUDA device ('NVIDIA A100-SXM4-40GB') that has Tensor Cores. To properly utilize them, you should set `torch.set_float32_matmul_precision('medium' | 'high')` which will trade-off precision for performance. For more details, read https://pytorch.org/docs/stable/generated/torch.set_float32_matmul_precision.html#torch.set_float32_matmul_precision
[36m(_train_tune pid=12455)[0m 2024-11-18 13:23:28.979889: I t

Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Epoch 0:   0%|          | 0/13 [00:00<?, ?it/s] 
Epoch 1:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.44, train_loss_epoch=-0.979]
Epoch 2:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.21, train_loss_epoch=-1.64]
Epoch 3:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.03, train_loss_epoch=-1.69]
Epoch 4:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.63, train_loss_epoch=-1.68]
Epoch 5:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.11, train_loss_epoch=-1.79]
Epoch 6:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.78, train_loss_epoch=-1.82]
Epoch 7:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.87, train_loss_epoch=-1.80]
[36m(_train_tune pid=12455)[0m 
Validation: |          | 0/? [00:00<?, ?it/s][A
Validation:   0%|          | 0/13 [00:00<?, ?it/s][A
Validation DataLo

2024-11-18 13:23:52,824	INFO tensorboardx.py:308 -- Removed the following hyperparameter values when logging to tensorboard: {'hist_exog_list': ('DY', 'PTBV', 'P', 'PO', 'VO', 'PE'), 'loss': ('__ref_ph', 'de895953'), 'n_freq_downsample': (60, 8, 1), 'n_pool_kernel_size': (4, 4, 4), 'valid_loss': ('__ref_ph', '004b9a7a')}
[36m(_train_tune pid=12455)[0m `Trainer.fit` stopped: `max_steps=1100.0` reached.


[36m(_train_tune pid=12455)[0m 
[36m(_train_tune pid=12455)[0m Validation DataLoader 0: 100%|██████████| 13/13 [00:00<00:00, 66.34it/s][A
[36m(_train_tune pid=12455)[0m                                                                         [AEpoch 84:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.77, train_loss_epoch=-1.96, valid_loss=-1.93]Epoch 84:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.77, train_loss_epoch=-1.95, valid_loss=-1.93]Epoch 84:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.77, train_loss_epoch=-1.95, valid_loss=-1.93]


[36m(_train_tune pid=12648)[0m /usr/local/lib/python3.10/dist-packages/ray/tune/integration/pytorch_lightning.py:198: `ray.tune.integration.pytorch_lightning.TuneReportCallback` is deprecated. Use `ray.tune.integration.pytorch_lightning.TuneReportCheckpointCallback` instead.
[36m(_train_tune pid=12648)[0m Seed set to 42
[36m(_train_tune pid=12648)[0m GPU available: True (cuda), used: True
[36m(_train_tune pid=12648)[0m TPU available: False, using: 0 TPU cores
[36m(_train_tune pid=12648)[0m HPU available: False, using: 0 HPUs
[36m(_train_tune pid=12648)[0m You are using a CUDA device ('NVIDIA A100-SXM4-40GB') that has Tensor Cores. To properly utilize them, you should set `torch.set_float32_matmul_precision('medium' | 'high')` which will trade-off precision for performance. For more details, read https://pytorch.org/docs/stable/generated/torch.set_float32_matmul_precision.html#torch.set_float32_matmul_precision
[36m(_train_tune pid=12648)[0m 2024-11-18 13:24:00.908263: I t

Sanity Checking: |          | 0/? [00:00<?, ?it/s]
Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Epoch 0:   0%|          | 0/13 [00:00<?, ?it/s] 
Epoch 1:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-0.663, train_loss_epoch=0.338]
Epoch 2:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.13, train_loss_epoch=-1.28]
Epoch 3:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.91, train_loss_epoch=-1.53]
Epoch 4:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.57, train_loss_epoch=-1.68]
Epoch 5:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.98, train_loss_epoch=-1.74]
Epoch 6:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.64, train_loss_epoch=-1.72]
Epoch 7:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.89, train_loss_epoch=-1.81]
[36m(_train_tune pid=12648)[0m 
Validation: |          | 0/? [00:00<?, ?it/s][A
Validation:   0%|   

2024-11-18 13:24:19,278	INFO tensorboardx.py:308 -- Removed the following hyperparameter values when logging to tensorboard: {'hist_exog_list': ('DY', 'PTBV', 'P', 'PO', 'VO', 'PE'), 'loss': ('__ref_ph', 'de895953'), 'n_freq_downsample': (60, 8, 1), 'n_pool_kernel_size': (4, 4, 4), 'valid_loss': ('__ref_ph', '004b9a7a')}
[36m(_train_tune pid=12648)[0m `Trainer.fit` stopped: `max_steps=800.0` reached.


[36m(_train_tune pid=12648)[0m 
[36m(_train_tune pid=12648)[0m Validation DataLoader 0: 100%|██████████| 13/13 [00:00<00:00, 64.95it/s][A
[36m(_train_tune pid=12648)[0m                                                                         [AEpoch 61:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.00, train_loss_epoch=-2.01, valid_loss=-1.92]Epoch 61:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.00, train_loss_epoch=-2.01, valid_loss=-1.92]Epoch 61:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.00, train_loss_epoch=-2.01, valid_loss=-1.92]


[36m(_train_tune pid=12817)[0m /usr/local/lib/python3.10/dist-packages/ray/tune/integration/pytorch_lightning.py:198: `ray.tune.integration.pytorch_lightning.TuneReportCallback` is deprecated. Use `ray.tune.integration.pytorch_lightning.TuneReportCheckpointCallback` instead.
[36m(_train_tune pid=12817)[0m Seed set to 42
[36m(_train_tune pid=12817)[0m GPU available: True (cuda), used: True
[36m(_train_tune pid=12817)[0m TPU available: False, using: 0 TPU cores
[36m(_train_tune pid=12817)[0m HPU available: False, using: 0 HPUs
[36m(_train_tune pid=12817)[0m You are using a CUDA device ('NVIDIA A100-SXM4-40GB') that has Tensor Cores. To properly utilize them, you should set `torch.set_float32_matmul_precision('medium' | 'high')` which will trade-off precision for performance. For more details, read https://pytorch.org/docs/stable/generated/torch.set_float32_matmul_precision.html#torch.set_float32_matmul_precision
[36m(_train_tune pid=12817)[0m 2024-11-18 13:24:26.907458: I t

Sanity Checking: |          | 0/? [00:00<?, ?it/s]
Sanity Checking:   0%|          | 0/2 [00:00<?, ?it/s]
Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Epoch 0:   0%|          | 0/2 [00:00<?, ?it/s] 
Epoch 1:   0%|          | 0/2 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.32, train_loss_epoch=-1.31]
Epoch 2:   0%|          | 0/2 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.59, train_loss_epoch=-1.53]
Epoch 3:   0%|          | 0/2 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.55, train_loss_epoch=-1.48]
Epoch 4:   0%|          | 0/2 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.51, train_loss_epoch=-1.53]
Epoch 5:   0%|          | 0/2 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.63, train_loss_epoch=-1.60]
Epoch 6:   0%|          | 0/2 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.68, train_loss_epoch=-1.67]
Epoch 7:   0%|          | 0/2 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.79, train_loss_epoch=-1.71]
Epoch 8:   0%|          | 0/2 [00:00<?, ?it/s, v_num=0, t

[36m(_train_tune pid=12817)[0m `Trainer.fit` stopped: `max_steps=1300.0` reached.
2024-11-18 13:25:43,875	INFO tensorboardx.py:308 -- Removed the following hyperparameter values when logging to tensorboard: {'hist_exog_list': ('DY', 'PTBV', 'P', 'PO', 'VO', 'PE'), 'loss': ('__ref_ph', 'de895953'), 'n_freq_downsample': (180, 60, 1), 'n_pool_kernel_size': (4, 4, 4), 'valid_loss': ('__ref_ph', '004b9a7a')}


[36m(_train_tune pid=12817)[0m Epoch 649: 100%|██████████| 2/2 [00:00<00:00, 18.90it/s, v_num=0, train_loss_step=-2.22, train_loss_epoch=-2.22, valid_loss=-1.92]Epoch 649: 100%|██████████| 2/2 [00:00<00:00, 18.83it/s, v_num=0, train_loss_step=-2.21, train_loss_epoch=-2.22, valid_loss=-1.92]
[36m(_train_tune pid=12817)[0m Validation: |          | 0/? [00:00<?, ?it/s][A
[36m(_train_tune pid=12817)[0m Validation:   0%|          | 0/2 [00:00<?, ?it/s][A
[36m(_train_tune pid=12817)[0m Validation DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s][A
[36m(_train_tune pid=12817)[0m 
[36m(_train_tune pid=12817)[0m Validation DataLoader 0: 100%|██████████| 2/2 [00:00<00:00, 16.02it/s][A
[36m(_train_tune pid=12817)[0m                                                                       [AEpoch 649: 100%|██████████| 2/2 [00:00<00:00,  6.78it/s, v_num=0, train_loss_step=-2.21, train_loss_epoch=-2.22, valid_loss=-1.93]Epoch 649: 100%|██████████| 2/2 [00:00<00:00,  6.76it

[36m(_train_tune pid=13227)[0m /usr/local/lib/python3.10/dist-packages/ray/tune/integration/pytorch_lightning.py:198: `ray.tune.integration.pytorch_lightning.TuneReportCallback` is deprecated. Use `ray.tune.integration.pytorch_lightning.TuneReportCheckpointCallback` instead.
[36m(_train_tune pid=13227)[0m Seed set to 42
[36m(_train_tune pid=13227)[0m GPU available: True (cuda), used: True
[36m(_train_tune pid=13227)[0m TPU available: False, using: 0 TPU cores
[36m(_train_tune pid=13227)[0m HPU available: False, using: 0 HPUs
[36m(_train_tune pid=13227)[0m You are using a CUDA device ('NVIDIA A100-SXM4-40GB') that has Tensor Cores. To properly utilize them, you should set `torch.set_float32_matmul_precision('medium' | 'high')` which will trade-off precision for performance. For more details, read https://pytorch.org/docs/stable/generated/torch.set_float32_matmul_precision.html#torch.set_float32_matmul_precision
[36m(_train_tune pid=13227)[0m 2024-11-18 13:25:51.941613: I t

Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Epoch 0:   0%|          | 0/13 [00:00<?, ?it/s] 
Epoch 1:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.60, train_loss_epoch=-1.58]
Epoch 2:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.37, train_loss_epoch=-1.75]
Epoch 3:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.20, train_loss_epoch=-1.79]
Epoch 4:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.66, train_loss_epoch=-1.80]
Epoch 5:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-2.15, train_loss_epoch=-1.87]
Epoch 6:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.81, train_loss_epoch=-1.83]
Epoch 7:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.87, train_loss_epoch=-1.85]
[36m(_train_tune pid=13227)[0m 
Validation: |          | 0/? [00:00<?, ?it/s][A
Validation:   0%|          | 0/13 [00:00<?, ?it/s][A
Validation DataLoa

2024-11-18 13:26:15,947	INFO tensorboardx.py:308 -- Removed the following hyperparameter values when logging to tensorboard: {'hist_exog_list': ('DY', 'PTBV', 'P', 'PO', 'VO', 'PE'), 'loss': ('__ref_ph', 'de895953'), 'n_freq_downsample': (60, 8, 1), 'n_pool_kernel_size': (4, 4, 4), 'valid_loss': ('__ref_ph', '004b9a7a')}
2024-11-18 13:26:15,970	INFO tune.py:1009 -- Wrote the latest version of all result files and experiment state to '/root/ray_results/_train_tune_2024-11-18_13-03-34' in 0.0192s.
2024-11-18 13:26:15,973	ERROR tune.py:1037 -- Trials did not complete: [_train_tune_a76ac303, _train_tune_423843ea]


[36m(_train_tune pid=13227)[0m 
[36m(_train_tune pid=13227)[0m Validation: |          | 0/? [00:00<?, ?it/s][A
[36m(_train_tune pid=13227)[0m Validation:   0%|          | 0/13 [00:00<?, ?it/s][A
[36m(_train_tune pid=13227)[0m Validation DataLoader 0:   0%|          | 0/13 [00:00<?, ?it/s][A



[36m(_train_tune pid=13227)[0m `Trainer.fit` stopped: `max_steps=1100.0` reached.
INFO:lightning_fabric.utilities.seed:Seed set to 42
INFO:pytorch_lightning.utilities.rank_zero:GPU available: True (cuda), used: True
INFO:pytorch_lightning.utilities.rank_zero:TPU available: False, using: 0 TPU cores
INFO:pytorch_lightning.utilities.rank_zero:HPU available: False, using: 0 HPUs
INFO:pytorch_lightning.utilities.rank_zero:You are using a CUDA device ('NVIDIA A100-SXM4-40GB') that has Tensor Cores. To properly utilize them, you should set `torch.set_float32_matmul_precision('medium' | 'high')` which will trade-off precision for performance. For more details, read https://pytorch.org/docs/stable/generated/torch.set_float32_matmul_precision.html#torch.set_float32_matmul_precision


[36m(_train_tune pid=13227)[0m 
[36m(_train_tune pid=13227)[0m Validation DataLoader 0: 100%|██████████| 13/13 [00:00<00:00, 69.23it/s][A
[36m(_train_tune pid=13227)[0m                                                                         [AEpoch 84:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.92, train_loss_epoch=-2.16, valid_loss=-1.92]Epoch 84:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.92, train_loss_epoch=-2.15, valid_loss=-1.92]Epoch 84:   0%|          | 0/13 [00:00<?, ?it/s, v_num=0, train_loss_step=-1.92, train_loss_epoch=-2.15, valid_loss=-1.92]


INFO:pytorch_lightning.accelerators.cuda:LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
INFO:pytorch_lightning.callbacks.model_summary:
  | Name         | Type             | Params | Mode 
----------------------------------------------------------
0 | loss         | DistributionLoss | 3      | eval 
1 | padder_train | ConstantPad1d    | 0      | train
2 | scaler       | TemporalNorm     | 0      | train
3 | blocks       | ModuleList       | 2.8 M  | train
----------------------------------------------------------
2.8 M     Trainable params
3         Non-trainable params
2.8 M     Total params
11.288    Total estimated model params size (MB)
33        Modules in train mode
1         Modules in eval mode


Sanity Checking: |          | 0/? [00:00<?, ?it/s]

Training: |          | 0/? [00:00<?, ?it/s]

Validation: |          | 0/? [00:00<?, ?it/s]

Validation: |          | 0/? [00:00<?, ?it/s]

Validation: |          | 0/? [00:00<?, ?it/s]

Validation: |          | 0/? [00:00<?, ?it/s]

Validation: |          | 0/? [00:00<?, ?it/s]

Validation: |          | 0/? [00:00<?, ?it/s]

Validation: |          | 0/? [00:00<?, ?it/s]

Validation: |          | 0/? [00:00<?, ?it/s]

Validation: |          | 0/? [00:00<?, ?it/s]

Validation: |          | 0/? [00:00<?, ?it/s]

Validation: |          | 0/? [00:00<?, ?it/s]

Validation: |          | 0/? [00:00<?, ?it/s]

INFO:pytorch_lightning.utilities.rank_zero:`Trainer.fit` stopped: `max_steps=1200.0` reached.
INFO:pytorch_lightning.utilities.rank_zero:GPU available: True (cuda), used: True
INFO:pytorch_lightning.utilities.rank_zero:TPU available: False, using: 0 TPU cores
INFO:pytorch_lightning.utilities.rank_zero:HPU available: False, using: 0 HPUs
INFO:pytorch_lightning.accelerators.cuda:LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]


Predicting: |          | 0/? [00:00<?, ?it/s]

Horizon 20 CV Minutes: 24.180792804559072
