In [1]:
import wandb
from main import main
import ml_collections as mlc
import logging
import pytorch_lightning as pl
from pytorch_lightning import Trainer
from model import MInterface
from data import DInterface
from train_utils import load_logger, load_callbacks
from config.config import set_default_config
import yaml
import os

# Timestamped, INFO-level logging for everything run from this notebook.
logging.basicConfig(level=logging.INFO, format='%(asctime)s - %(levelname)s - %(message)s')

# Base configuration shared by every sweep trial: project defaults first,
# then the overrides stored in the sweep YAML file.
DEFAULT_CONFIG = mlc.ConfigDict()
set_default_config(DEFAULT_CONFIG)
with open('config/egnn_cfg_sweep.yaml', 'r') as f:
    # safe_load returns None for an empty file; fall back to "no overrides".
    default_arg = yaml.safe_load(f) or {}
DEFAULT_CONFIG.update(default_arg)

# One log directory per (model, dataset) pair.
DEFAULT_CONFIG.log_dir = f'./log/sweep/{DEFAULT_CONFIG.pl_module.model_name}/{DEFAULT_CONFIG.pl_data_module.dataset}'
# exist_ok avoids the check-then-create race and makes the cell safe to re-run.
os.makedirs(DEFAULT_CONFIG.log_dir, exist_ok=True)


In [2]:

def sweep_main():
    """Run a single sweep trial: configure, train and test one model.

    Intended to be passed as the ``function`` argument of ``wandb.agent``.
    Each call:

    1. seeds the RNGs with ``DEFAULT_CONFIG.seed``;
    2. starts a W&B run and overlays the run's (flattened, dotted-key)
       config values on a private copy of ``DEFAULT_CONFIG``;
    3. builds the data module, model, callbacks, logger and ``Trainer``;
    4. optionally calls ``trainer.tune`` when
       ``trainer.auto_scale_batch_size`` is truthy;
    5. calls ``trainer.fit`` followed by ``trainer.test``.

    Returns:
        None. Results are reported through the configured loggers.
    """
    logging.info('seed everything')
    pl.seed_everything(DEFAULT_CONFIG.seed)

    logging.info('Using wandb')
    wandb.init(project=DEFAULT_CONFIG.project, group=DEFAULT_CONFIG.group, save_code=True, dir=DEFAULT_CONFIG.log_dir, reinit=True)

    # Work on a per-trial copy. Aliasing DEFAULT_CONFIG would leak this
    # trial's overrides, callbacks and logger objects into every later trial
    # executed in the same kernel.
    args = DEFAULT_CONFIG.copy_and_resolve_references()
    # Sweep parameters arrive as flattened keys such as 'pl_module.lr'.
    # dict(...) uses the public mapping interface of wandb.config instead of
    # reaching into its private attributes.
    args.update_from_flattened_dict(dict(wandb.config))
    # Record the resolved configuration on the run: model hyper-parameters
    # at the top level, followed by the full nested config.
    wandb.config.update(args.pl_module.model.to_dict())
    wandb.config.update(args.to_dict())

    logging.info('Loading data and model')
    data_module = DInterface(**args.pl_data_module)
    model = MInterface(**args.pl_module)

    logging.info('loading callbacks and logger')
    args.trainer.callbacks = load_callbacks(args)
    args.trainer.logger = load_logger(args)

    logging.info('creating trainer')
    trainer = Trainer(**args.trainer)

    if args.trainer.auto_scale_batch_size:
        logging.info('start auto scale batch size')
        trainer.tune(model, data_module)

    logging.info('start training')
    trainer.fit(model, data_module)

    logging.info('start testing')
    trainer.test(model, data_module)



In [3]:
# Never commit API keys to a notebook: take the key from the WANDB_API_KEY
# environment variable. When it is unset, key=None lets wandb fall back to
# credentials it already has configured.
# NOTE(review): any key that was previously committed in this cell should be
# treated as leaked and rotated.
wandb.login(key=os.environ.get('WANDB_API_KEY'), host='http://localhost:8080')


2023-03-15 14:34:54,805 - ERROR - Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.
[34m[1mwandb[0m: Currently logged in as: [33mhuabei[0m. Use [1m`wandb login --relogin`[0m to force relogin
[34m[1mwandb[0m: Appending key for localhost to your netrc file: /home/huabei/.netrc


True

In [4]:

# Sweep definition. Schema reference:
# https://docs.wandb.ai/guides/sweeps/define-sweep-configuration
sweep_config = dict(
    name='my-sweep',
    method='random',
    # The sweep minimises the metric logged under the name 'val_loss'.
    metric=dict(goal='minimize', name='val_loss'),
    parameters={
        # Dotted keys address nested fields of the training config.
        'pl_module.lr': dict(
            distribution='log_uniform_values',
            min=0.00001,
            max=0.001,
        ),
        # 'pl_module.model.tanh': {
        #     'values': [True, False]
        # }
    },
)

# Register the sweep with the W&B server; the returned id is used by the agent.
sweep_id = wandb.sweep(sweep_config, project=DEFAULT_CONFIG.project)

Create sweep with ID: 08e5ghls
Sweep URL: http://localhost:8080/huabei/egnn-sweep/sweeps/08e5ghls


In [5]:
# %%wandb

# Upper bound on how many trials this agent executes before it stops.
count = 10
# Each trial invokes sweep_main once with parameters chosen by the sweep.
wandb.agent(
    sweep_id,
    function=sweep_main,
    count=count,
)

2023-03-15 14:34:58,601 - INFO - Starting sweep agent: entity=None, project=None, count=10
[34m[1mwandb[0m: Agent Starting Run: vtc4ipuy with config:
[34m[1mwandb[0m: 	pl_module.lr: 2.374365506107818e-06
2023-03-15 14:34:58,745 - INFO - seed everything
Global seed set to 1234
2023-03-15 14:34:58,748 - INFO - Using wandb
2023-03-15 14:34:58,752 - ERROR - Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.
在工作区中该文件仍保持原有的换行符


2023-03-15 14:35:06,281 - INFO - Loading data and model
2023-03-15 14:35:07,917 - INFO - loading callbacks and logger
  rank_zero_warn(
2023-03-15 14:35:07,947 - INFO - creating trainer
GPU available: True (cuda), used: True
TPU available: False, using: 0 TPU cores
IPU available: False, using: 0 IPUs
HPU available: False, using: 0 HPUs
2023-03-15 14:35:08,086 - INFO - start training
You are using a CUDA device ('NVIDIA GeForce RTX 3060') that has Tensor Cores. To properly utilize them, you should set `torch.set_float32_matmul_precision('medium' | 'high')` which will trade-off precision for performance. For more details, read https://pytorch.org/docs/stable/generated/torch.set_float32_matmul_precision.html#torch.set_float32_matmul_precision
LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
`Trainer.fit` stopped: `max_epochs=63` reached.
2023-03-15 15:00:40,895 - INFO - start testing
You are using a CUDA device ('NVIDIA GeForce RTX 3060') that has Tensor Cores. To properly utilize them, you shou

────────────────────────────────────────────────────────────────────────────────────────────────────────────────────────
       Test metric             DataLoader 0
────────────────────────────────────────────────────────────────────────────────────────────────────────────────────────
        test_mae            0.3556353747844696
────────────────────────────────────────────────────────────────────────────────────────────────────────────────────────


VBox(children=(Label(value='8.007 MB of 8.007 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▁▁▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▆▆▆▆▆▆▇▇▇▇▇▇███
global_step,▁▁▁
lr-Adam,███▇▂█▇▄▃▁██▇▆▅▄▃▂▂▁████▇▇▆▆▅▅▄▄▃▃▂▂▂▁▁▁
test_mae,▁
test_r2,▁
train_loss,█▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
train_mae,█▃▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
train_r2,▁
trainer/global_step,▁▁▁▂▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇▇███
val_loss,█▄▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁

0,1
epoch,63.0
global_step,39564.0
lr-Adam,0.0
test_mae,0.35564
test_r2,0.5584
train_loss,0.08919
train_mae,0.35797
train_r2,0.55613
trainer/global_step,39564.0
val_loss,0.09941


[34m[1mwandb[0m: Agent Starting Run: 9epwwl63 with config:
[34m[1mwandb[0m: 	pl_module.lr: 0.0007644679904092894
2023-03-15 15:00:49,441 - INFO - seed everything
Global seed set to 1234
2023-03-15 15:00:49,441 - INFO - Using wandb
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.
在工作区中该文件仍保持原有的换行符


2023-03-15 15:00:56,913 - INFO - Loading data and model
2023-03-15 15:00:58,738 - INFO - loading callbacks and logger

There is a wandb run already in progress and newly created instances of `WandbLogger` will reuse this run. If this is not desired, call `wandb.finish()` before instantiating `WandbLogger`.

2023-03-15 15:00:58,739 - INFO - creating trainer
GPU available: True (cuda), used: True
TPU available: False, using: 0 TPU cores
IPU available: False, using: 0 IPUs
HPU available: False, using: 0 HPUs
2023-03-15 15:00:58,853 - INFO - start training
You are using a CUDA device ('NVIDIA GeForce RTX 3060') that has Tensor Cores. To properly utilize them, you should set `torch.set_float32_matmul_precision('medium' | 'high')` which will trade-off precision for performance. For more details, read https://pytorch.org/docs/stable/generated/torch.set_float32_matmul_precision.html#torch.set_float32_matmul_precision
LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
`Trainer.fit` stopped: `max_epochs=

────────────────────────────────────────────────────────────────────────────────────────────────────────────────────────
       Test metric             DataLoader 0
────────────────────────────────────────────────────────────────────────────────────────────────────────────────────────
        test_mae            0.2204955816268921
────────────────────────────────────────────────────────────────────────────────────────────────────────────────────────


VBox(children=(Label(value='8.011 MB of 8.011 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▁▁▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▆▆▆▆▆▆▇▇▇▇▇▇███
global_step,▁▁▁
lr-Adam,███▇▂█▇▄▃▁██▇▆▅▄▃▂▂▁████▇▇▆▆▅▅▄▄▃▃▂▂▂▁▁▁
test_mae,▁
test_r2,▁
train_loss,█▃▅▄▅▃▃▃▃▃▃▄▂▃▄▃▂▃▃▁▃▂▃▁▃▂▂▃▂▂▂▃▁▄▁▁▂▂▂▂
train_mae,█▄▃▃▃▃▃▂▂▂▃▂▂▂▂▂▂▂▂▂▂▂▂▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁
train_r2,▁
trainer/global_step,▁▁▁▂▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇▇███
val_loss,█▅▄▄▃▃▃▃▂▂▂▂▃▂▂▂▁▂▁▁▂▂▂▂▁▁▃▁▁▁▁▁▁▁▁▁▁▁▁▁

0,1
epoch,63.0
global_step,39564.0
lr-Adam,0.0
test_mae,0.2205
test_r2,0.82564
train_loss,0.02753
train_mae,0.2088
train_r2,0.84409
trainer/global_step,39564.0
val_loss,0.03933


[34m[1mwandb[0m: Agent Starting Run: rus1cpzn with config:
[34m[1mwandb[0m: 	pl_module.lr: 7.66810266062985e-06
2023-03-15 15:27:02,625 - INFO - seed everything
Global seed set to 1234
2023-03-15 15:27:02,626 - INFO - Using wandb
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.
在工作区中该文件仍保持原有的换行符


2023-03-15 15:27:09,955 - INFO - Loading data and model
2023-03-15 15:27:11,760 - INFO - loading callbacks and logger

There is a wandb run already in progress and newly created instances of `WandbLogger` will reuse this run. If this is not desired, call `wandb.finish()` before instantiating `WandbLogger`.

2023-03-15 15:27:11,762 - INFO - creating trainer
GPU available: True (cuda), used: True
TPU available: False, using: 0 TPU cores
IPU available: False, using: 0 IPUs
HPU available: False, using: 0 HPUs
2023-03-15 15:27:11,871 - INFO - start training
You are using a CUDA device ('NVIDIA GeForce RTX 3060') that has Tensor Cores. To properly utilize them, you should set `torch.set_float32_matmul_precision('medium' | 'high')` which will trade-off precision for performance. For more details, read https://pytorch.org/docs/stable/generated/torch.set_float32_matmul_precision.html#torch.set_float32_matmul_precision
LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
`Trainer.fit` stopped: `max_epochs=

────────────────────────────────────────────────────────────────────────────────────────────────────────────────────────
       Test metric             DataLoader 0
────────────────────────────────────────────────────────────────────────────────────────────────────────────────────────
        test_mae            0.3093579113483429
────────────────────────────────────────────────────────────────────────────────────────────────────────────────────────


VBox(children=(Label(value='8.021 MB of 8.021 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▁▁▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▆▆▆▆▆▆▇▇▇▇▇▇███
global_step,▁▁▁
lr-Adam,███▇▂█▇▄▃▁██▇▆▅▄▃▂▂▁████▇▇▆▆▅▅▄▄▃▃▂▂▂▁▁▁
test_mae,▁
test_r2,▁
train_loss,█▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
train_mae,█▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
train_r2,▁
trainer/global_step,▁▁▁▂▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇▇███
val_loss,█▄▃▂▂▂▂▂▂▂▂▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁

0,1
epoch,63.0
global_step,39564.0
lr-Adam,0.0
test_mae,0.30936
test_r2,0.66523
train_loss,0.06249
train_mae,0.31068
train_r2,0.66299
trainer/global_step,39564.0
val_loss,0.07521


[34m[1mwandb[0m: Agent Starting Run: 9t2qs9hr with config:
[34m[1mwandb[0m: 	pl_module.lr: 0.0005113576350965349
2023-03-15 15:52:55,963 - INFO - seed everything
Global seed set to 1234
2023-03-15 15:52:55,963 - INFO - Using wandb
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.
在工作区中该文件仍保持原有的换行符


2023-03-15 15:53:03,025 - INFO - Loading data and model
2023-03-15 15:53:04,837 - INFO - loading callbacks and logger

There is a wandb run already in progress and newly created instances of `WandbLogger` will reuse this run. If this is not desired, call `wandb.finish()` before instantiating `WandbLogger`.

2023-03-15 15:53:04,839 - INFO - creating trainer
GPU available: True (cuda), used: True
TPU available: False, using: 0 TPU cores
IPU available: False, using: 0 IPUs
HPU available: False, using: 0 HPUs
2023-03-15 15:53:04,936 - INFO - start training
You are using a CUDA device ('NVIDIA GeForce RTX 3060') that has Tensor Cores. To properly utilize them, you should set `torch.set_float32_matmul_precision('medium' | 'high')` which will trade-off precision for performance. For more details, read https://pytorch.org/docs/stable/generated/torch.set_float32_matmul_precision.html#torch.set_float32_matmul_precision
LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
`Trainer.fit` stopped: `max_epochs=

────────────────────────────────────────────────────────────────────────────────────────────────────────────────────────
       Test metric             DataLoader 0
────────────────────────────────────────────────────────────────────────────────────────────────────────────────────────
        test_mae            0.22231851518154144
────────────────────────────────────────────────────────────────────────────────────────────────────────────────────────


VBox(children=(Label(value='8.026 MB of 8.026 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▁▁▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▆▆▆▆▆▆▇▇▇▇▇▇███
global_step,▁▁▁
lr-Adam,███▇▂█▇▄▃▁██▇▆▅▄▃▂▂▁████▇▇▆▆▅▅▄▄▃▃▂▂▂▁▁▁
test_mae,▁
test_r2,▁
train_loss,█▃▅▄▅▃▂▃▃▃▃▅▂▂▄▂▂▃▃▁▃▂▃▂▃▂▃▄▂▂▂▃▁▃▁▁▂▂▂▂
train_mae,█▄▃▃▂▃▃▂▂▂▂▂▂▂▂▂▂▂▁▁▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
train_r2,▁
trainer/global_step,▁▁▁▂▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇▇███
val_loss,█▄▄▄▃▃▃▃▂▂▃▂▂▂▂▂▁▂▁▁▂▂▂▂▁▂▂▁▁▂▁▁▁▁▁▁▁▁▁▁

0,1
epoch,63.0
global_step,39564.0
lr-Adam,0.0
test_mae,0.22232
test_r2,0.82277
train_loss,0.02748
train_mae,0.21599
train_r2,0.83341
trainer/global_step,39564.0
val_loss,0.0404


[34m[1mwandb[0m: Agent Starting Run: yutsquqs with config:
[34m[1mwandb[0m: 	pl_module.lr: 1.353741946668555e-05
2023-03-15 16:19:04,958 - INFO - seed everything
Global seed set to 1234
2023-03-15 16:19:04,959 - INFO - Using wandb
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.
在工作区中该文件仍保持原有的换行符


2023-03-15 16:19:12,298 - INFO - Loading data and model
2023-03-15 16:19:14,147 - INFO - loading callbacks and logger

There is a wandb run already in progress and newly created instances of `WandbLogger` will reuse this run. If this is not desired, call `wandb.finish()` before instantiating `WandbLogger`.

2023-03-15 16:19:14,151 - INFO - creating trainer
GPU available: True (cuda), used: True
TPU available: False, using: 0 TPU cores
IPU available: False, using: 0 IPUs
HPU available: False, using: 0 HPUs
2023-03-15 16:19:14,276 - INFO - start training
You are using a CUDA device ('NVIDIA GeForce RTX 3060') that has Tensor Cores. To properly utilize them, you should set `torch.set_float32_matmul_precision('medium' | 'high')` which will trade-off precision for performance. For more details, read https://pytorch.org/docs/stable/generated/torch.set_float32_matmul_precision.html#torch.set_float32_matmul_precision
LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
`Trainer.fit` stopped: `max_epochs=

────────────────────────────────────────────────────────────────────────────────────────────────────────────────────────
       Test metric             DataLoader 0
────────────────────────────────────────────────────────────────────────────────────────────────────────────────────────
        test_mae            0.2883140742778778
────────────────────────────────────────────────────────────────────────────────────────────────────────────────────────


VBox(children=(Label(value='8.035 MB of 8.035 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▁▁▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▆▆▆▆▆▆▇▇▇▇▇▇███
global_step,▁▁▁
lr-Adam,███▇▂█▇▄▃▁██▇▆▅▄▃▂▂▁████▇▇▆▆▅▅▄▄▃▃▂▂▂▁▁▁
test_mae,▁
test_r2,▁
train_loss,█▃▄▃▃▃▂▃▃▃▂▂▂▂▂▂▂▂▂▂▂▃▂▁▂▂▁▂▂▂▂▂▁▂▁▂▁▂▁▁
train_mae,█▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
train_r2,▁
trainer/global_step,▁▁▁▂▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇▇███
val_loss,█▆▄▄▄▃▃▃▃▃▃▃▂▃▂▂▂▂▂▂▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁

0,1
epoch,63.0
global_step,39564.0
lr-Adam,0.0
test_mae,0.28831
test_r2,0.70745
train_loss,0.05418
train_mae,0.28949
train_r2,0.70542
trainer/global_step,39564.0
val_loss,0.06573


[34m[1mwandb[0m: Agent Starting Run: jigahqod with config:
[34m[1mwandb[0m: 	pl_module.lr: 6.3849204104305864e-06
2023-03-15 16:45:13,845 - INFO - seed everything
Global seed set to 1234
2023-03-15 16:45:13,847 - INFO - Using wandb
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.
在工作区中该文件仍保持原有的换行符


2023-03-15 16:45:21,275 - INFO - Loading data and model
2023-03-15 16:45:23,249 - INFO - loading callbacks and logger

There is a wandb run already in progress and newly created instances of `WandbLogger` will reuse this run. If this is not desired, call `wandb.finish()` before instantiating `WandbLogger`.

2023-03-15 16:45:23,253 - INFO - creating trainer
GPU available: True (cuda), used: True
TPU available: False, using: 0 TPU cores
IPU available: False, using: 0 IPUs
HPU available: False, using: 0 HPUs
2023-03-15 16:45:23,371 - INFO - start training
You are using a CUDA device ('NVIDIA GeForce RTX 3060') that has Tensor Cores. To properly utilize them, you should set `torch.set_float32_matmul_precision('medium' | 'high')` which will trade-off precision for performance. For more details, read https://pytorch.org/docs/stable/generated/torch.set_float32_matmul_precision.html#torch.set_float32_matmul_precision
LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
`Trainer.fit` stopped: `max_epochs=

────────────────────────────────────────────────────────────────────────────────────────────────────────────────────────
       Test metric             DataLoader 0
────────────────────────────────────────────────────────────────────────────────────────────────────────────────────────
        test_mae            0.3174159526824951
────────────────────────────────────────────────────────────────────────────────────────────────────────────────────────


VBox(children=(Label(value='8.044 MB of 8.044 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▁▁▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▆▆▆▆▆▆▇▇▇▇▇▇███
global_step,▁▁▁
lr-Adam,███▇▂█▇▄▃▁██▇▆▅▄▃▂▂▁████▇▇▆▆▅▅▄▄▃▃▂▂▂▁▁▁
test_mae,▁
test_r2,▁
train_loss,█▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
train_mae,█▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
train_r2,▁
trainer/global_step,▁▁▁▂▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇▇███
val_loss,█▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁

0,1
epoch,63.0
global_step,39564.0
lr-Adam,0.0
test_mae,0.31742
test_r2,0.64788
train_loss,0.06688
train_mae,0.31879
train_r2,0.64571
trainer/global_step,39564.0
val_loss,0.07921


[34m[1mwandb[0m: Agent Starting Run: fmgpr9ez with config:
[34m[1mwandb[0m: 	pl_module.lr: 2.554529586164634e-05
2023-03-15 17:11:22,695 - INFO - seed everything
Global seed set to 1234
2023-03-15 17:11:22,696 - INFO - Using wandb
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.
在工作区中该文件仍保持原有的换行符


2023-03-15 17:11:29,985 - INFO - Loading data and model
2023-03-15 17:11:31,864 - INFO - loading callbacks and logger

There is a wandb run already in progress and newly created instances of `WandbLogger` will reuse this run. If this is not desired, call `wandb.finish()` before instantiating `WandbLogger`.

2023-03-15 17:11:31,866 - INFO - creating trainer
GPU available: True (cuda), used: True
TPU available: False, using: 0 TPU cores
IPU available: False, using: 0 IPUs
HPU available: False, using: 0 HPUs
2023-03-15 17:11:31,987 - INFO - start training
You are using a CUDA device ('NVIDIA GeForce RTX 3060') that has Tensor Cores. To properly utilize them, you should set `torch.set_float32_matmul_precision('medium' | 'high')` which will trade-off precision for performance. For more details, read https://pytorch.org/docs/stable/generated/torch.set_float32_matmul_precision.html#torch.set_float32_matmul_precision
LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
`Trainer.fit` stopped: `max_epochs=

────────────────────────────────────────────────────────────────────────────────────────────────────────────────────────
       Test metric             DataLoader 0
────────────────────────────────────────────────────────────────────────────────────────────────────────────────────────
        test_mae            0.26845356822013855
────────────────────────────────────────────────────────────────────────────────────────────────────────────────────────


VBox(children=(Label(value='8.053 MB of 8.053 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▁▁▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▆▆▆▆▆▆▇▇▇▇▇▇███
global_step,▁▁▁
lr-Adam,███▇▂█▇▄▃▁██▇▆▅▄▃▂▂▁████▇▇▆▆▅▅▄▄▃▃▂▂▂▁▁▁
test_mae,▁
test_r2,▁
train_loss,█▅▆▅▅▄▃▅▄▄▃▄▃▃▄▃▂▄▂▃▃▃▃▃▃▂▂▃▂▂▂▂▁▃▂▂▂▂▂▂
train_mae,█▂▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
train_r2,▁
trainer/global_step,▁▁▁▂▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇▇███
val_loss,█▆▅▅▄▄▄▃▃▃▃▃▂▂▂▂▂▂▂▂▂▂▂▂▁▂▁▂▁▂▂▁▁▁▁▁▁▁▁▁

0,1
epoch,63.0
global_step,39564.0
lr-Adam,0.0
test_mae,0.26845
test_r2,0.7448
train_loss,0.04669
train_mae,0.26876
train_r2,0.74436
trainer/global_step,39564.0
val_loss,0.05751


[34m[1mwandb[0m: Agent Starting Run: piphqxba with config:
[34m[1mwandb[0m: 	pl_module.lr: 1.1093810130544112e-06
2023-03-15 17:37:07,833 - INFO - seed everything
Global seed set to 1234
2023-03-15 17:37:07,833 - INFO - Using wandb
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.
在工作区中该文件仍保持原有的换行符


2023-03-15 17:37:15,192 - INFO - Loading data and model
2023-03-15 17:37:16,993 - INFO - loading callbacks and logger

There is a wandb run already in progress and newly created instances of `WandbLogger` will reuse this run. If this is not desired, call `wandb.finish()` before instantiating `WandbLogger`.

2023-03-15 17:37:16,995 - INFO - creating trainer
GPU available: True (cuda), used: True
TPU available: False, using: 0 TPU cores
IPU available: False, using: 0 IPUs
HPU available: False, using: 0 HPUs
2023-03-15 17:37:17,109 - INFO - start training
You are using a CUDA device ('NVIDIA GeForce RTX 3060') that has Tensor Cores. To properly utilize them, you should set `torch.set_float32_matmul_precision('medium' | 'high')` which will trade-off precision for performance. For more details, read https://pytorch.org/docs/stable/generated/torch.set_float32_matmul_precision.html#torch.set_float32_matmul_precision
LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
`Trainer.fit` stopped: `max_epochs=

────────────────────────────────────────────────────────────────────────────────────────────────────────────────────────
       Test metric             DataLoader 0
────────────────────────────────────────────────────────────────────────────────────────────────────────────────────────
        test_mae            0.3763151466846466
────────────────────────────────────────────────────────────────────────────────────────────────────────────────────────


VBox(children=(Label(value='8.061 MB of 8.061 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▁▁▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▆▆▆▆▆▆▇▇▇▇▇▇███
global_step,▁▁▁
lr-Adam,███▇▂█▇▄▃▁██▇▆▅▄▃▂▂▁████▇▇▆▆▅▅▄▄▃▃▂▂▂▁▁▁
test_mae,▁
test_r2,▁
train_loss,█▅▃▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
train_mae,█▆▃▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
train_r2,▁
trainer/global_step,▁▁▁▂▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇▇███
val_loss,█▅▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁

0,1
epoch,63.0
global_step,39564.0
lr-Adam,0.0
test_mae,0.37632
test_r2,0.50773
train_loss,0.09971
train_mae,0.37856
train_r2,0.50429
trainer/global_step,39564.0
val_loss,0.11023


[34m[1mwandb[0m: Agent Starting Run: kxblayag with config:
[34m[1mwandb[0m: 	pl_module.lr: 1.5610944677887784e-06
2023-03-15 18:02:56,068 - INFO - seed everything
Global seed set to 1234
2023-03-15 18:02:56,069 - INFO - Using wandb
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.
在工作区中该文件仍保持原有的换行符


2023-03-15 18:03:03,552 - INFO - Loading data and model
2023-03-15 18:03:05,432 - INFO - loading callbacks and logger

There is a wandb run already in progress and newly created instances of `WandbLogger` will reuse this run. If this is not desired, call `wandb.finish()` before instantiating `WandbLogger`.

2023-03-15 18:03:05,435 - INFO - creating trainer
GPU available: True (cuda), used: True
TPU available: False, using: 0 TPU cores
IPU available: False, using: 0 IPUs
HPU available: False, using: 0 HPUs
2023-03-15 18:03:05,565 - INFO - start training
You are using a CUDA device ('NVIDIA GeForce RTX 3060') that has Tensor Cores. To properly utilize them, you should set `torch.set_float32_matmul_precision('medium' | 'high')` which will trade-off precision for performance. For more details, read https://pytorch.org/docs/stable/generated/torch.set_float32_matmul_precision.html#torch.set_float32_matmul_precision
LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
`Trainer.fit` stopped: `max_epochs=

────────────────────────────────────────────────────────────────────────────────────────────────────────────────────────
       Test metric             DataLoader 0
────────────────────────────────────────────────────────────────────────────────────────────────────────────────────────
        test_mae            0.36788666248321533
────────────────────────────────────────────────────────────────────────────────────────────────────────────────────────


VBox(children=(Label(value='8.066 MB of 8.066 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▁▁▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▆▆▆▆▆▆▇▇▇▇▇▇███
global_step,▁▁▁
lr-Adam,███▇▂█▇▄▃▁██▇▆▅▄▃▂▂▁████▇▇▆▆▅▅▄▄▃▃▂▂▂▁▁▁
test_mae,▁
test_r2,▁
train_loss,█▃▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
train_mae,█▄▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
train_r2,▁
trainer/global_step,▁▁▁▂▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇▇███
val_loss,█▃▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁

0,1
epoch,63.0
global_step,39564.0
lr-Adam,0.0
test_mae,0.36789
test_r2,0.52842
train_loss,0.09517
train_mae,0.3703
train_r2,0.52548
trainer/global_step,39564.0
val_loss,0.1058


[34m[1mwandb[0m: Agent Starting Run: s6c7bizi with config:
[34m[1mwandb[0m: 	pl_module.lr: 0.00024657458195004
2023-03-15 18:28:49,144 - INFO - seed everything
Global seed set to 1234
2023-03-15 18:28:49,145 - INFO - Using wandb
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.
在工作区中该文件仍保持原有的换行符


2023-03-15 18:28:56,467 - INFO - Loading data and model
2023-03-15 18:28:58,262 - INFO - loading callbacks and logger

There is a wandb run already in progress and newly created instances of `WandbLogger` will reuse this run. If this is not desired, call `wandb.finish()` before instantiating `WandbLogger`.

2023-03-15 18:28:58,264 - INFO - creating trainer
GPU available: True (cuda), used: True
TPU available: False, using: 0 TPU cores
IPU available: False, using: 0 IPUs
HPU available: False, using: 0 HPUs
2023-03-15 18:28:58,369 - INFO - start training
You are using a CUDA device ('NVIDIA GeForce RTX 3060') that has Tensor Cores. To properly utilize them, you should set `torch.set_float32_matmul_precision('medium' | 'high')` which will trade-off precision for performance. For more details, read https://pytorch.org/docs/stable/generated/torch.set_float32_matmul_precision.html#torch.set_float32_matmul_precision
LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
`Trainer.fit` stopped: `max_epochs=

────────────────────────────────────────────────────────────────────────────────────────────────────────────────────────
       Test metric             DataLoader 0
────────────────────────────────────────────────────────────────────────────────────────────────────────────────────────
        test_mae            0.22933407127857208
────────────────────────────────────────────────────────────────────────────────────────────────────────────────────────


VBox(children=(Label(value='8.073 MB of 8.073 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▁▁▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▆▆▆▆▆▆▇▇▇▇▇▇███
global_step,▁▁▁
lr-Adam,███▇▂█▇▄▃▁██▇▆▅▄▃▂▂▁████▇▇▆▆▅▅▄▄▃▃▂▂▂▁▁▁
test_mae,▁
test_r2,▁
train_loss,█▄▄▅▆▄▃▄▃▃▄▅▃▃▅▃▂▃▃▂▄▃▃▁▄▃▃▄▂▃▂▃▁▃▂▁▂▂▂▂
train_mae,█▄▃▃▂▂▂▂▂▂▂▂▂▂▂▂▂▁▁▁▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
train_r2,▁
trainer/global_step,▁▁▁▂▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇▇███
val_loss,█▅▄▃▃▃▃▃▂▂▂▂▃▂▂▂▂▂▂▂▂▂▂▂▁▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁

0,1
epoch,63.0
global_step,39564.0
lr-Adam,0.0
test_mae,0.22933
test_r2,0.81307
train_loss,0.03222
train_mae,0.22735
train_r2,0.81582
trainer/global_step,39564.0
val_loss,0.04228
