# Value gradient error for linear policies in LQG

Experiment description on [Overleaf](https://www.overleaf.com/read/cmbgmxxpxqzr).

**Versioning:** [CalVer](https://calver.org) `MM.DD.MICRO`

In [1]:
from __future__ import annotations

import logging
import os
import os.path as osp

import lqsvg
import lqsvg.envs.lqr.utils as lqg_util
import lqsvg.experiment.utils as utils
import lqsvg.torch.named as nt
import pytorch_lightning as pl
import ray
from lqsvg.experiment.data import build_datamodule
from lqsvg.experiment.models import LightningModel
from lqsvg.experiment.worker import make_worker
from ray import tune
from raylab.policy.model_based.lightning import LightningTrainerSpec
from torch import Tensor

import wandb

In [2]:
# Working directory of the process that evaluates this cell. `Experiment.setup`
# joins it into the `dir` argument of `wandb.init`, i.e. the base directory for
# the W&B run files.
CWD = os.getcwd()

In [3]:
class InputStatistics(pl.callbacks.Callback):
    """Callback that logs the mean and std of every training batch's tensors."""

    def on_train_batch_end(
        self,
        trainer: pl.Trainer,
        pl_module: pl.LightningModule,
        outputs: Tensor,
        batch: tuple[Tensor, Tensor, Tensor],
        batch_idx: int,
        dataloader_idx: int,
    ):
        """Log summary statistics of the batch that was just processed.

        The batch is unpacked as ``(obs, act, new_obs)``; the mean and standard
        deviation of each tensor are sent to ``pl_module.log`` under
        ``train/<name>-mean`` and ``train/<name>-std``.
        """
        # Only `pl_module` and `batch` are needed; drop the other hook arguments.
        del trainer, outputs, batch_idx, dataloader_idx
        obs, act, new_obs = batch

        # (metric key, reduction) pairs, evaluated and logged in this order.
        statistics = (
            ("train/obs-mean", obs.mean),
            ("train/obs-std", obs.std),
            ("train/act-mean", act.mean),
            ("train/act-std", act.std),
            ("train/new_obs-mean", new_obs.mean),
            ("train/new_obs-std", new_obs.std),
        )
        for key, reduce in statistics:
            pl_module.log(key, reduce())

In [4]:
class Experiment(tune.Trainable):
    """Tune trainable that fits a ``LightningModel`` and reports its test metrics.

    Each trial opens its own W&B run, builds a worker, model, datamodule and
    Lightning trainer from the trial config, and performs the whole
    fit-and-test procedure in a single ``step`` call.
    """

    def setup(self, config: dict):
        """Start the W&B run and build every component used by ``step``.

        Args:
            config: Trial configuration; it is stored in the W&B run and read
                back through ``self.hparams``.
        """
        self.run = wandb.init(
            dir=osp.join(CWD, ""),
            name="SVG Prediction",
            config=config,
            project="LQG-SVG",
            entity="angelovtt",
            tags=[utils.calver()],
            reinit=True,
            mode="online",
            save_code=True,
        )

        self.make_worker()
        self.make_model()
        self.make_datamodule()
        # Silence Lightning's info-level logging *before* the Trainer is
        # constructed. When this call came last in `setup`, the Trainer's
        # startup messages ("GPU available: ...", "TPU available: ...") were
        # still printed by every trial process.
        utils.suppress_lightning_info_logging()
        self.make_lightning_trainer()
        self.make_artifact()

    @property
    def hparams(self):
        """Hyperparameters of this trial, as stored in the W&B run config."""
        return self.run.config

    def make_worker(self):
        """Create ``self.worker`` from the environment and policy configs."""
        with nt.suppress_named_tensor_warning():
            self.worker = make_worker(
                env_config=self.hparams.env_config,
                policy_config=self.hparams.policy,
                log_level=logging.WARNING,
            )

    def make_model(self):
        """Create ``self.model`` from the worker's policy and environment.

        The optimization hyperparameters of the trial are copied onto the
        model's own ``hparams``.
        """
        self.model = LightningModel(self.worker.get_policy(), self.worker.env)
        self.model.hparams.learning_rate = self.hparams.learning_rate
        self.model.hparams.mc_samples = self.hparams.mc_samples
        self.model.hparams.weight_decay = self.hparams.weight_decay

    def make_datamodule(self):
        """Create ``self.datamodule`` and collect its trajectories up front."""
        self.datamodule = build_datamodule(
            self.worker, total_trajs=self.hparams.total_trajs
        )
        # NOTE(review): `prog=False` presumably disables a progress bar -- confirm.
        self.datamodule.collect_trajectories(prog=False)

    def make_lightning_trainer(self):
        """Create ``self.trainer`` with W&B logging, early stopping and checkpoints."""
        # Reuse the trial's W&B run instead of letting the logger open a new one.
        logger = pl.loggers.WandbLogger(
            save_dir=self.run.dir, log_model=False, experiment=self.run
        )

        # Early stopping and checkpointing monitor the same metric.
        early_stopping = pl.callbacks.EarlyStopping(
            monitor=LightningModel.early_stop_on,
            min_delta=float(self.hparams.improvement_delta),
            patience=int(self.hparams.patience),
            mode="min",
            strict=True,
        )
        # Checkpoints go under the run directory; `step` later uploads this
        # directory as a W&B artifact.
        checkpointing = pl.callbacks.ModelCheckpoint(
            dirpath=osp.join(self.run.dir, "checkpoints"),
            monitor=LightningModel.early_stop_on,
            save_top_k=-1,
            period=10,
            save_last=True,
        )
        self.trainer = pl.Trainer(
            default_root_dir=self.run.dir,
            logger=logger,
            num_sanity_val_steps=2,
            callbacks=[early_stopping, checkpointing, InputStatistics()],
            max_epochs=self.hparams.max_epochs,
            progress_bar_refresh_rate=0,  # don't show progress bar for model training
            weights_summary=None,  # don't print summary before training
        )

    def make_artifact(self):
        """Create the W&B model artifact, named after the environment's sizes."""
        env = self.worker.env
        self.artifact = wandb.Artifact(
            f"svg_prediction-lqg{env.n_state}.{env.n_ctrl}.{env.horizon}", type="model"
        )

    def step(self) -> dict:
        """Fit the model, evaluate it on the test set and upload the checkpoints.

        Returns:
            The test metrics of the first test dataloader, plus Tune's "done"
            flag set to ``True`` so that the trial ends after this single step.
        """
        self.log_env_info()
        with utils.suppress_dataloader_warning():
            self.trainer.fit(self.model, datamodule=self.datamodule)

            # `Trainer.test` returns one metrics dict per test dataloader.
            results = self.trainer.test(self.model, datamodule=self.datamodule)[0]
            self.run.summary.update(results)

        self.artifact.add_dir(self.trainer.checkpoint_callback.dirpath)
        self.run.log_artifact(self.artifact)
        return {tune.result.DONE: True, **results}

    def log_env_info(self):
        """Record stability, controllability and eigenvalues in the run summary."""
        dynamics = self.worker.env.dynamics
        eigvals = lqg_util.stationary_eigvals(dynamics)
        tests = {
            "stability": lqg_util.isstable(eigvals=eigvals),
            "controllability": lqg_util.iscontrollable(dynamics),
        }
        self.run.summary.update(tests)
        self.run.summary.update({"Fs_eigvals": wandb.Histogram(eigvals)})

    def cleanup(self):
        """Finish the W&B run when the trial is torn down."""
        self.run.finish()

In [5]:
# Driver-side setup: start Ray with warnings only, run lqsvg's registration
# hook and silence Lightning's info-level logging in this process.
ray.init(logging_level=logging.WARNING)
lqsvg.register_all()
utils.suppress_lightning_info_logging()

# Trial configuration; every trial receives a resolved copy in `Experiment.setup`.
config = {
    # Settings forwarded to `make_worker` as `env_config`.
    "env_config": {
        "n_state": 2,
        "n_ctrl": 2,
        "horizon": 20,
        "stationary": True,
        "Fs_eigval_range": (0.0, 1.0),
        "transition_bias": False,
        "num_envs": 100,
    },
    # Settings forwarded to `make_worker` as `policy_config`.
    "policy": {
        "module": {
            "policy_initializer": "xavier_uniform",
            "model_initializer": "xavier_uniform",
            "stationary_model": True,
            # The only swept hyperparameter: with and without input normalization.
            "model_input_norm": tune.grid_search([True, False]),
        }
    },
    # Optimization hyperparameters copied onto the model.
    "learning_rate": 1e-3,
    "weight_decay": 1e-4,
    "mc_samples": 32,
    # Size of the collected dataset.
    "total_trajs": 1000,
    # Early-stopping and training-length settings for the Lightning trainer.
    "improvement_delta": 0.0,
    "patience": 3,
    "max_epochs": 1000,
}

# `num_samples=8` repeats the two-point grid eight times (16 trials in total).
analysis = tune.run(
    Experiment,
    config=config,
    num_samples=8,
    local_dir="./results",
)

Trial name,status,loc,policy/module/model_input_norm
Experiment_a089f_00000,RUNNING,,True


[2m[36m(pid=14001)[0m wandb: Currently logged in as: angelovtt (use `wandb login --relogin` to force relogin)
[2m[36m(pid=14002)[0m wandb: Currently logged in as: angelovtt (use `wandb login --relogin` to force relogin)
[2m[36m(pid=14004)[0m wandb: Currently logged in as: angelovtt (use `wandb login --relogin` to force relogin)
[2m[36m(pid=14003)[0m wandb: Currently logged in as: angelovtt (use `wandb login --relogin` to force relogin)
[2m[36m(pid=14004)[0m wandb: ERROR Error while calling W&B API: Error 1213: Deadlock found when trying to get lock; try restarting transaction (<Response [500]>)
[2m[36m(pid=14001)[0m wandb: Tracking run with wandb version 0.10.23
[2m[36m(pid=14001)[0m wandb: Syncing run SVG Prediction
[2m[36m(pid=14001)[0m wandb: ⭐️ View project at https://wandb.ai/angelovtt/LQG-SVG
[2m[36m(pid=14001)[0m wandb: 🚀 View run at https://wandb.ai/angelovtt/LQG-SVG/runs/9vib5hut
[2m[36m(pid=14001)[0m wandb: Run data is saved locally in /Users/ang

[2m[36m(pid=14001)[0m 
[2m[36m(pid=14003)[0m 
[2m[36m(pid=14002)[0m 


[2m[36m(pid=14004)[0m wandb: Tracking run with wandb version 0.10.23
[2m[36m(pid=14004)[0m wandb: Syncing run SVG Prediction
[2m[36m(pid=14004)[0m wandb: ⭐️ View project at https://wandb.ai/angelovtt/LQG-SVG
[2m[36m(pid=14004)[0m wandb: 🚀 View run at https://wandb.ai/angelovtt/LQG-SVG/runs/3dfzmi0p
[2m[36m(pid=14004)[0m wandb: Run data is saved locally in /Users/angelolovatto/Repositories/personal/LQG-SVG/experiments/wandb/run-20210325_163106-3dfzmi0p
[2m[36m(pid=14004)[0m wandb: Run `wandb offline` to turn off syncing.


[2m[36m(pid=14004)[0m 


[2m[36m(pid=14001)[0m GPU available: False, used: False
[2m[36m(pid=14001)[0m TPU available: None, using: 0 TPU cores
[2m[36m(pid=14001)[0m 2021-03-25 16:31:15,781	INFO trainable.py:100 -- Trainable.setup took 10.691 seconds. If your trainable is slow to initialize, consider setting reuse_actors=True to reduce actor creation overheads.
[2m[36m(pid=14003)[0m GPU available: False, used: False
[2m[36m(pid=14003)[0m TPU available: None, using: 0 TPU cores
[2m[36m(pid=14003)[0m 2021-03-25 16:31:15,813	INFO trainable.py:100 -- Trainable.setup took 10.722 seconds. If your trainable is slow to initialize, consider setting reuse_actors=True to reduce actor creation overheads.
[2m[36m(pid=14002)[0m GPU available: False, used: False
[2m[36m(pid=14002)[0m TPU available: None, using: 0 TPU cores
[2m[36m(pid=14002)[0m 2021-03-25 16:31:15,853	INFO trainable.py:100 -- Trainable.setup took 10.763 seconds. If your trainable is slow to initialize, consider setting reuse_actors=

[2m[36m(pid=14004)[0m --------------------------------------------------------------------------------
[2m[36m(pid=14004)[0m DATALOADER:0 TEST RESULTS
[2m[36m(pid=14004)[0m {'test/analytic_cossim': tensor(0.5690),
[2m[36m(pid=14004)[0m  'test/analytic_diff': tensor(0.0013),
[2m[36m(pid=14004)[0m  'test/analytic_svg_norm': tensor(84.8707),
[2m[36m(pid=14004)[0m  'test/analytic_value': tensor(-134.0732),
[2m[36m(pid=14004)[0m  'test/loss': tensor(58.3978),
[2m[36m(pid=14004)[0m  'test/monte_carlo_cossim': tensor(0.4906),
[2m[36m(pid=14004)[0m  'test/monte_carlo_diff': tensor(14.5812),
[2m[36m(pid=14004)[0m  'test/monte_carlo_svg_norm': tensor(64.8805),
[2m[36m(pid=14004)[0m  'test/monte_carlo_value': tensor(-119.4933),
[2m[36m(pid=14004)[0m  'true_svg_norm': tensor(124.1702),
[2m[36m(pid=14004)[0m  'true_value': tensor(-134.0745)}
[2m[36m(pid=14004)[0m --------------------------------------------------------------------------------


[2m[36m(pid=14004)[0m wandb: Adding directory to artifact (/Users/angelolovatto/Repositories/personal/LQG-SVG/experiments/wandb/run-20210325_163106-3dfzmi0p/files/checkpoints)... 
[2m[36m(pid=14004)[0m Done. 0.0s


Result for Experiment_a089f_00002:
  date: 2021-03-25_16-32-53
  done: true
  experiment_id: abe16ab775be444e8ae99f23af739996
  hostname: Angelos-MBP
  iterations_since_restore: 1
  node_ip: 192.168.15.11
  pid: 14004
  test/analytic_cossim: 0.56901615858078
  test/analytic_diff: 0.001312255859375
  test/analytic_svg_norm: 84.87065887451172
  test/analytic_value: -134.0731964111328
  test/loss: 58.39779281616211
  test/monte_carlo_cossim: 0.49063989520072937
  test/monte_carlo_diff: 14.5811767578125
  test/monte_carlo_svg_norm: 64.8805160522461
  test/monte_carlo_value: -119.49333190917969
  time_since_restore: 96.49288702011108
  time_this_iter_s: 96.49288702011108
  time_total_s: 96.49288702011108
  timestamp: 1616700773
  timesteps_since_restore: 0
  training_iteration: 1
  trial_id: a089f_00002
  true_svg_norm: 124.17015075683594
  true_value: -134.0745086669922
  


Trial name,status,loc,policy/module/model_input_norm,iter,total time (s),test/loss,true_value,true_svg_norm
Experiment_a089f_00000,RUNNING,,True,,,,,
Experiment_a089f_00001,RUNNING,,False,,,,,
Experiment_a089f_00003,RUNNING,,False,,,,,
Experiment_a089f_00004,PENDING,,True,,,,,
Experiment_a089f_00002,TERMINATED,,True,1.0,96.4929,,-134.075,124.17


[2m[36m(pid=14004)[0m wandb: Waiting for W&B process to finish, PID 14043
[2m[36m(pid=14004)[0m wandb: Program ended successfully.
[2m[36m(pid=14004)[0m wandb: - 8.42MB of 8.42MB uploaded (0.00MB deduped)
[2m[36m(pid=14004)[0m wandb: \ 9.14MB of 9.14MB uploaded (0.00MB deduped)
wandb:                                                                                


[2m[36m(pid=14003)[0m --------------------------------------------------------------------------------
[2m[36m(pid=14003)[0m DATALOADER:0 TEST RESULTS
[2m[36m(pid=14003)[0m {'test/analytic_cossim': tensor(0.6906),
[2m[36m(pid=14003)[0m  'test/analytic_diff': tensor(-4.6016),
[2m[36m(pid=14003)[0m  'test/analytic_svg_norm': tensor(1194.6957),
[2m[36m(pid=14003)[0m  'test/analytic_value': tensor(-599.3182),
[2m[36m(pid=14003)[0m  'test/loss': 
[2m[36m(pid=14003)[0m tensor(64.4763),
[2m[36m(pid=14003)[0m  'test/monte_carlo_cossim': tensor(0.6746),
[2m[36m(pid=14003)[0m  'test/monte_carlo_diff': tensor(-34.9645),
[2m[36m(pid=14003)[0m  'test/monte_carlo_svg_norm': tensor(1276.4805),
[2m[36m(pid=14003)[0m  'test/monte_carlo_value': tensor(-629.6812),
[2m[36m(pid=14003)[0m  'true_svg_norm': tensor(1737.4231),
[2m[36m(pid=14003)[0m  'true_value': tensor(-594.7166)}
[2m[36m(pid=14003)[0m --------------------------------------------------------------

[2m[36m(pid=14003)[0m wandb: Adding directory to artifact (/Users/angelolovatto/Repositories/personal/LQG-SVG/experiments/wandb/run-20210325_163106-3kzuvf0p/files/checkpoints)... 
[2m[36m(pid=14003)[0m Done. 0.1s


Result for Experiment_a089f_00000:
  date: 2021-03-25_16-33-01
  done: true
  experiment_id: b6b11679cc4841048b38344124b922c9
  hostname: Angelos-MBP
  iterations_since_restore: 1
  node_ip: 192.168.15.11
  pid: 14003
  test/analytic_cossim: 0.6906058192253113
  test/analytic_diff: -4.60162353515625
  test/analytic_svg_norm: 1194.6956787109375
  test/analytic_value: -599.3182373046875
  test/loss: 64.47628784179688
  test/monte_carlo_cossim: 0.6746143698692322
  test/monte_carlo_diff: -34.96453857421875
  test/monte_carlo_svg_norm: 1276.48046875
  test/monte_carlo_value: -629.68115234375
  time_since_restore: 105.79777097702026
  time_this_iter_s: 105.79777097702026
  time_total_s: 105.79777097702026
  timestamp: 1616700781
  timesteps_since_restore: 0
  training_iteration: 1
  trial_id: a089f_00000
  true_svg_norm: 1737.423095703125
  true_value: -594.7166137695312
  


Trial name,status,loc,policy/module/model_input_norm,iter,total time (s),test/loss,true_value,true_svg_norm
Experiment_a089f_00001,RUNNING,,False,,,,,
Experiment_a089f_00003,RUNNING,,False,,,,,
Experiment_a089f_00004,RUNNING,,True,,,,,
Experiment_a089f_00005,PENDING,,False,,,,,
Experiment_a089f_00000,TERMINATED,,True,1.0,105.798,,-594.717,1737.42
Experiment_a089f_00002,TERMINATED,,True,1.0,96.4929,,-134.075,124.17


[2m[36m(pid=14004)[0m 


[2m[36m(pid=14003)[0m wandb: Waiting for W&B process to finish, PID 14046
[2m[36m(pid=14003)[0m wandb: Program ended successfully.
[2m[36m(pid=14004)[0m wandb: Find user logs for this run at: /Users/angelolovatto/Repositories/personal/LQG-SVG/experiments/wandb/run-20210325_163106-3dfzmi0p/logs/debug.log
[2m[36m(pid=14004)[0m wandb: Find internal logs for this run at: /Users/angelolovatto/Repositories/personal/LQG-SVG/experiments/wandb/run-20210325_163106-3dfzmi0p/logs/debug-internal.log
[2m[36m(pid=14004)[0m wandb: Run summary:
[2m[36m(pid=14004)[0m wandb:                   stability True
[2m[36m(pid=14004)[0m wandb:             controllability True
[2m[36m(pid=14004)[0m wandb:                    val/loss 58.79763
[2m[36m(pid=14004)[0m wandb:       val/monte_carlo_value -110.50595
[2m[36m(pid=14004)[0m wandb:    val/monte_carlo_svg_norm 55.04731
[2m[36m(pid=14004)[0m wandb:        val/monte_carlo_diff 23.56856
[2m[36m(pid=14004)[0m wandb:      val/mo

[2m[36m(pid=14003)[0m 


[2m[36m(pid=14153)[0m wandb: Currently logged in as: angelovtt (use `wandb login --relogin` to force relogin)
[2m[36m(pid=14001)[0m wandb: Adding directory to artifact (/Users/angelolovatto/Repositories/personal/LQG-SVG/experiments/wandb/run-20210325_163106-9vib5hut/files/checkpoints)... 
[2m[36m(pid=14001)[0m Done. 0.0s


[2m[36m(pid=14001)[0m --------------------------------------------------------------------------------
[2m[36m(pid=14001)[0m DATALOADER:0 TEST RESULTS
[2m[36m(pid=14001)[0m {'test/analytic_cossim': tensor(0.6221),
[2m[36m(pid=14001)[0m  'test/analytic_diff': tensor(0.9856),
[2m[36m(pid=14001)[0m  'test/analytic_svg_norm': tensor(61.6784),
[2m[36m(pid=14001)[0m  'test/analytic_value': tensor(-89.8831),
[2m[36m(pid=14001)[0m  'test/loss': tensor(59.1285),
[2m[36m(pid=14001)[0m  'test/monte_carlo_cossim': tensor(0.5871),
[2m[36m(pid=14001)[0m  'test/monte_carlo_diff': tensor(5.2317),
[2m[36m(pid=14001)[0m  'test/monte_carlo_svg_norm': tensor(55.8809),
[2m[36m(pid=14001)[0m  'test/monte_carlo_value': tensor(-85.6370),
[2m[36m(pid=14001)[0m  'true_svg_norm': tensor(74.5132),
[2m[36m(pid=14001)[0m  'true_value': tensor(-90.8687)}
[2m[36m(pid=14001)[0m --------------------------------------------------------------------------------
Result for Experime

Trial name,status,loc,policy/module/model_input_norm,iter,total time (s),test/loss,true_value,true_svg_norm
Experiment_a089f_00001,RUNNING,,False,,,,,
Experiment_a089f_00004,RUNNING,,True,,,,,
Experiment_a089f_00005,RUNNING,,False,,,,,
Experiment_a089f_00006,PENDING,,True,,,,,
Experiment_a089f_00000,TERMINATED,,True,1.0,105.798,,-594.717,1737.42
Experiment_a089f_00002,TERMINATED,,True,1.0,96.4929,,-134.075,124.17
Experiment_a089f_00003,TERMINATED,,False,1.0,118.327,,-90.8687,74.5132


[2m[36m(pid=14153)[0m 


[2m[36m(pid=14001)[0m wandb: Waiting for W&B process to finish, PID 14045
[2m[36m(pid=14001)[0m wandb: Program ended successfully.
[2m[36m(pid=14153)[0m wandb: Tracking run with wandb version 0.10.23
[2m[36m(pid=14153)[0m wandb: Syncing run SVG Prediction
[2m[36m(pid=14153)[0m wandb: ⭐️ View project at https://wandb.ai/angelovtt/LQG-SVG
[2m[36m(pid=14153)[0m wandb: 🚀 View run at https://wandb.ai/angelovtt/LQG-SVG/runs/2umibr2x
[2m[36m(pid=14153)[0m wandb: Run data is saved locally in /Users/angelolovatto/Repositories/personal/LQG-SVG/experiments/wandb/run-20210325_163311-2umibr2x
[2m[36m(pid=14153)[0m wandb: Run `wandb offline` to turn off syncing.
[2m[36m(pid=14165)[0m wandb: Currently logged in as: angelovtt (use `wandb login --relogin` to force relogin)
[2m[36m(pid=14001)[0m wandb: - 8.61MB of 8.61MB uploaded (0.00MB deduped)
[2m[36m(pid=14001)[0m wandb: \ 9.51MB of 9.51MB uploaded (0.00MB deduped)
[2m[36m(pid=14153)[0m GPU available: False, used:

[2m[36m(pid=14165)[0m 


wandb:                                                                                
[2m[36m(pid=14001)[0m wandb: Find user logs for this run at: /Users/angelolovatto/Repositories/personal/LQG-SVG/experiments/wandb/run-20210325_163106-9vib5hut/logs/debug.log
[2m[36m(pid=14001)[0m wandb: Find internal logs for this run at: /Users/angelolovatto/Repositories/personal/LQG-SVG/experiments/wandb/run-20210325_163106-9vib5hut/logs/debug-internal.log
[2m[36m(pid=14001)[0m wandb: Run summary:
[2m[36m(pid=14001)[0m wandb:                   stability True
[2m[36m(pid=14001)[0m wandb:             controllability True
[2m[36m(pid=14001)[0m wandb:                    val/loss 58.80008
[2m[36m(pid=14001)[0m wandb:       val/monte_carlo_value -99.54904
[2m[36m(pid=14001)[0m wandb:    val/monte_carlo_svg_norm 73.20168
[2m[36m(pid=14001)[0m wandb:        val/monte_carlo_diff -8.68037
[2m[36m(pid=14001)[0m wandb:      val/monte_carlo_cossim 0.63138
[2m[36m(pid=14001)[0m w

[2m[36m(pid=14001)[0m 


[2m[36m(pid=14165)[0m GPU available: False, used: False
[2m[36m(pid=14165)[0m TPU available: None, using: 0 TPU cores
[2m[36m(pid=14221)[0m wandb: Currently logged in as: angelovtt (use `wandb login --relogin` to force relogin)
[2m[36m(pid=14221)[0m wandb: Tracking run with wandb version 0.10.23
[2m[36m(pid=14221)[0m wandb: Syncing run SVG Prediction
[2m[36m(pid=14221)[0m wandb: ⭐️ View project at https://wandb.ai/angelovtt/LQG-SVG
[2m[36m(pid=14221)[0m wandb: 🚀 View run at https://wandb.ai/angelovtt/LQG-SVG/runs/2xu2jguf
[2m[36m(pid=14221)[0m wandb: Run data is saved locally in /Users/angelolovatto/Repositories/personal/LQG-SVG/experiments/wandb/run-20210325_163329-2xu2jguf
[2m[36m(pid=14221)[0m wandb: Run `wandb offline` to turn off syncing.


[2m[36m(pid=14221)[0m 


[2m[36m(pid=14221)[0m GPU available: False, used: False
[2m[36m(pid=14221)[0m TPU available: None, using: 0 TPU cores


[2m[36m(pid=14002)[0m --------------------------------------------------------------------------------
[2m[36m(pid=14002)[0m DATALOADER:0 TEST RESULTS
[2m[36m(pid=14002)[0m {'test/analytic_cossim': tensor(0.7894),
[2m[36m(pid=14002)[0m  'test/analytic_diff': 
[2m[36m(pid=14002)[0m tensor(-0.1457),
[2m[36m(pid=14002)[0m  'test/analytic_svg_norm': tensor(54.9142),
[2m[36m(pid=14002)[0m  
[2m[36m(pid=14002)[0m 'test/analytic_value': tensor(-65.7487),
[2m[36m(pid=14002)[0m  'test/loss': tensor(65.3520)
[2m[36m(pid=14002)[0m ,
[2m[36m(pid=14002)[0m  'test/monte_carlo_cossim': tensor(0.7619),
[2m[36m(pid=14002)[0m  'test/monte_carlo_diff': 
[2m[36m(pid=14002)[0m tensor(-2.3216),
[2m[36m(pid=14002)[0m  'test/monte_carlo_svg_norm': 
[2m[36m(pid=14002)[0m tensor(56.8384),
[2m[36m(pid=14002)[0m  'test/monte_carlo_value': 
[2m[36m(pid=14002)[0m tensor(-67.9247),
[2m[36m(pid=14002)[0m  'true_svg_norm': tensor(89.1708),
[2m[36m(pid=14002)[0m 

[2m[36m(pid=14002)[0m wandb: Adding directory to artifact (/Users/angelolovatto/Repositories/personal/LQG-SVG/experiments/wandb/run-20210325_163106-1ew0t77s/files/checkpoints)... 
[2m[36m(pid=14002)[0m Done. 0.1s


Result for Experiment_a089f_00001:
  date: 2021-03-25_16-33-53
  done: true
  experiment_id: afc7a964ae11451ca216664be0bba6fa
  hostname: Angelos-MBP
  iterations_since_restore: 1
  node_ip: 192.168.15.11
  pid: 14002
  test/analytic_cossim: 0.7893773913383484
  test/analytic_diff: -0.14565277099609375
  test/analytic_svg_norm: 54.91423416137695
  test/analytic_value: -65.74874114990234
  test/loss: 65.35197448730469
  test/monte_carlo_cossim: 0.7619448304176331
  test/monte_carlo_diff: -2.3215789794921875
  test/monte_carlo_svg_norm: 56.83843994140625
  test/monte_carlo_value: -67.92466735839844
  time_since_restore: 157.19400906562805
  time_this_iter_s: 157.19400906562805
  time_total_s: 157.19400906562805
  timestamp: 1616700833
  timesteps_since_restore: 0
  training_iteration: 1
  trial_id: a089f_00001
  true_svg_norm: 89.1707534790039
  true_value: -65.60308837890625
  


Trial name,status,loc,policy/module/model_input_norm,iter,total time (s),test/loss,true_value,true_svg_norm
Experiment_a089f_00004,RUNNING,,True,,,,,
Experiment_a089f_00005,RUNNING,,False,,,,,
Experiment_a089f_00006,RUNNING,,True,,,,,
Experiment_a089f_00007,PENDING,,False,,,,,
Experiment_a089f_00000,TERMINATED,,True,1.0,105.798,,-594.717,1737.42
Experiment_a089f_00001,TERMINATED,,False,1.0,157.194,,-65.6031,89.1708
Experiment_a089f_00002,TERMINATED,,True,1.0,96.4929,,-134.075,124.17
Experiment_a089f_00003,TERMINATED,,False,1.0,118.327,,-90.8687,74.5132


[2m[36m(pid=14002)[0m wandb: Waiting for W&B process to finish, PID 14044
[2m[36m(pid=14002)[0m wandb: Program ended successfully.
[2m[36m(pid=14002)[0m wandb: - 8.86MB of 8.86MB uploaded (0.00MB deduped)
[2m[36m(pid=14002)[0m wandb: \ 9.50MB of 10.02MB uploaded (0.00MB deduped)
wandb:                                                                                
[2m[36m(pid=14002)[0m wandb: Find user logs for this run at: /Users/angelolovatto/Repositories/personal/LQG-SVG/experiments/wandb/run-20210325_163106-1ew0t77s/logs/debug.log
[2m[36m(pid=14002)[0m wandb: Find internal logs for this run at: /Users/angelolovatto/Repositories/personal/LQG-SVG/experiments/wandb/run-20210325_163106-1ew0t77s/logs/debug-internal.log
[2m[36m(pid=14002)[0m wandb: Run summary:
[2m[36m(pid=14002)[0m wandb:                   stability True
[2m[36m(pid=14002)[0m wandb:             controllability True
[2m[36m(pid=14002)[0m wandb:                    val/loss 65.8058
[2m[36m(p

[2m[36m(pid=14002)[0m 


[2m[36m(pid=14255)[0m wandb: Currently logged in as: angelovtt (use `wandb login --relogin` to force relogin)
[2m[36m(pid=14255)[0m wandb: Tracking run with wandb version 0.10.23
[2m[36m(pid=14255)[0m wandb: Syncing run SVG Prediction
[2m[36m(pid=14255)[0m wandb: ⭐️ View project at https://wandb.ai/angelovtt/LQG-SVG
[2m[36m(pid=14255)[0m wandb: 🚀 View run at https://wandb.ai/angelovtt/LQG-SVG/runs/2ormee86
[2m[36m(pid=14255)[0m wandb: Run data is saved locally in /Users/angelolovatto/Repositories/personal/LQG-SVG/experiments/wandb/run-20210325_163410-2ormee86
[2m[36m(pid=14255)[0m wandb: Run `wandb offline` to turn off syncing.


[2m[36m(pid=14255)[0m 


[2m[36m(pid=14255)[0m GPU available: False, used: False
[2m[36m(pid=14255)[0m TPU available: None, using: 0 TPU cores
[2m[36m(pid=14153)[0m wandb: Adding directory to artifact (/Users/angelolovatto/Repositories/personal/LQG-SVG/experiments/wandb/run-20210325_163311-2umibr2x/files/checkpoints)... 
[2m[36m(pid=14153)[0m Done. 0.0s


[2m[36m(pid=14153)[0m --------------------------------------------------------------------------------
[2m[36m(pid=14153)[0m DATALOADER:0 TEST RESULTS
[2m[36m(pid=14153)[0m {'test/analytic_cossim': tensor(0.6636),
[2m[36m(pid=14153)[0m  'test/analytic_diff': tensor(3.9228),
[2m[36m(pid=14153)[0m  'test/analytic_svg_norm': tensor(23.0708),
[2m[36m(pid=14153)[0m  'test/analytic_value': tensor(-60.5743),
[2m[36m(pid=14153)[0m  'test/loss': tensor(48.9358),
[2m[36m(pid=14153)[0m  'test/monte_carlo_cossim': tensor(0.6542),
[2m[36m(pid=14153)[0m  'test/monte_carlo_diff': tensor(5.2784),
[2m[36m(pid=14153)[0m  'test/monte_carlo_svg_norm': tensor(22.3870),
[2m[36m(pid=14153)[0m  'test/monte_carlo_value': tensor(-59.2187),
[2m[36m(pid=14153)[0m  'true_svg_norm': tensor(30.5406),
[2m[36m(pid=14153)[0m  'true_value': tensor(-64.4971)}
[2m[36m(pid=14153)[0m --------------------------------------------------------------------------------
Result for Experime

Trial name,status,loc,policy/module/model_input_norm,iter,total time (s),test/loss,true_value,true_svg_norm
Experiment_a089f_00005,RUNNING,,False,,,,,
Experiment_a089f_00006,RUNNING,,True,,,,,
Experiment_a089f_00007,RUNNING,,False,,,,,
Experiment_a089f_00008,PENDING,,True,,,,,
Experiment_a089f_00000,TERMINATED,,True,1.0,105.798,,-594.717,1737.42
Experiment_a089f_00001,TERMINATED,,False,1.0,157.194,,-65.6031,89.1708
Experiment_a089f_00002,TERMINATED,,True,1.0,96.4929,,-134.075,124.17
Experiment_a089f_00003,TERMINATED,,False,1.0,118.327,,-90.8687,74.5132
Experiment_a089f_00004,TERMINATED,,True,1.0,63.3313,,-64.4971,30.5406


[2m[36m(pid=14153)[0m wandb: Waiting for W&B process to finish, PID 14175
[2m[36m(pid=14153)[0m wandb: Program ended successfully.
[2m[36m(pid=14153)[0m wandb: - 7.90MB of 7.90MB uploaded (0.00MB deduped)
wandb:                                                                                
[2m[36m(pid=14153)[0m wandb: Find user logs for this run at: /Users/angelolovatto/Repositories/personal/LQG-SVG/experiments/wandb/run-20210325_163311-2umibr2x/logs/debug.log
[2m[36m(pid=14153)[0m wandb: Find internal logs for this run at: /Users/angelolovatto/Repositories/personal/LQG-SVG/experiments/wandb/run-20210325_163311-2umibr2x/logs/debug-internal.log
[2m[36m(pid=14153)[0m wandb: Run summary:
[2m[36m(pid=14153)[0m wandb:                   stability True
[2m[36m(pid=14153)[0m wandb:             controllability True
[2m[36m(pid=14153)[0m wandb:                    val/loss 49.61028
[2m[36m(pid=14153)[0m wandb:       val/monte_carlo_value -54.77003
[2m[36m(pid=1415

[2m[36m(pid=14153)[0m 


[2m[36m(pid=14289)[0m wandb: Currently logged in as: angelovtt (use `wandb login --relogin` to force relogin)
[2m[36m(pid=14289)[0m wandb: Tracking run with wandb version 0.10.23
[2m[36m(pid=14289)[0m wandb: Syncing run SVG Prediction
[2m[36m(pid=14289)[0m wandb: ⭐️ View project at https://wandb.ai/angelovtt/LQG-SVG
[2m[36m(pid=14289)[0m wandb: 🚀 View run at https://wandb.ai/angelovtt/LQG-SVG/runs/w3q7vlcd
[2m[36m(pid=14289)[0m wandb: Run data is saved locally in /Users/angelolovatto/Repositories/personal/LQG-SVG/experiments/wandb/run-20210325_163439-w3q7vlcd
[2m[36m(pid=14289)[0m wandb: Run `wandb offline` to turn off syncing.


[2m[36m(pid=14289)[0m 


[2m[36m(pid=14289)[0m GPU available: False, used: False
[2m[36m(pid=14289)[0m TPU available: None, using: 0 TPU cores
[2m[36m(pid=14165)[0m wandb: Adding directory to artifact (/Users/angelolovatto/Repositories/personal/LQG-SVG/experiments/wandb/run-20210325_163317-2pbbblla/files/checkpoints)... 
[2m[36m(pid=14165)[0m Done. 0.1s


[2m[36m(pid=14165)[0m --------------------------------------------------------------------------------
[2m[36m(pid=14165)[0m DATALOADER:0 TEST RESULTS
[2m[36m(pid=14165)[0m {'test/analytic_cossim': tensor(0.7693),
[2m[36m(pid=14165)[0m  'test/analytic_diff': tensor(0.7446),
[2m[36m(pid=14165)[0m  'test/analytic_svg_norm': tensor(55.4716),
[2m[36m(pid=14165)[0m  'test/analytic_value': tensor(-69.7089),
[2m[36m(pid=14165)[0m  'test/loss': tensor(62.7056),
[2m[36m(pid=14165)[0m  'test/monte_carlo_cossim': tensor(0.7369),
[2m[36m(pid=14165)[0m  'test/monte_carlo_diff': tensor(10.9868),
[2m[36m(pid=14165)[0m  'test/monte_carlo_svg_norm': tensor(44.3377),
[2m[36m(pid=14165)[0m  'test/monte_carlo_value': tensor(-59.4667),
[2m[36m(pid=14165)[0m  'true_svg_norm': tensor(86.3870),
[2m[36m(pid=14165)[0m  'true_value': tensor(-70.4535)}
[2m[36m(pid=14165)[0m --------------------------------------------------------------------------------
Result for Experim

Trial name,status,loc,policy/module/model_input_norm,iter,total time (s),test/loss,true_value,true_svg_norm
Experiment_a089f_00006,RUNNING,,True,,,,,
Experiment_a089f_00007,RUNNING,,False,,,,,
Experiment_a089f_00008,RUNNING,,True,,,,,
Experiment_a089f_00009,PENDING,,False,,,,,
Experiment_a089f_00000,TERMINATED,,True,1.0,105.798,,-594.717,1737.42
Experiment_a089f_00001,TERMINATED,,False,1.0,157.194,,-65.6031,89.1708
Experiment_a089f_00002,TERMINATED,,True,1.0,96.4929,,-134.075,124.17
Experiment_a089f_00003,TERMINATED,,False,1.0,118.327,,-90.8687,74.5132
Experiment_a089f_00004,TERMINATED,,True,1.0,63.3313,,-64.4971,30.5406
Experiment_a089f_00005,TERMINATED,,False,1.0,147.256,,-70.4535,86.387


[2m[36m(pid=14165)[0m wandb: Waiting for W&B process to finish, PID 14202
[2m[36m(pid=14165)[0m wandb: Program ended successfully.
[2m[36m(pid=14165)[0m wandb: - 8.31MB of 8.31MB uploaded (0.00MB deduped)
[2m[36m(pid=14165)[0m wandb: \ 9.17MB of 9.17MB uploaded (0.00MB deduped)
wandb:                                                                                
[2m[36m(pid=14165)[0m wandb: Find user logs for this run at: /Users/angelolovatto/Repositories/personal/LQG-SVG/experiments/wandb/run-20210325_163317-2pbbblla/logs/debug.log
[2m[36m(pid=14165)[0m wandb: Find internal logs for this run at: /Users/angelolovatto/Repositories/personal/LQG-SVG/experiments/wandb/run-20210325_163317-2pbbblla/logs/debug-internal.log
[2m[36m(pid=14165)[0m wandb: Run summary:
[2m[36m(pid=14165)[0m wandb:                   stability True
[2m[36m(pid=14165)[0m wandb:             controllability True
[2m[36m(pid=14165)[0m wandb:                    val/loss 63.24604
[2m[36m(p

[2m[36m(pid=14165)[0m 


[2m[36m(pid=14390)[0m wandb: Currently logged in as: angelovtt (use `wandb login --relogin` to force relogin)
[2m[36m(pid=14390)[0m wandb: Tracking run with wandb version 0.10.23
[2m[36m(pid=14390)[0m wandb: Syncing run SVG Prediction
[2m[36m(pid=14390)[0m wandb: ⭐️ View project at https://wandb.ai/angelovtt/LQG-SVG
[2m[36m(pid=14390)[0m wandb: 🚀 View run at https://wandb.ai/angelovtt/LQG-SVG/runs/1ihyllnr
[2m[36m(pid=14390)[0m wandb: Run data is saved locally in /Users/angelolovatto/Repositories/personal/LQG-SVG/experiments/wandb/run-20210325_163613-1ihyllnr
[2m[36m(pid=14390)[0m wandb: Run `wandb offline` to turn off syncing.


[2m[36m(pid=14390)[0m 


[2m[36m(pid=14390)[0m GPU available: False, used: False
[2m[36m(pid=14390)[0m TPU available: None, using: 0 TPU cores
[2m[36m(pid=14390)[0m 2021-03-25 16:36:23,789	INFO trainable.py:100 -- Trainable.setup took 11.974 seconds. If your trainable is slow to initialize, consider setting reuse_actors=True to reduce actor creation overheads.
[2m[36m(pid=14289)[0m wandb: Adding directory to artifact (/Users/angelolovatto/Repositories/personal/LQG-SVG/experiments/wandb/run-20210325_163439-w3q7vlcd/files/checkpoints)... 
[2m[36m(pid=14289)[0m Done. 0.0s


[2m[36m(pid=14289)[0m --------------------------------------------------------------------------------
[2m[36m(pid=14289)[0m DATALOADER:0 TEST RESULTS
[2m[36m(pid=14289)[0m {'test/analytic_cossim': tensor(0.3760),
[2m[36m(pid=14289)[0m  'test/analytic_diff': tensor(3.4601),
[2m[36m(pid=14289)[0m  'test/analytic_svg_norm': tensor(337.5562),
[2m[36m(pid=14289)[0m  'test/analytic_value': tensor(-374.7712),
[2m[36m(pid=14289)[0m  'test/loss': tensor(62.3315),
[2m[36m(pid=14289)[0m  'test/monte_carlo_cossim': tensor(0.3848),
[2m[36m(pid=14289)[0m  'test/monte_carlo_diff': tensor(45.4628),
[2m[36m(pid=14289)[0m  'test/monte_carlo_svg_norm': tensor(316.9302),
[2m[36m(pid=14289)[0m  'test/monte_carlo_value': tensor(-332.7686),
[2m[36m(pid=14289)[0m  'true_svg_norm': tensor(309.2850),
[2m[36m(pid=14289)[0m  'true_value': tensor(-378.2314)}
[2m[36m(pid=14289)[0m --------------------------------------------------------------------------------
Result for E

[2m[36m(pid=14289)[0m wandb: Waiting for W&B process to finish, PID 14298
[2m[36m(pid=14289)[0m wandb: Program ended successfully.


Trial name,status,loc,policy/module/model_input_norm,iter,total time (s),test/loss,true_value,true_svg_norm
Experiment_a089f_00006,RUNNING,,True,,,,,
Experiment_a089f_00007,RUNNING,,False,,,,,
Experiment_a089f_00009,RUNNING,,False,,,,,
Experiment_a089f_00010,PENDING,,True,,,,,
Experiment_a089f_00000,TERMINATED,,True,1.0,105.798,,-594.717,1737.42
Experiment_a089f_00001,TERMINATED,,False,1.0,157.194,,-65.6031,89.1708
Experiment_a089f_00002,TERMINATED,,True,1.0,96.4929,,-134.075,124.17
Experiment_a089f_00003,TERMINATED,,False,1.0,118.327,,-90.8687,74.5132
Experiment_a089f_00004,TERMINATED,,True,1.0,63.3313,,-64.4971,30.5406
Experiment_a089f_00005,TERMINATED,,False,1.0,147.256,,-70.4535,86.387


[2m[36m(pid=14289)[0m wandb: - 8.53MB of 8.53MB uploaded (0.00MB deduped)
[2m[36m(pid=14289)[0m wandb: \ 8.84MB of 9.46MB uploaded (0.00MB deduped)
wandb:                                                                                
[2m[36m(pid=14289)[0m wandb: Find user logs for this run at: /Users/angelolovatto/Repositories/personal/LQG-SVG/experiments/wandb/run-20210325_163439-w3q7vlcd/logs/debug.log
[2m[36m(pid=14289)[0m wandb: Find internal logs for this run at: /Users/angelolovatto/Repositories/personal/LQG-SVG/experiments/wandb/run-20210325_163439-w3q7vlcd/logs/debug-internal.log
[2m[36m(pid=14289)[0m wandb: Run summary:
[2m[36m(pid=14289)[0m wandb:                   stability True
[2m[36m(pid=14289)[0m wandb:             controllability True
[2m[36m(pid=14289)[0m wandb:                    val/loss 63.1637
[2m[36m(pid=14289)[0m wandb:       val/monte_carlo_value -307.82315
[2m[36m(pid=14289)[0m wandb:    val/monte_carlo_svg_norm 248.34383
[2m[36

[2m[36m(pid=14289)[0m 


[2m[36m(pid=14483)[0m wandb: Currently logged in as: angelovtt (use `wandb login --relogin` to force relogin)
[2m[36m(pid=14483)[0m wandb: Tracking run with wandb version 0.10.23
[2m[36m(pid=14483)[0m wandb: Syncing run SVG Prediction
[2m[36m(pid=14483)[0m wandb: ⭐️ View project at https://wandb.ai/angelovtt/LQG-SVG
[2m[36m(pid=14483)[0m wandb: 🚀 View run at https://wandb.ai/angelovtt/LQG-SVG/runs/1cjt7j51
[2m[36m(pid=14483)[0m wandb: Run data is saved locally in /Users/angelolovatto/Repositories/personal/LQG-SVG/experiments/wandb/run-20210325_163801-1cjt7j51
[2m[36m(pid=14483)[0m wandb: Run `wandb offline` to turn off syncing.


[2m[36m(pid=14483)[0m 
[2m[36m(pid=14255)[0m --------------------------------------------------------------------------------
[2m[36m(pid=14255)[0m DATALOADER:0 TEST RESULTS
[2m[36m(pid=14255)[0m {'test/analytic_cossim': tensor(0.6329),
[2m[36m(pid=14255)[0m  'test/analytic_diff': tensor(36.0466),
[2m[36m(pid=14255)[0m  'test/analytic_svg_norm': tensor(3596.6912),
[2m[36m(pid=14255)[0m  'test/analytic_value': tensor(-1352.9846),
[2m[36m(pid=14255)[0m  'test/loss': tensor(67.4773),
[2m[36m(pid=14255)[0m  'test/monte_carlo_cossim': tensor(0.6295),
[2m[36m(pid=14255)[0m  'test/monte_carlo_diff': tensor(-708.4246),
[2m[36m(pid=14255)[0m  'test/monte_carlo_svg_norm': tensor(6022.3613),
[2m[36m(pid=14255)[0m  'test/monte_carlo_value': tensor(-2097.4558),
[2m[36m(pid=14255)[0m  'true_svg_norm': 
[2m[36m(pid=14255)[0m tensor(8908.1045),
[2m[36m(pid=14255)[0m  'true_value': 
[2m[36m(pid=14255)[0m tensor(-1389.0312)}
[2m[36m(pid=14255)[0m ------

[2m[36m(pid=14255)[0m wandb: Adding directory to artifact (/Users/angelolovatto/Repositories/personal/LQG-SVG/experiments/wandb/run-20210325_163410-2ormee86/files/checkpoints)... 
[2m[36m(pid=14255)[0m Done. 0.1s


Result for Experiment_a089f_00007:
  date: 2021-03-25_16-38-10
  done: true
  experiment_id: 5e4af003e75d48ef94ab8ff4ffda91c1
  hostname: Angelos-MBP
  iterations_since_restore: 1
  node_ip: 192.168.15.11
  pid: 14255
  test/analytic_cossim: 0.6329435706138611
  test/analytic_diff: 36.046630859375
  test/analytic_svg_norm: 3596.691162109375
  test/analytic_value: -1352.984619140625
  test/loss: 67.47732543945312
  test/monte_carlo_cossim: 0.6294918656349182
  test/monte_carlo_diff: -708.424560546875
  test/monte_carlo_svg_norm: 6022.361328125
  test/monte_carlo_value: -2097.455810546875
  time_since_restore: 232.19826984405518
  time_this_iter_s: 232.19826984405518
  time_total_s: 232.19826984405518
  timestamp: 1616701090
  timesteps_since_restore: 0
  training_iteration: 1
  trial_id: a089f_00007
  true_svg_norm: 8908.1044921875
  true_value: -1389.03125
  


Trial name,status,loc,policy/module/model_input_norm,iter,total time (s),test/loss,true_value,true_svg_norm
Experiment_a089f_00006,RUNNING,,True,,,,,
Experiment_a089f_00009,RUNNING,,False,,,,,
Experiment_a089f_00010,RUNNING,,True,,,,,
Experiment_a089f_00011,PENDING,,False,,,,,
Experiment_a089f_00000,TERMINATED,,True,1.0,105.798,,-594.717,1737.42
Experiment_a089f_00001,TERMINATED,,False,1.0,157.194,,-65.6031,89.1708
Experiment_a089f_00002,TERMINATED,,True,1.0,96.4929,,-134.075,124.17
Experiment_a089f_00003,TERMINATED,,False,1.0,118.327,,-90.8687,74.5132
Experiment_a089f_00004,TERMINATED,,True,1.0,63.3313,,-64.4971,30.5406
Experiment_a089f_00005,TERMINATED,,False,1.0,147.256,,-70.4535,86.387


[2m[36m(pid=14255)[0m wandb: Waiting for W&B process to finish, PID 14264
[2m[36m(pid=14255)[0m wandb: Program ended successfully.
[2m[36m(pid=14390)[0m wandb: Adding directory to artifact (/Users/angelolovatto/Repositories/personal/LQG-SVG/experiments/wandb/run-20210325_163613-1ihyllnr/files/checkpoints)... 
[2m[36m(pid=14390)[0m Done. 0.0s


[2m[36m(pid=14390)[0m --------------------------------------------------------------------------------
[2m[36m(pid=14390)[0m DATALOADER:0 TEST RESULTS
[2m[36m(pid=14390)[0m {'test/analytic_cossim': tensor(0.2534),
[2m[36m(pid=14390)[0m  'test/analytic_diff': tensor(-3.1252),
[2m[36m(pid=14390)[0m  'test/analytic_svg_norm': tensor(139.2991),
[2m[36m(pid=14390)[0m  'test/analytic_value': tensor(-153.2268),
[2m[36m(pid=14390)[0m  'test/loss': tensor(58.0102),
[2m[36m(pid=14390)[0m  'test/monte_carlo_cossim': tensor(0.2869),
[2m[36m(pid=14390)[0m  'test/monte_carlo_diff': tensor(11.8587),
[2m[36m(pid=14390)[0m  'test/monte_carlo_svg_norm': tensor(126.4730),
[2m[36m(pid=14390)[0m  'test/monte_carlo_value': tensor(-138.2429),
[2m[36m(pid=14390)[0m  'true_svg_norm': tensor(260.3735),
[2m[36m(pid=14390)[0m  'true_value': tensor(-150.1016)}
[2m[36m(pid=14390)[0m --------------------------------------------------------------------------------
Result for 

[2m[36m(pid=14390)[0m wandb: Waiting for W&B process to finish, PID 14407
[2m[36m(pid=14390)[0m wandb: Program ended successfully.
[2m[36m(pid=14483)[0m GPU available: False, used: False
[2m[36m(pid=14483)[0m TPU available: None, using: 0 TPU cores
[2m[36m(pid=14483)[0m 2021-03-25 16:38:12,744	INFO trainable.py:100 -- Trainable.setup took 12.318 seconds. If your trainable is slow to initialize, consider setting reuse_actors=True to reduce actor creation overheads.
[2m[36m(pid=14255)[0m wandb: - 8.68MB of 8.68MB uploaded (0.00MB deduped)
[2m[36m(pid=14390)[0m wandb: - 8.16MB of 8.16MB uploaded (0.00MB deduped)
[2m[36m(pid=14255)[0m wandb: \ 9.88MB of 9.91MB uploaded (0.00MB deduped)
[2m[36m(pid=14390)[0m wandb: \ 8.72MB of 8.72MB uploaded (0.00MB deduped)
wandb:                                                                                
wandb:                                                                                
[2m[36m(pid=14255)[0m wandb: Fi

[2m[36m(pid=14255)[0m 


[2m[36m(pid=14390)[0m wandb: Find user logs for this run at: /Users/angelolovatto/Repositories/personal/LQG-SVG/experiments/wandb/run-20210325_163613-1ihyllnr/logs/debug.log
[2m[36m(pid=14390)[0m wandb: Find internal logs for this run at: /Users/angelolovatto/Repositories/personal/LQG-SVG/experiments/wandb/run-20210325_163613-1ihyllnr/logs/debug-internal.log
[2m[36m(pid=14390)[0m wandb: Run summary:
[2m[36m(pid=14390)[0m wandb:                   stability True
[2m[36m(pid=14390)[0m wandb:             controllability True
[2m[36m(pid=14390)[0m wandb:                    val/loss 58.57063
[2m[36m(pid=14390)[0m wandb:       val/monte_carlo_value -147.77856
[2m[36m(pid=14390)[0m wandb:    val/monte_carlo_svg_norm 165.57512
[2m[36m(pid=14390)[0m wandb:        val/monte_carlo_diff 2.32307
[2m[36m(pid=14390)[0m wandb:      val/monte_carlo_cossim 0.2981
[2m[36m(pid=14390)[0m wandb:          val/analytic_value -153.22679
[2m[36m(pid=14390)[0m wandb:       val/

[2m[36m(pid=14390)[0m 


[2m[36m(pid=14524)[0m wandb: Currently logged in as: angelovtt (use `wandb login --relogin` to force relogin)
[2m[36m(pid=14527)[0m wandb: Currently logged in as: angelovtt (use `wandb login --relogin` to force relogin)
[2m[36m(pid=14524)[0m wandb: Tracking run with wandb version 0.10.23
[2m[36m(pid=14524)[0m wandb: Syncing run SVG Prediction
[2m[36m(pid=14524)[0m wandb: ⭐️ View project at https://wandb.ai/angelovtt/LQG-SVG
[2m[36m(pid=14524)[0m wandb: 🚀 View run at https://wandb.ai/angelovtt/LQG-SVG/runs/239xueqw
[2m[36m(pid=14524)[0m wandb: Run data is saved locally in /Users/angelolovatto/Repositories/personal/LQG-SVG/experiments/wandb/run-20210325_163831-239xueqw
[2m[36m(pid=14524)[0m wandb: Run `wandb offline` to turn off syncing.
[2m[36m(pid=14527)[0m wandb: Tracking run with wandb version 0.10.23
[2m[36m(pid=14527)[0m wandb: Syncing run SVG Prediction
[2m[36m(pid=14527)[0m wandb: ⭐️ View project at https://wandb.ai/angelovtt/LQG-SVG
[2m[36m(pid

[2m[36m(pid=14524)[0m 
[2m[36m(pid=14527)[0m 


[2m[36m(pid=14524)[0m GPU available: False, used: False
[2m[36m(pid=14524)[0m TPU available: None, using: 0 TPU cores
[2m[36m(pid=14524)[0m 2021-03-25 16:38:42,571	INFO trainable.py:100 -- Trainable.setup took 12.324 seconds. If your trainable is slow to initialize, consider setting reuse_actors=True to reduce actor creation overheads.
[2m[36m(pid=14527)[0m GPU available: False, used: False
[2m[36m(pid=14527)[0m TPU available: None, using: 0 TPU cores
[2m[36m(pid=14527)[0m 2021-03-25 16:38:42,648	INFO trainable.py:100 -- Trainable.setup took 12.401 seconds. If your trainable is slow to initialize, consider setting reuse_actors=True to reduce actor creation overheads.


[2m[36m(pid=14221)[0m --------------------------------------------------------------------------------
[2m[36m(pid=14221)[0m DATALOADER:0 TEST RESULTS
[2m[36m(pid=14221)[0m {'test/analytic_cossim': tensor(0.1443),
[2m[36m(pid=14221)[0m  'test/analytic_diff': tensor(-7.3483),
[2m[36m(pid=14221)[0m  'test/analytic_svg_norm': tensor(4396.1460),
[2m[36m(pid=14221)[0m  'test/analytic_value': tensor(-1861.6594),
[2m[36m(pid=14221)[0m  'test/loss': tensor(50.9894),
[2m[36m(pid=14221)[0m  'test/monte_carlo_cossim': tensor(0.1414),
[2m[36m(pid=14221)[0m  'test/monte_carlo_diff': tensor(62.2527),
[2m[36m(pid=14221)[0m  'test/monte_carlo_svg_norm': tensor(4108.7969),
[2m[36m(pid=14221)[0m  'test/monte_carlo_value': tensor(-1792.0585),
[2m[36m(pid=14221)[0m  'true_svg_norm': tensor(12634.4541),
[2m[36m(pid=14221)[0m  'true_value': tensor(-1854.3112)}
[2m[36m(pid=14221)[0m --------------------------------------------------------------------------------


[2m[36m(pid=14221)[0m wandb: Adding directory to artifact (/Users/angelolovatto/Repositories/personal/LQG-SVG/experiments/wandb/run-20210325_163329-2xu2jguf/files/checkpoints)... 
[2m[36m(pid=14221)[0m Done. 0.1s


Result for Experiment_a089f_00006:
  date: 2021-03-25_16-39-50
  done: true
  experiment_id: efbdf83f90da4485854ae7ea4f067028
  hostname: Angelos-MBP
  iterations_since_restore: 1
  node_ip: 192.168.15.11
  pid: 14221
  test/analytic_cossim: 0.14432017505168915
  test/analytic_diff: -7.3482666015625
  test/analytic_svg_norm: 4396.14599609375
  test/analytic_value: -1861.659423828125
  test/loss: 50.9893913269043
  test/monte_carlo_cossim: 0.14144101738929749
  test/monte_carlo_diff: 62.252685546875
  test/monte_carlo_svg_norm: 4108.796875
  test/monte_carlo_value: -1792.0584716796875
  time_since_restore: 373.20353293418884
  time_this_iter_s: 373.20353293418884
  time_total_s: 373.20353293418884
  timestamp: 1616701190
  timesteps_since_restore: 0
  training_iteration: 1
  trial_id: a089f_00006
  true_svg_norm: 12634.4541015625
  true_value: -1854.3111572265625
  


Trial name,status,loc,policy/module/model_input_norm,iter,total time (s),test/loss,true_value,true_svg_norm
Experiment_a089f_00010,RUNNING,,True,,,,,
Experiment_a089f_00011,RUNNING,,False,,,,,
Experiment_a089f_00012,RUNNING,,True,,,,,
Experiment_a089f_00013,PENDING,,False,,,,,
Experiment_a089f_00000,TERMINATED,,True,1.0,105.798,,-594.717,1737.42
Experiment_a089f_00001,TERMINATED,,False,1.0,157.194,,-65.6031,89.1708
Experiment_a089f_00002,TERMINATED,,True,1.0,96.4929,,-134.075,124.17
Experiment_a089f_00003,TERMINATED,,False,1.0,118.327,,-90.8687,74.5132
Experiment_a089f_00004,TERMINATED,,True,1.0,63.3313,,-64.4971,30.5406
Experiment_a089f_00005,TERMINATED,,False,1.0,147.256,,-70.4535,86.387


[2m[36m(pid=14221)[0m wandb: Waiting for W&B process to finish, PID 14230
[2m[36m(pid=14221)[0m wandb: Program ended successfully.
[2m[36m(pid=14221)[0m wandb: - 9.48MB of 9.48MB uploaded (0.00MB deduped)
[2m[36m(pid=14483)[0m wandb: Adding directory to artifact (/Users/angelolovatto/Repositories/personal/LQG-SVG/experiments/wandb/run-20210325_163801-1cjt7j51/files/checkpoints)... 
[2m[36m(pid=14483)[0m Done. 0.0s


[2m[36m(pid=14483)[0m --------------------------------------------------------------------------------
[2m[36m(pid=14483)[0m DATALOADER:0 TEST RESULTS
[2m[36m(pid=14483)[0m {'test/analytic_cossim': tensor(0.7319),
[2m[36m(pid=14483)[0m  'test/analytic_diff': tensor(0.3793),
[2m[36m(pid=14483)[0m  'test/analytic_svg_norm': tensor(69.0545),
[2m[36m(pid=14483)[0m  'test/analytic_value': tensor(-82.3405),
[2m[36m(pid=14483)[0m  'test/loss': tensor(63.0157),
[2m[36m(pid=14483)[0m  'test/monte_carlo_cossim': tensor(0.7131),
[2m[36m(pid=14483)[0m  'test/monte_carlo_diff': tensor(4.4111),
[2m[36m(pid=14483)[0m  'test/monte_carlo_svg_norm': tensor(62.5041),
[2m[36m(pid=14483)[0m  'test/monte_carlo_value': tensor(-78.3087),
[2m[36m(pid=14483)[0m  'true_svg_norm': tensor(117.4874),
[2m[36m(pid=14483)[0m  'true_value': tensor(-82.7198)}
[2m[36m(pid=14483)[0m --------------------------------------------------------------------------------
Result for Experim

Trial name,status,loc,policy/module/model_input_norm,iter,total time (s),test/loss,true_value,true_svg_norm
Experiment_a089f_00011,RUNNING,,False,,,,,
Experiment_a089f_00012,RUNNING,,True,,,,,
Experiment_a089f_00013,RUNNING,,False,,,,,
Experiment_a089f_00014,PENDING,,True,,,,,
Experiment_a089f_00000,TERMINATED,,True,1.0,105.798,,-594.717,1737.42
Experiment_a089f_00001,TERMINATED,,False,1.0,157.194,,-65.6031,89.1708
Experiment_a089f_00002,TERMINATED,,True,1.0,96.4929,,-134.075,124.17
Experiment_a089f_00003,TERMINATED,,False,1.0,118.327,,-90.8687,74.5132
Experiment_a089f_00004,TERMINATED,,True,1.0,63.3313,,-64.4971,30.5406
Experiment_a089f_00005,TERMINATED,,False,1.0,147.256,,-70.4535,86.387


[2m[36m(pid=14483)[0m wandb: Waiting for W&B process to finish, PID 14500
[2m[36m(pid=14483)[0m wandb: Program ended successfully.
[2m[36m(pid=14221)[0m wandb: \ 10.04MB of 11.51MB uploaded (0.00MB deduped)
[2m[36m(pid=14221)[0m wandb: | 11.51MB of 11.51MB uploaded (0.00MB deduped)
[2m[36m(pid=14483)[0m wandb: - 8.22MB of 8.22MB uploaded (0.00MB deduped)
wandb:                                                                                
wandb:                                                                                
[2m[36m(pid=14221)[0m wandb: Find user logs for this run at: /Users/angelolovatto/Repositories/personal/LQG-SVG/experiments/wandb/run-20210325_163329-2xu2jguf/logs/debug.log
[2m[36m(pid=14221)[0m wandb: Find internal logs for this run at: /Users/angelolovatto/Repositories/personal/LQG-SVG/experiments/wandb/run-20210325_163329-2xu2jguf/logs/debug-internal.log
[2m[36m(pid=14221)[0m wandb: Run summary:
[2m[36m(pid=14221)[0m wandb:           

[2m[36m(pid=14483)[0m 
[2m[36m(pid=14221)[0m 


[2m[36m(pid=14640)[0m wandb: Currently logged in as: angelovtt (use `wandb login --relogin` to force relogin)
[2m[36m(pid=14639)[0m wandb: Currently logged in as: angelovtt (use `wandb login --relogin` to force relogin)
[2m[36m(pid=14640)[0m wandb: Tracking run with wandb version 0.10.23
[2m[36m(pid=14640)[0m wandb: Syncing run SVG Prediction
[2m[36m(pid=14640)[0m wandb: ⭐️ View project at https://wandb.ai/angelovtt/LQG-SVG
[2m[36m(pid=14640)[0m wandb: 🚀 View run at https://wandb.ai/angelovtt/LQG-SVG/runs/37megdvb
[2m[36m(pid=14640)[0m wandb: Run data is saved locally in /Users/angelolovatto/Repositories/personal/LQG-SVG/experiments/wandb/run-20210325_164014-37megdvb
[2m[36m(pid=14640)[0m wandb: Run `wandb offline` to turn off syncing.
[2m[36m(pid=14639)[0m wandb: Tracking run with wandb version 0.10.23
[2m[36m(pid=14639)[0m wandb: Syncing run SVG Prediction
[2m[36m(pid=14639)[0m wandb: ⭐️ View project at https://wandb.ai/angelovtt/LQG-SVG
[2m[36m(pid

[2m[36m(pid=14640)[0m 
[2m[36m(pid=14639)[0m 


[2m[36m(pid=14640)[0m GPU available: False, used: False
[2m[36m(pid=14640)[0m TPU available: None, using: 0 TPU cores
[2m[36m(pid=14640)[0m 2021-03-25 16:40:25,040	INFO trainable.py:100 -- Trainable.setup took 11.859 seconds. If your trainable is slow to initialize, consider setting reuse_actors=True to reduce actor creation overheads.
[2m[36m(pid=14639)[0m GPU available: False, used: False
[2m[36m(pid=14639)[0m TPU available: None, using: 0 TPU cores
[2m[36m(pid=14639)[0m 2021-03-25 16:40:25,095	INFO trainable.py:100 -- Trainable.setup took 11.914 seconds. If your trainable is slow to initialize, consider setting reuse_actors=True to reduce actor creation overheads.
[2m[36m(pid=14524)[0m wandb: Adding directory to artifact (/Users/angelolovatto/Repositories/personal/LQG-SVG/experiments/wandb/run-20210325_163831-239xueqw/files/checkpoints)... 
[2m[36m(pid=14524)[0m Done. 0.0s


[2m[36m(pid=14524)[0m --------------------------------------------------------------------------------
[2m[36m(pid=14524)[0m DATALOADER:0 TEST RESULTS
[2m[36m(pid=14524)[0m {'test/analytic_cossim': tensor(0.3892),
[2m[36m(pid=14524)[0m  'test/analytic_diff': tensor(3.1097),
[2m[36m(pid=14524)[0m  'test/analytic_svg_norm': tensor(103.1134),
[2m[36m(pid=14524)[0m  'test/analytic_value': tensor(-113.1371),
[2m[36m(pid=14524)[0m  'test/loss': tensor(54.8725),
[2m[36m(pid=14524)[0m  'test/monte_carlo_cossim': tensor(0.3107),
[2m[36m(pid=14524)[0m  'test/monte_carlo_diff': tensor(16.2651),
[2m[36m(pid=14524)[0m  'test/monte_carlo_svg_norm': tensor(83.6801),
[2m[36m(pid=14524)[0m  'test/monte_carlo_value': tensor(-99.9817),
[2m[36m(pid=14524)[0m  'true_svg_norm': tensor(241.6638),
[2m[36m(pid=14524)[0m  'true_value': tensor(-116.2468)}
[2m[36m(pid=14524)[0m --------------------------------------------------------------------------------
Result for Exp

[2m[36m(pid=14524)[0m wandb: Waiting for W&B process to finish, PID 14551
[2m[36m(pid=14524)[0m wandb: Program ended successfully.


Trial name,status,loc,policy/module/model_input_norm,iter,total time (s),test/loss,true_value,true_svg_norm
Experiment_a089f_00012,RUNNING,,True,,,,,
Experiment_a089f_00013,RUNNING,,False,,,,,
Experiment_a089f_00014,RUNNING,,True,,,,,
Experiment_a089f_00015,PENDING,,False,,,,,
Experiment_a089f_00000,TERMINATED,,True,1.0,105.798,,-594.717,1737.42
Experiment_a089f_00001,TERMINATED,,False,1.0,157.194,,-65.6031,89.1708
Experiment_a089f_00002,TERMINATED,,True,1.0,96.4929,,-134.075,124.17
Experiment_a089f_00003,TERMINATED,,False,1.0,118.327,,-90.8687,74.5132
Experiment_a089f_00004,TERMINATED,,True,1.0,63.3313,,-64.4971,30.5406
Experiment_a089f_00005,TERMINATED,,False,1.0,147.256,,-70.4535,86.387


[2m[36m(pid=14524)[0m wandb: - 8.50MB of 8.50MB uploaded (0.00MB deduped)
[2m[36m(pid=14524)[0m wandb: \ 9.22MB of 9.24MB uploaded (0.00MB deduped)
wandb:                                                                                
[2m[36m(pid=14524)[0m wandb: Find user logs for this run at: /Users/angelolovatto/Repositories/personal/LQG-SVG/experiments/wandb/run-20210325_163831-239xueqw/logs/debug.log
[2m[36m(pid=14524)[0m wandb: Find internal logs for this run at: /Users/angelolovatto/Repositories/personal/LQG-SVG/experiments/wandb/run-20210325_163831-239xueqw/logs/debug-internal.log
[2m[36m(pid=14524)[0m wandb: Run summary:
[2m[36m(pid=14524)[0m wandb:                   stability True
[2m[36m(pid=14524)[0m wandb:             controllability True
[2m[36m(pid=14524)[0m wandb:                    val/loss 54.95449
[2m[36m(pid=14524)[0m wandb:       val/monte_carlo_value -113.11488
[2m[36m(pid=14524)[0m wandb:    val/monte_carlo_svg_norm 100.88712
[2m[3

[2m[36m(pid=14524)[0m 


[2m[36m(pid=14719)[0m wandb: Currently logged in as: angelovtt (use `wandb login --relogin` to force relogin)
[2m[36m(pid=14719)[0m wandb: Tracking run with wandb version 0.10.23
[2m[36m(pid=14719)[0m wandb: Syncing run SVG Prediction
[2m[36m(pid=14719)[0m wandb: ⭐️ View project at https://wandb.ai/angelovtt/LQG-SVG
[2m[36m(pid=14719)[0m wandb: 🚀 View run at https://wandb.ai/angelovtt/LQG-SVG/runs/2in0bd3m
[2m[36m(pid=14719)[0m wandb: Run data is saved locally in /Users/angelolovatto/Repositories/personal/LQG-SVG/experiments/wandb/run-20210325_164115-2in0bd3m
[2m[36m(pid=14719)[0m wandb: Run `wandb offline` to turn off syncing.


[2m[36m(pid=14719)[0m 


[2m[36m(pid=14719)[0m GPU available: False, used: False
[2m[36m(pid=14719)[0m TPU available: None, using: 0 TPU cores
[2m[36m(pid=14719)[0m 2021-03-25 16:41:25,900	INFO trainable.py:100 -- Trainable.setup took 11.704 seconds. If your trainable is slow to initialize, consider setting reuse_actors=True to reduce actor creation overheads.


[2m[36m(pid=14640)[0m --------------------------------------------------------------------------------
[2m[36m(pid=14640)[0m DATALOADER:0 TEST RESULTS
[2m[36m(pid=14640)[0m {'test/analytic_cossim': tensor(0.7957),
[2m[36m(pid=14640)[0m  'test/analytic_diff': tensor(-0.4013),
[2m[36m(pid=14640)[0m  'test/analytic_svg_norm': tensor(38.4007),
[2m[36m(pid=14640)[0m  'test/analytic_value': tensor(-32.4217),
[2m[36m(pid=14640)[0m  'test/loss': tensor(50.9558),
[2m[36m(pid=14640)[0m  'test/monte_carlo_cossim': tensor(0.7881),
[2m[36m(pid=14640)[0m  'test/monte_carlo_diff': tensor(-12.5206),
[2m[36m(pid=14640)[0m  'test/monte_carlo_svg_norm': tensor(60.2033),
[2m[36m(pid=14640)[0m  'test/monte_carlo_value': tensor(-44.5411),
[2m[36m(pid=14640)[0m  
[2m[36m(pid=14640)[0m 'true_svg_norm': tensor(81.8542),
[2m[36m(pid=14640)[0m  'true_value': 
[2m[36m(pid=14640)[0m tensor(-32.0204)}
[2m[36m(pid=14640)[0m ---------------------------------------------

[2m[36m(pid=14640)[0m wandb: Adding directory to artifact (/Users/angelolovatto/Repositories/personal/LQG-SVG/experiments/wandb/run-20210325_164014-37megdvb/files/checkpoints)... Done. 0.0s


Result for Experiment_a089f_00013:
  date: 2021-03-25_16-41-56
  done: true
  experiment_id: 91275e9187fe45898b807c63b1cacfaa
  hostname: Angelos-MBP
  iterations_since_restore: 1
  node_ip: 192.168.15.11
  pid: 14640
  test/analytic_cossim: 0.7957186102867126
  test/analytic_diff: -0.40129852294921875
  test/analytic_svg_norm: 38.40068435668945
  test/analytic_value: -32.42171859741211
  test/loss: 50.955787658691406
  test/monte_carlo_cossim: 0.7881116271018982
  test/monte_carlo_diff: -12.520633697509766
  test/monte_carlo_svg_norm: 60.20326232910156
  test/monte_carlo_value: -44.541053771972656
  time_since_restore: 91.63208103179932
  time_this_iter_s: 91.63208103179932
  time_total_s: 91.63208103179932
  timestamp: 1616701316
  timesteps_since_restore: 0
  training_iteration: 1
  trial_id: a089f_00013
  true_svg_norm: 81.85417175292969
  true_value: -32.02042007446289
  


Trial name,status,loc,policy/module/model_input_norm,iter,total time (s),test/loss,true_value,true_svg_norm
Experiment_a089f_00012,RUNNING,,True,,,,,
Experiment_a089f_00014,RUNNING,,True,,,,,
Experiment_a089f_00015,RUNNING,,False,,,,,
Experiment_a089f_00000,TERMINATED,,True,1.0,105.798,,-594.717,1737.42
Experiment_a089f_00001,TERMINATED,,False,1.0,157.194,,-65.6031,89.1708
Experiment_a089f_00002,TERMINATED,,True,1.0,96.4929,,-134.075,124.17
Experiment_a089f_00003,TERMINATED,,False,1.0,118.327,,-90.8687,74.5132
Experiment_a089f_00004,TERMINATED,,True,1.0,63.3313,,-64.4971,30.5406
Experiment_a089f_00005,TERMINATED,,False,1.0,147.256,,-70.4535,86.387
Experiment_a089f_00006,TERMINATED,,True,1.0,373.204,,-1854.31,12634.5


[2m[36m(pid=14640)[0m wandb: Waiting for W&B process to finish, PID 14661
[2m[36m(pid=14640)[0m wandb: Program ended successfully.
[2m[36m(pid=14640)[0m wandb: - 8.27MB of 8.27MB uploaded (0.00MB deduped)
[2m[36m(pid=14640)[0m wandb: \ 8.78MB of 8.78MB uploaded (0.00MB deduped)
wandb:                                                                                
[2m[36m(pid=14640)[0m wandb: Find user logs for this run at: /Users/angelolovatto/Repositories/personal/LQG-SVG/experiments/wandb/run-20210325_164014-37megdvb/logs/debug.log
[2m[36m(pid=14640)[0m wandb: Find internal logs for this run at: /Users/angelolovatto/Repositories/personal/LQG-SVG/experiments/wandb/run-20210325_164014-37megdvb/logs/debug-internal.log
[2m[36m(pid=14640)[0m wandb: Run summary:
[2m[36m(pid=14640)[0m wandb:                   stability True
[2m[36m(pid=14640)[0m wandb:             controllability True
[2m[36m(pid=14640)[0m wandb:                    val/loss 51.39606
[2m[36m(p

[2m[36m(pid=14640)[0m 


[2m[36m(pid=14527)[0m wandb: Adding directory to artifact (/Users/angelolovatto/Repositories/personal/LQG-SVG/experiments/wandb/run-20210325_163831-22ne03zy/files/checkpoints)... 
[2m[36m(pid=14527)[0m Done. 0.1s


[2m[36m(pid=14527)[0m --------------------------------------------------------------------------------
[2m[36m(pid=14527)[0m DATALOADER:0 TEST RESULTS
[2m[36m(pid=14527)[0m {'test/analytic_cossim': tensor(0.8996),
[2m[36m(pid=14527)[0m  'test/analytic_diff': tensor(-3.7853),
[2m[36m(pid=14527)[0m  'test/analytic_svg_norm': tensor(844.6976),
[2m[36m(pid=14527)[0m  'test/analytic_value': tensor(-593.7148),
[2m[36m(pid=14527)[0m  'test/loss': tensor(64.7193),
[2m[36m(pid=14527)[0m  'test/monte_carlo_cossim': tensor(0.9020),
[2m[36m(pid=14527)[0m  'test/monte_carlo_diff': tensor(-41.2167),
[2m[36m(pid=14527)[0m  'test/monte_carlo_svg_norm': tensor(924.8589),
[2m[36m(pid=14527)[0m  'test/monte_carlo_value': tensor(-631.1462),
[2m[36m(pid=14527)[0m  'true_svg_norm': tensor(2379.5413),
[2m[36m(pid=14527)[0m  'true_value': tensor(-589.9294)}
[2m[36m(pid=14527)[0m --------------------------------------------------------------------------------
Result fo

Trial name,status,loc,policy/module/model_input_norm,iter,total time (s),test/loss,true_value,true_svg_norm
Experiment_a089f_00014,RUNNING,,True,,,,,
Experiment_a089f_00015,RUNNING,,False,,,,,
Experiment_a089f_00000,TERMINATED,,True,1.0,105.798,,-594.717,1737.42
Experiment_a089f_00001,TERMINATED,,False,1.0,157.194,,-65.6031,89.1708
Experiment_a089f_00002,TERMINATED,,True,1.0,96.4929,,-134.075,124.17
Experiment_a089f_00003,TERMINATED,,False,1.0,118.327,,-90.8687,74.5132
Experiment_a089f_00004,TERMINATED,,True,1.0,63.3313,,-64.4971,30.5406
Experiment_a089f_00005,TERMINATED,,False,1.0,147.256,,-70.4535,86.387
Experiment_a089f_00006,TERMINATED,,True,1.0,373.204,,-1854.31,12634.5
Experiment_a089f_00007,TERMINATED,,False,1.0,232.198,,-1389.03,8908.1


[2m[36m(pid=14527)[0m wandb: Waiting for W&B process to finish, PID 14550
[2m[36m(pid=14527)[0m wandb: Program ended successfully.
[2m[36m(pid=14527)[0m wandb: - 9.03MB of 9.03MB uploaded (0.00MB deduped)
[2m[36m(pid=14527)[0m wandb: \ 10.30MB of 10.30MB uploaded (0.00MB deduped)
wandb:                                                                                
[2m[36m(pid=14527)[0m wandb: Find user logs for this run at: /Users/angelolovatto/Repositories/personal/LQG-SVG/experiments/wandb/run-20210325_163831-22ne03zy/logs/debug.log
[2m[36m(pid=14527)[0m wandb: Find internal logs for this run at: /Users/angelolovatto/Repositories/personal/LQG-SVG/experiments/wandb/run-20210325_163831-22ne03zy/logs/debug-internal.log
[2m[36m(pid=14527)[0m wandb: Run summary:
[2m[36m(pid=14527)[0m wandb:                   stability True
[2m[36m(pid=14527)[0m wandb:             controllability True
[2m[36m(pid=14527)[0m wandb:                    val/loss 65.11938
[2m[36m

[2m[36m(pid=14527)[0m 
[2m[36m(pid=14639)[0m --------------------------------------------------------------------------------
[2m[36m(pid=14639)[0m DATALOADER:0 TEST RESULTS
[2m[36m(pid=14639)[0m {'test/analytic_cossim': tensor(-0.0649),
[2m[36m(pid=14639)[0m  'test/analytic_diff': tensor(22.3801),
[2m[36m(pid=14639)[0m  'test/analytic_svg_norm': tensor(2338.8069),
[2m[36m(pid=14639)[0m  'test/analytic_value': tensor(-1304.7456),
[2m[36m(pid=14639)[0m  'test/loss': tensor(63.5903),
[2m[36m(pid=14639)[0m  'test/monte_carlo_cossim': tensor(-0.0527),
[2m[36m(pid=14639)[0m  'test/monte_carlo_diff': tensor(-253.0359),
[2m[36m(pid=14639)[0m  'test/monte_carlo_svg_norm': tensor(2849.1038),
[2m[36m(pid=14639)[0m  'test/monte_carlo_value': tensor(-1580.1616),
[2m[36m(pid=14639)[0m  'true_svg_norm': tensor(1412.3882),
[2m[36m(pid=14639)[0m  'true_value': tensor(-1327.1257)}
[2m[36m(pid=14639)[0m --------------------------------------------------------

[2m[36m(pid=14639)[0m wandb: Adding directory to artifact (/Users/angelolovatto/Repositories/personal/LQG-SVG/experiments/wandb/run-20210325_164014-2z7f9pqn/files/checkpoints)... 
[2m[36m(pid=14639)[0m Done. 0.0s


Result for Experiment_a089f_00014:
  date: 2021-03-25_16-43-10
  done: true
  experiment_id: 9e957f77b04c47c480cede233daf2abc
  hostname: Angelos-MBP
  iterations_since_restore: 1
  node_ip: 192.168.15.11
  pid: 14639
  test/analytic_cossim: -0.06487153470516205
  test/analytic_diff: 22.380126953125
  test/analytic_svg_norm: 2338.806884765625
  test/analytic_value: -1304.74560546875
  test/loss: 63.5903434753418
  test/monte_carlo_cossim: -0.052662819623947144
  test/monte_carlo_diff: -253.035888671875
  test/monte_carlo_svg_norm: 2849.103759765625
  test/monte_carlo_value: -1580.16162109375
  time_since_restore: 165.40422320365906
  time_this_iter_s: 165.40422320365906
  time_total_s: 165.40422320365906
  timestamp: 1616701390
  timesteps_since_restore: 0
  training_iteration: 1
  trial_id: a089f_00014
  true_svg_norm: 1412.38818359375
  true_value: -1327.125732421875
  


Trial name,status,loc,policy/module/model_input_norm,iter,total time (s),test/loss,true_value,true_svg_norm
Experiment_a089f_00015,RUNNING,,False,,,,,
Experiment_a089f_00000,TERMINATED,,True,1.0,105.798,,-594.717,1737.42
Experiment_a089f_00001,TERMINATED,,False,1.0,157.194,,-65.6031,89.1708
Experiment_a089f_00002,TERMINATED,,True,1.0,96.4929,,-134.075,124.17
Experiment_a089f_00003,TERMINATED,,False,1.0,118.327,,-90.8687,74.5132
Experiment_a089f_00004,TERMINATED,,True,1.0,63.3313,,-64.4971,30.5406
Experiment_a089f_00005,TERMINATED,,False,1.0,147.256,,-70.4535,86.387
Experiment_a089f_00006,TERMINATED,,True,1.0,373.204,,-1854.31,12634.5
Experiment_a089f_00007,TERMINATED,,False,1.0,232.198,,-1389.03,8908.1
Experiment_a089f_00008,TERMINATED,,True,1.0,168.498,,-378.231,309.285


[2m[36m(pid=14639)[0m wandb: Waiting for W&B process to finish, PID 14660
[2m[36m(pid=14639)[0m wandb: Program ended successfully.
[2m[36m(pid=14719)[0m wandb: Adding directory to artifact (/Users/angelolovatto/Repositories/personal/LQG-SVG/experiments/wandb/run-20210325_164115-2in0bd3m/files/checkpoints)... 
[2m[36m(pid=14719)[0m Done. 0.0s


[2m[36m(pid=14719)[0m --------------------------------------------------------------------------------
[2m[36m(pid=14719)[0m DATALOADER:0 TEST RESULTS
[2m[36m(pid=14719)[0m {'test/analytic_cossim': tensor(-0.0902),
[2m[36m(pid=14719)[0m  'test/analytic_diff': tensor(4.0318),
[2m[36m(pid=14719)[0m  'test/analytic_svg_norm': tensor(287.7411),
[2m[36m(pid=14719)[0m  'test/analytic_value': tensor(-245.2268),
[2m[36m(pid=14719)[0m  'test/loss': tensor(37.9452),
[2m[36m(pid=14719)[0m  'test/monte_carlo_cossim': tensor(-0.1077),
[2m[36m(pid=14719)[0m  'test/monte_carlo_diff': tensor(-3.4216),
[2m[36m(pid=14719)[0m  'test/monte_carlo_svg_norm': tensor(312.3213),
[2m[36m(pid=14719)[0m  'test/monte_carlo_value': tensor(-252.6802),
[2m[36m(pid=14719)[0m  'true_svg_norm': tensor(102.8296),
[2m[36m(pid=14719)[0m  'true_value': tensor(-249.2586)}
[2m[36m(pid=14719)[0m --------------------------------------------------------------------------------
Result for

Trial name,status,loc,policy/module/model_input_norm,iter,total time (s),test/loss,true_value,true_svg_norm
Experiment_a089f_00000,TERMINATED,,True,1,105.798,,-594.717,1737.42
Experiment_a089f_00001,TERMINATED,,False,1,157.194,,-65.6031,89.1708
Experiment_a089f_00002,TERMINATED,,True,1,96.4929,,-134.075,124.17
Experiment_a089f_00003,TERMINATED,,False,1,118.327,,-90.8687,74.5132
Experiment_a089f_00004,TERMINATED,,True,1,63.3313,,-64.4971,30.5406
Experiment_a089f_00005,TERMINATED,,False,1,147.256,,-70.4535,86.387
Experiment_a089f_00006,TERMINATED,,True,1,373.204,,-1854.31,12634.5
Experiment_a089f_00007,TERMINATED,,False,1,232.198,,-1389.03,8908.1
Experiment_a089f_00008,TERMINATED,,True,1,168.498,,-378.231,309.285
Experiment_a089f_00009,TERMINATED,,False,1,108.634,,-150.102,260.374


[2m[36m(pid=14719)[0m wandb: Waiting for W&B process to finish, PID 14730
[2m[36m(pid=14719)[0m wandb: Program ended successfully.
[2m[36m(pid=14639)[0m wandb: - 8.94MB of 8.94MB uploaded (0.00MB deduped)
[2m[36m(pid=14719)[0m wandb: - 8.68MB of 8.68MB uploaded (0.00MB deduped)
[2m[36m(pid=14639)[0m wandb: \ 10.09MB of 10.12MB uploaded (0.00MB deduped)
[2m[36m(pid=14719)[0m wandb: \ 9.51MB of 9.51MB uploaded (0.00MB deduped)
wandb:                                                                                
[2m[36m(pid=14639)[0m wandb: Find user logs for this run at: /Users/angelolovatto/Repositories/personal/LQG-SVG/experiments/wandb/run-20210325_164014-2z7f9pqn/logs/debug.log
[2m[36m(pid=14639)[0m wandb: Find internal logs for this run at: /Users/angelolovatto/Repositories/personal/LQG-SVG/experiments/wandb/run-20210325_164014-2z7f9pqn/logs/debug-internal.log
[2m[36m(pid=14639)[0m wandb: Run summary:
[2m[36m(pid=14639)[0m wandb:                   stab

[2m[36m(pid=14639)[0m 


[2m[36m(pid=14719)[0m wandb: Find user logs for this run at: /Users/angelolovatto/Repositories/personal/LQG-SVG/experiments/wandb/run-20210325_164115-2in0bd3m/logs/debug.log
[2m[36m(pid=14719)[0m wandb: Find internal logs for this run at: /Users/angelolovatto/Repositories/personal/LQG-SVG/experiments/wandb/run-20210325_164115-2in0bd3m/logs/debug-internal.log
[2m[36m(pid=14719)[0m wandb: Run summary:
[2m[36m(pid=14719)[0m wandb:                   stability True
[2m[36m(pid=14719)[0m wandb:             controllability True
[2m[36m(pid=14719)[0m wandb:                    val/loss 38.32711
[2m[36m(pid=14719)[0m wandb:       val/monte_carlo_value -277.2457
[2m[36m(pid=14719)[0m wandb:    val/monte_carlo_svg_norm 332.45038
[2m[36m(pid=14719)[0m wandb:        val/monte_carlo_diff -27.98708
[2m[36m(pid=14719)[0m wandb:      val/monte_carlo_cossim -0.11457
[2m[36m(pid=14719)[0m wandb:          val/analytic_value -245.22684
[2m[36m(pid=14719)[0m wandb:       v

In [6]:
# Shut down the Ray runtime used by the preceding experiment cell.
# NOTE(review): the matching ray.init() is presumably in an earlier cell that
# is not visible from here -- confirm.
ray.shutdown()