In [None]:
"""

plot_parallel_coordinate
========================

.. autofunction:: optuna.visualization.plot_parallel_coordinate

The following code snippet shows how to plot the high-dimensional parameter relationships.

"""
import matplotlib.pyplot as plt
import optuna
from plotly.io import show


def objective(trial):
    """Score one trial as the square of the sampled ``x`` plus the chosen ``y``.

    Args:
        trial: Object exposing ``suggest_float`` and ``suggest_categorical``
            (the trial handed in by ``study.optimize``).

    Returns:
        ``x**2 + y``, where ``x`` is suggested with bounds -100 and 100 and
        ``y`` is picked from ``[-1, 0, 1]``.
    """
    # Ask for x first and y second, matching the parameter order "x", "y".
    sampled_x = trial.suggest_float("x", -100, 100)
    offset_choices = [-1, 0, 1]
    chosen_y = trial.suggest_categorical("y", offset_choices)

    squared = sampled_x**2
    return squared + chosen_y


# TPE sampler constructed with a fixed seed (seed=10).
sampler = optuna.samplers.TPESampler(
    seed=10,
)
study = optuna.create_study(
    sampler=sampler,
)

# Evaluate `objective` for 10 trials.
study.optimize(
    objective,
    n_trials=10,
)

# Parallel-coordinate plot restricted to the two parameters "x" and "y".
fig = optuna.visualization.plot_parallel_coordinate(
    study,
    params=["x", "y"],
)
# plotly.io.show is the function Figure.show() delegates to.
show(fig)

In [1]:
import gymnasium as gym
from classic_rl.rl_corrector import *
# Gymnasium environment registered under the id "MountainCarContinuous-v0".
env = gym.make("MountainCarContinuous-v0")

# PPOCorrector is expected to come from the `classic_rl.rl_corrector` star import.
# NOTE(review): the meaning of the two positional `None` arguments is not
# visible from this notebook — confirm against PPOCorrector.__init__.
corrector = PPOCorrector(
    env,
    None,
    None,
    hidden_size=64,
    lr_actor=3e-4,
    lr_critic=1e-3,
    gamma=0.99,
    k_epochs=80,
    clip_epsilon=0.2,
    gae_lambda=1,
    action_std_init=0.2,
    decay_action_std=0.05,
    min_action_std=0.01,
    max_training_timesteps=3e6,
    max_ep_len=1000,
    update_factor=2,
)

# Run training and keep whatever train() returns under `log`.
log = corrector.train()

2025-06-30 10:26:40.491204: I tensorflow/core/util/port.cc:153] oneDNN custom operations are on. You may see slightly different numerical results due to floating-point round-off errors from different computation orders. To turn them off, set the environment variable `TF_ENABLE_ONEDNN_OPTS=0`.
2025-06-30 10:26:40.517070: I tensorflow/core/platform/cpu_feature_guard.cc:210] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.
To enable the following instructions: AVX2 AVX_VNNI FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.
2025-06-30 10:26:42.290 | INFO     | classic_rl.rl_corrector:__init__:368 - gamma 0.99, clip_epsilon 0.2, gae_lambda 1, lr_actor 0.0003, lr_critic 0.001, k_epochs 80, vf_loss_coef 0.5, action_std 0.2, decay_action_std_rate 0.05, min_action_std 0.01
2025-06-30 10:26:42.290 | INFO     | classic_rl.rl_corrector

Device set to : NVIDIA RTX 2000 Ada Generation Laptop GPU


2025-06-30 10:29:06.183 | INFO     | classic_rl.rl_corrector:train:457 - Episode : 2 	 Timestep : 2000 	 Average Reward : -4.94
2025-06-30 10:31:29.585 | INFO     | classic_rl.rl_corrector:train:457 - Episode : 5 	 Timestep : 4000 	 Average Reward : -26.02
2025-06-30 10:33:52.753 | INFO     | classic_rl.rl_corrector:train:457 - Episode : 7 	 Timestep : 6000 	 Average Reward : -53.74
2025-06-30 10:36:14.321 | INFO     | classic_rl.rl_corrector:train:457 - Episode : 9 	 Timestep : 8000 	 Average Reward : -70.87


KeyboardInterrupt: 