In [6]:
import gymnasium as gym
import gymnasium_robotics
from stable_baselines3 import PPO
from stable_baselines3.common.callbacks import CheckpointCallback
from stable_baselines3.common.vec_env import VecVideoRecorder, DummyVecEnv
from stable_baselines3.common.vec_env import VecNormalize

In [2]:
def setup_video_recorder(env, video_folder='videos/', record_freq=10000, video_length=200):
    """
    Return `env` wrapped in a VecVideoRecorder.

    Args:
        env: Vectorized environment to wrap.
        video_folder: Directory handed to the recorder for its output files.
        record_freq: A recording is triggered whenever the step counter given
            to the trigger is an exact multiple of this value.
        video_length: Forwarded to the recorder as `video_length`.

    Returns:
        The VecVideoRecorder instance wrapping `env`.
    """
    def should_record(step):
        # True on step 0 and on every multiple of record_freq after that.
        return step % record_freq == 0

    return VecVideoRecorder(
        env,
        video_folder,
        record_video_trigger=should_record,
        video_length=video_length,
        name_prefix='rl-agent',
    )

def setup_checkpoint_callback(checkpoint_dir='checkpoints/', save_freq=1000):
    """
    Build the CheckpointCallback used to snapshot the model during training.

    Args:
        checkpoint_dir: Passed to the callback as `save_path`.
        save_freq: Passed to the callback as `save_freq`.

    Returns:
        A CheckpointCallback with name prefix 'rl_model', verbose output, and
        both the replay-buffer and VecNormalize saving flags switched on.
    """
    callback_options = dict(
        save_freq=save_freq,
        save_path=checkpoint_dir,
        name_prefix='rl_model',
        save_replay_buffer=True,
        save_vecnormalize=True,
        verbose=1,
    )
    return CheckpointCallback(**callback_options)


In [9]:
# Parameters
env_id = 'HandManipulateEgg-v1'
total_timesteps = 1000000
checkpoint_dir = './checkpoints/'
video_folder = './videos/'
seed = 0  # fixed seed so that repeated runs of this cell are comparable


def make_env():
    """Create the environment named by `env_id` with dense rewards and rgb_array rendering."""
    # Use the env_id parameter instead of repeating the literal, so changing
    # the parameter above actually changes the environment being trained on.
    return gym.make(env_id, reward_type='dense', render_mode='rgb_array')


# Keep a direct handle on the VecNormalize layer: its running statistics have
# to be saved alongside the final model (see the end of this cell).
vec_normalize = VecNormalize(DummyVecEnv([make_env]), norm_obs=True, norm_reward=True)
env = setup_video_recorder(vec_normalize, video_folder=video_folder)

# Experiment: larger policy (pi) and value (vf) networks, three hidden layers
# of 256 units each.
policy_kwargs = dict(
    net_arch=dict(
        pi=[256, 256, 256],
        vf=[256, 256, 256]
    )
)

# Build the model once (it was previously constructed twice, with the first
# instance thrown away immediately).
# NOTE(review): the output logged for this cell shows approx_kl rising from
# ~0.12 to >3 and clip_fraction around 0.8 while success_rate stays at 0.
# Consider setting `target_kl` and/or lowering the learning rate - TODO confirm.
model = PPO(
    'MultiInputPolicy',
    env,
    verbose=1,
    policy_kwargs=policy_kwargs,
    tensorboard_log="./ppo_tensorboard/",
    seed=seed,
)

checkpoint_callback = setup_checkpoint_callback(checkpoint_dir=checkpoint_dir)

try:
    model.learn(total_timesteps=total_timesteps, callback=checkpoint_callback)
    model.save(f"{checkpoint_dir}/final_model")
    # The policy was trained on normalised observations/rewards; without these
    # statistics the saved final model cannot be evaluated consistently.
    vec_normalize.save(f"{checkpoint_dir}/final_vecnormalize.pkl")
finally:
    # Always release the recorder and simulator, including when training is
    # interrupted or raises.
    env.close()

Using cpu device
Logging to ./ppo_tensorboard/PPO_4




Saving video to C:\Users\13233\Documents\Robotics Project\Dexterous-Manipulation\videos\rl-agent-step-0-to-step-200.mp4
MoviePy - Building video C:\Users\13233\Documents\Robotics Project\Dexterous-Manipulation\videos\rl-agent-step-0-to-step-200.mp4.
MoviePy - Writing video C:\Users\13233\Documents\Robotics Project\Dexterous-Manipulation\videos\rl-agent-step-0-to-step-200.mp4



                                                                                                                       

MoviePy - Done !
MoviePy - video ready C:\Users\13233\Documents\Robotics Project\Dexterous-Manipulation\videos\rl-agent-step-0-to-step-200.mp4
---------------------------------
| rollout/           |          |
|    success_rate    | 0        |
| time/              |          |
|    fps             | 361      |
|    iterations      | 1        |
|    time_elapsed    | 5        |
|    total_timesteps | 2048     |
---------------------------------
----------------------------------------
| rollout/                |            |
|    success_rate         | 0          |
| time/                   |            |
|    fps                  | 342        |
|    iterations           | 2          |
|    time_elapsed         | 11         |
|    total_timesteps      | 4096       |
| train/                  |            |
|    approx_kl            | 0.11741668 |
|    clip_fraction        | 0.571      |
|    clip_range           | 0.2        |
|    entropy_loss         | -28.4      |
|    explained_var

                                                                                                                       

MoviePy - Done !
MoviePy - video ready C:\Users\13233\Documents\Robotics Project\Dexterous-Manipulation\videos\rl-agent-step-10000-to-step-10200.mp4
---------------------------------------
| rollout/                |           |
|    success_rate         | 0         |
| time/                   |           |
|    fps                  | 321       |
|    iterations           | 5         |
|    time_elapsed         | 31        |
|    total_timesteps      | 10240     |
| train/                  |           |
|    approx_kl            | 0.1900878 |
|    clip_fraction        | 0.657     |
|    clip_range           | 0.2       |
|    entropy_loss         | -28.3     |
|    explained_variance   | 0.513     |
|    learning_rate        | 0.0003    |
|    loss                 | -0.138    |
|    n_updates            | 40        |
|    policy_gradient_loss | -0.106    |
|    std                  | 0.993     |
|    value_loss           | 0.0411    |
---------------------------------------
-----------

                                                                                                                       

MoviePy - Done !
MoviePy - video ready C:\Users\13233\Documents\Robotics Project\Dexterous-Manipulation\videos\rl-agent-step-20000-to-step-20200.mp4
----------------------------------------
| rollout/                |            |
|    success_rate         | 0          |
| time/                   |            |
|    fps                  | 319        |
|    iterations           | 10         |
|    time_elapsed         | 64         |
|    total_timesteps      | 20480      |
| train/                  |            |
|    approx_kl            | 0.25273165 |
|    clip_fraction        | 0.697      |
|    clip_range           | 0.2        |
|    entropy_loss         | -28.1      |
|    explained_variance   | 0.83       |
|    learning_rate        | 0.0003     |
|    loss                 | -0.128     |
|    n_updates            | 90         |
|    policy_gradient_loss | -0.109     |
|    std                  | 0.983      |
|    value_loss           | 0.0241     |
-------------------------------

                                                                                                                       

MoviePy - Done !
MoviePy - video ready C:\Users\13233\Documents\Robotics Project\Dexterous-Manipulation\videos\rl-agent-step-30000-to-step-30200.mp4
----------------------------------------
| rollout/                |            |
|    success_rate         | 0          |
| time/                   |            |
|    fps                  | 305        |
|    iterations           | 15         |
|    time_elapsed         | 100        |
|    total_timesteps      | 30720      |
| train/                  |            |
|    approx_kl            | 0.33910376 |
|    clip_fraction        | 0.727      |
|    clip_range           | 0.2        |
|    entropy_loss         | -27.8      |
|    explained_variance   | 0.795      |
|    learning_rate        | 0.0003     |
|    loss                 | -0.15      |
|    n_updates            | 140        |
|    policy_gradient_loss | -0.108     |
|    std                  | 0.972      |
|    value_loss           | 0.0145     |
-------------------------------

                                                                                                                       

MoviePy - Done !
MoviePy - video ready C:\Users\13233\Documents\Robotics Project\Dexterous-Manipulation\videos\rl-agent-step-40000-to-step-40200.mp4
--------------------------------------
| rollout/                |          |
|    success_rate         | 0        |
| time/                   |          |
|    fps                  | 309      |
|    iterations           | 20       |
|    time_elapsed         | 132      |
|    total_timesteps      | 40960    |
| train/                  |          |
|    approx_kl            | 0.388529 |
|    clip_fraction        | 0.746    |
|    clip_range           | 0.2      |
|    entropy_loss         | -27.6    |
|    explained_variance   | 0.921    |
|    learning_rate        | 0.0003   |
|    loss                 | -0.122   |
|    n_updates            | 190      |
|    policy_gradient_loss | -0.104   |
|    std                  | 0.96     |
|    value_loss           | 0.0096   |
--------------------------------------
--------------------------------

                                                                                                                       

MoviePy - Done !
MoviePy - video ready C:\Users\13233\Documents\Robotics Project\Dexterous-Manipulation\videos\rl-agent-step-50000-to-step-50200.mp4
---------------------------------------
| rollout/                |           |
|    success_rate         | 0         |
| time/                   |           |
|    fps                  | 312       |
|    iterations           | 25        |
|    time_elapsed         | 163       |
|    total_timesteps      | 51200     |
| train/                  |           |
|    approx_kl            | 0.5208669 |
|    clip_fraction        | 0.756     |
|    clip_range           | 0.2       |
|    entropy_loss         | -27.4     |
|    explained_variance   | 0.906     |
|    learning_rate        | 0.0003    |
|    loss                 | -0.143    |
|    n_updates            | 240       |
|    policy_gradient_loss | -0.106    |
|    std                  | 0.954     |
|    value_loss           | 0.00719   |
---------------------------------------
-----------

                                                                                                                       

MoviePy - Done !
MoviePy - video ready C:\Users\13233\Documents\Robotics Project\Dexterous-Manipulation\videos\rl-agent-step-60000-to-step-60200.mp4
----------------------------------------
| rollout/                |            |
|    success_rate         | 0          |
| time/                   |            |
|    fps                  | 314        |
|    iterations           | 30         |
|    time_elapsed         | 195        |
|    total_timesteps      | 61440      |
| train/                  |            |
|    approx_kl            | 0.52680176 |
|    clip_fraction        | 0.762      |
|    clip_range           | 0.2        |
|    entropy_loss         | -27.1      |
|    explained_variance   | 0.935      |
|    learning_rate        | 0.0003     |
|    loss                 | -0.148     |
|    n_updates            | 290        |
|    policy_gradient_loss | -0.106     |
|    std                  | 0.938      |
|    value_loss           | 0.00742    |
-------------------------------

                                                                                                                       

MoviePy - Done !
MoviePy - video ready C:\Users\13233\Documents\Robotics Project\Dexterous-Manipulation\videos\rl-agent-step-70000-to-step-70200.mp4
---------------------------------------
| rollout/                |           |
|    success_rate         | 0         |
| time/                   |           |
|    fps                  | 316       |
|    iterations           | 35        |
|    time_elapsed         | 226       |
|    total_timesteps      | 71680     |
| train/                  |           |
|    approx_kl            | 0.6257741 |
|    clip_fraction        | 0.775     |
|    clip_range           | 0.2       |
|    entropy_loss         | -26.9     |
|    explained_variance   | 0.92      |
|    learning_rate        | 0.0003    |
|    loss                 | -0.144    |
|    n_updates            | 340       |
|    policy_gradient_loss | -0.107    |
|    std                  | 0.927     |
|    value_loss           | 0.00632   |
---------------------------------------
-----------

                                                                                                                       

MoviePy - Done !
MoviePy - video ready C:\Users\13233\Documents\Robotics Project\Dexterous-Manipulation\videos\rl-agent-step-80000-to-step-80200.mp4
---------------------------------------
| rollout/                |           |
|    success_rate         | 0         |
| time/                   |           |
|    fps                  | 317       |
|    iterations           | 40        |
|    time_elapsed         | 257       |
|    total_timesteps      | 81920     |
| train/                  |           |
|    approx_kl            | 0.7905158 |
|    clip_fraction        | 0.789     |
|    clip_range           | 0.2       |
|    entropy_loss         | -26.5     |
|    explained_variance   | 0.928     |
|    learning_rate        | 0.0003    |
|    loss                 | -0.128    |
|    n_updates            | 390       |
|    policy_gradient_loss | -0.111    |
|    std                  | 0.912     |
|    value_loss           | 0.00548   |
---------------------------------------
-----------

                                                                                                                       

MoviePy - Done !
MoviePy - video ready C:\Users\13233\Documents\Robotics Project\Dexterous-Manipulation\videos\rl-agent-step-90000-to-step-90200.mp4
---------------------------------------
| rollout/                |           |
|    success_rate         | 0         |
| time/                   |           |
|    fps                  | 318       |
|    iterations           | 45        |
|    time_elapsed         | 289       |
|    total_timesteps      | 92160     |
| train/                  |           |
|    approx_kl            | 0.9996568 |
|    clip_fraction        | 0.802     |
|    clip_range           | 0.2       |
|    entropy_loss         | -26.5     |
|    explained_variance   | 0.878     |
|    learning_rate        | 0.0003    |
|    loss                 | -0.149    |
|    n_updates            | 440       |
|    policy_gradient_loss | -0.108    |
|    std                  | 0.908     |
|    value_loss           | 0.00516   |
---------------------------------------
-----------

                                                                                                                       

MoviePy - Done !
MoviePy - video ready C:\Users\13233\Documents\Robotics Project\Dexterous-Manipulation\videos\rl-agent-step-100000-to-step-100200.mp4
---------------------------------------
| rollout/                |           |
|    success_rate         | 0         |
| time/                   |           |
|    fps                  | 319       |
|    iterations           | 49        |
|    time_elapsed         | 314       |
|    total_timesteps      | 100352    |
| train/                  |           |
|    approx_kl            | 0.9342977 |
|    clip_fraction        | 0.793     |
|    clip_range           | 0.2       |
|    entropy_loss         | -26.3     |
|    explained_variance   | 0.916     |
|    learning_rate        | 0.0003    |
|    loss                 | -0.135    |
|    n_updates            | 480       |
|    policy_gradient_loss | -0.103    |
|    std                  | 0.901     |
|    value_loss           | 0.00436   |
---------------------------------------
---------

                                                                                                                       

MoviePy - Done !
MoviePy - video ready C:\Users\13233\Documents\Robotics Project\Dexterous-Manipulation\videos\rl-agent-step-110000-to-step-110200.mp4
---------------------------------------
| rollout/                |           |
|    success_rate         | 0         |
| time/                   |           |
|    fps                  | 319       |
|    iterations           | 54        |
|    time_elapsed         | 345       |
|    total_timesteps      | 110592    |
| train/                  |           |
|    approx_kl            | 1.0251194 |
|    clip_fraction        | 0.799     |
|    clip_range           | 0.2       |
|    entropy_loss         | -26.1     |
|    explained_variance   | 0.876     |
|    learning_rate        | 0.0003    |
|    loss                 | -0.119    |
|    n_updates            | 530       |
|    policy_gradient_loss | -0.101    |
|    std                  | 0.892     |
|    value_loss           | 0.00521   |
---------------------------------------
---------

                                                                                                                       

MoviePy - Done !
MoviePy - video ready C:\Users\13233\Documents\Robotics Project\Dexterous-Manipulation\videos\rl-agent-step-120000-to-step-120200.mp4
---------------------------------------
| rollout/                |           |
|    success_rate         | 0         |
| time/                   |           |
|    fps                  | 320       |
|    iterations           | 59        |
|    time_elapsed         | 377       |
|    total_timesteps      | 120832    |
| train/                  |           |
|    approx_kl            | 1.0898232 |
|    clip_fraction        | 0.806     |
|    clip_range           | 0.2       |
|    entropy_loss         | -25.9     |
|    explained_variance   | 0.933     |
|    learning_rate        | 0.0003    |
|    loss                 | -0.134    |
|    n_updates            | 580       |
|    policy_gradient_loss | -0.108    |
|    std                  | 0.882     |
|    value_loss           | 0.00356   |
---------------------------------------
---------

                                                                                                                       

MoviePy - Done !
MoviePy - video ready C:\Users\13233\Documents\Robotics Project\Dexterous-Manipulation\videos\rl-agent-step-130000-to-step-130200.mp4
---------------------------------------
| rollout/                |           |
|    success_rate         | 0         |
| time/                   |           |
|    fps                  | 320       |
|    iterations           | 64        |
|    time_elapsed         | 408       |
|    total_timesteps      | 131072    |
| train/                  |           |
|    approx_kl            | 1.3596272 |
|    clip_fraction        | 0.805     |
|    clip_range           | 0.2       |
|    entropy_loss         | -25.6     |
|    explained_variance   | 0.942     |
|    learning_rate        | 0.0003    |
|    loss                 | -0.151    |
|    n_updates            | 630       |
|    policy_gradient_loss | -0.102    |
|    std                  | 0.868     |
|    value_loss           | 0.00355   |
---------------------------------------
---------

                                                                                                                       

MoviePy - Done !
MoviePy - video ready C:\Users\13233\Documents\Robotics Project\Dexterous-Manipulation\videos\rl-agent-step-140000-to-step-140200.mp4
--------------------------------------
| rollout/                |          |
|    success_rate         | 0        |
| time/                   |          |
|    fps                  | 321      |
|    iterations           | 69       |
|    time_elapsed         | 440      |
|    total_timesteps      | 141312   |
| train/                  |          |
|    approx_kl            | 1.3738   |
|    clip_fraction        | 0.821    |
|    clip_range           | 0.2      |
|    entropy_loss         | -25.4    |
|    explained_variance   | 0.917    |
|    learning_rate        | 0.0003   |
|    loss                 | -0.15    |
|    n_updates            | 680      |
|    policy_gradient_loss | -0.102   |
|    std                  | 0.862    |
|    value_loss           | 0.00306  |
--------------------------------------
------------------------------

                                                                                                                       

MoviePy - Done !
MoviePy - video ready C:\Users\13233\Documents\Robotics Project\Dexterous-Manipulation\videos\rl-agent-step-150000-to-step-150200.mp4
---------------------------------------
| rollout/                |           |
|    success_rate         | 0         |
| time/                   |           |
|    fps                  | 321       |
|    iterations           | 74        |
|    time_elapsed         | 471       |
|    total_timesteps      | 151552    |
| train/                  |           |
|    approx_kl            | 1.1971256 |
|    clip_fraction        | 0.811     |
|    clip_range           | 0.2       |
|    entropy_loss         | -25.2     |
|    explained_variance   | 0.944     |
|    learning_rate        | 0.0003    |
|    loss                 | -0.144    |
|    n_updates            | 730       |
|    policy_gradient_loss | -0.105    |
|    std                  | 0.853     |
|    value_loss           | 0.0031    |
---------------------------------------
---------

                                                                                                                       

MoviePy - Done !
MoviePy - video ready C:\Users\13233\Documents\Robotics Project\Dexterous-Manipulation\videos\rl-agent-step-160000-to-step-160200.mp4
--------------------------------------
| rollout/                |          |
|    success_rate         | 0        |
| time/                   |          |
|    fps                  | 321      |
|    iterations           | 79       |
|    time_elapsed         | 503      |
|    total_timesteps      | 161792   |
| train/                  |          |
|    approx_kl            | 1.583122 |
|    clip_fraction        | 0.821    |
|    clip_range           | 0.2      |
|    entropy_loss         | -24.9    |
|    explained_variance   | 0.911    |
|    learning_rate        | 0.0003   |
|    loss                 | -0.113   |
|    n_updates            | 780      |
|    policy_gradient_loss | -0.0966  |
|    std                  | 0.841    |
|    value_loss           | 0.00471  |
--------------------------------------
------------------------------

                                                                                                                       

MoviePy - Done !
MoviePy - video ready C:\Users\13233\Documents\Robotics Project\Dexterous-Manipulation\videos\rl-agent-step-170000-to-step-170200.mp4
---------------------------------------
| rollout/                |           |
|    success_rate         | 0         |
| time/                   |           |
|    fps                  | 321       |
|    iterations           | 84        |
|    time_elapsed         | 534       |
|    total_timesteps      | 172032    |
| train/                  |           |
|    approx_kl            | 1.7436666 |
|    clip_fraction        | 0.817     |
|    clip_range           | 0.2       |
|    entropy_loss         | -24.7     |
|    explained_variance   | 0.954     |
|    learning_rate        | 0.0003    |
|    loss                 | -0.13     |
|    n_updates            | 830       |
|    policy_gradient_loss | -0.1      |
|    std                  | 0.833     |
|    value_loss           | 0.00382   |
---------------------------------------
---------

                                                                                                                       

MoviePy - Done !
MoviePy - video ready C:\Users\13233\Documents\Robotics Project\Dexterous-Manipulation\videos\rl-agent-step-180000-to-step-180200.mp4
---------------------------------------
| rollout/                |           |
|    success_rate         | 0         |
| time/                   |           |
|    fps                  | 321       |
|    iterations           | 88        |
|    time_elapsed         | 559       |
|    total_timesteps      | 180224    |
| train/                  |           |
|    approx_kl            | 1.9611627 |
|    clip_fraction        | 0.837     |
|    clip_range           | 0.2       |
|    entropy_loss         | -24.6     |
|    explained_variance   | 0.9       |
|    learning_rate        | 0.0003    |
|    loss                 | -0.16     |
|    n_updates            | 870       |
|    policy_gradient_loss | -0.108    |
|    std                  | 0.826     |
|    value_loss           | 0.00391   |
---------------------------------------
---------

                                                                                                                       

MoviePy - Done !
MoviePy - video ready C:\Users\13233\Documents\Robotics Project\Dexterous-Manipulation\videos\rl-agent-step-190000-to-step-190200.mp4
--------------------------------------
| rollout/                |          |
|    success_rate         | 0        |
| time/                   |          |
|    fps                  | 322      |
|    iterations           | 93       |
|    time_elapsed         | 591      |
|    total_timesteps      | 190464   |
| train/                  |          |
|    approx_kl            | 2.293045 |
|    clip_fraction        | 0.827    |
|    clip_range           | 0.2      |
|    entropy_loss         | -24.3    |
|    explained_variance   | 0.912    |
|    learning_rate        | 0.0003   |
|    loss                 | -0.153   |
|    n_updates            | 920      |
|    policy_gradient_loss | -0.102   |
|    std                  | 0.816    |
|    value_loss           | 0.00317  |
--------------------------------------
------------------------------

                                                                                                                       

MoviePy - Done !
MoviePy - video ready C:\Users\13233\Documents\Robotics Project\Dexterous-Manipulation\videos\rl-agent-step-200000-to-step-200200.mp4
---------------------------------------
| rollout/                |           |
|    success_rate         | 0         |
| time/                   |           |
|    fps                  | 322       |
|    iterations           | 98        |
|    time_elapsed         | 623       |
|    total_timesteps      | 200704    |
| train/                  |           |
|    approx_kl            | 1.8377573 |
|    clip_fraction        | 0.84      |
|    clip_range           | 0.2       |
|    entropy_loss         | -24.1     |
|    explained_variance   | 0.954     |
|    learning_rate        | 0.0003    |
|    loss                 | -0.11     |
|    n_updates            | 970       |
|    policy_gradient_loss | -0.103    |
|    std                  | 0.81      |
|    value_loss           | 0.00244   |
---------------------------------------
---------

                                                                                                                       

MoviePy - Done !
MoviePy - video ready C:\Users\13233\Documents\Robotics Project\Dexterous-Manipulation\videos\rl-agent-step-210000-to-step-210200.mp4
---------------------------------------
| rollout/                |           |
|    success_rate         | 0         |
| time/                   |           |
|    fps                  | 322       |
|    iterations           | 103       |
|    time_elapsed         | 654       |
|    total_timesteps      | 210944    |
| train/                  |           |
|    approx_kl            | 2.7823148 |
|    clip_fraction        | 0.842     |
|    clip_range           | 0.2       |
|    entropy_loss         | -24       |
|    explained_variance   | 0.932     |
|    learning_rate        | 0.0003    |
|    loss                 | -0.146    |
|    n_updates            | 1020      |
|    policy_gradient_loss | -0.101    |
|    std                  | 0.806     |
|    value_loss           | 0.00311   |
---------------------------------------
---------

                                                                                                                       

MoviePy - Done !
MoviePy - video ready C:\Users\13233\Documents\Robotics Project\Dexterous-Manipulation\videos\rl-agent-step-220000-to-step-220200.mp4
--------------------------------------
| rollout/                |          |
|    success_rate         | 0        |
| time/                   |          |
|    fps                  | 322      |
|    iterations           | 108      |
|    time_elapsed         | 686      |
|    total_timesteps      | 221184   |
| train/                  |          |
|    approx_kl            | 3.039705 |
|    clip_fraction        | 0.844    |
|    clip_range           | 0.2      |
|    entropy_loss         | -23.9    |
|    explained_variance   | 0.946    |
|    learning_rate        | 0.0003   |
|    loss                 | -0.136   |
|    n_updates            | 1070     |
|    policy_gradient_loss | -0.1     |
|    std                  | 0.798    |
|    value_loss           | 0.00382  |
--------------------------------------
------------------------------

                                                                                                                       

MoviePy - Done !
MoviePy - video ready C:\Users\13233\Documents\Robotics Project\Dexterous-Manipulation\videos\rl-agent-step-230000-to-step-230200.mp4
--------------------------------------
| rollout/                |          |
|    success_rate         | 0        |
| time/                   |          |
|    fps                  | 322      |
|    iterations           | 113      |
|    time_elapsed         | 717      |
|    total_timesteps      | 231424   |
| train/                  |          |
|    approx_kl            | 2.501054 |
|    clip_fraction        | 0.833    |
|    clip_range           | 0.2      |
|    entropy_loss         | -23.7    |
|    explained_variance   | 0.936    |
|    learning_rate        | 0.0003   |
|    loss                 | -0.136   |
|    n_updates            | 1120     |
|    policy_gradient_loss | -0.101   |
|    std                  | 0.79     |
|    value_loss           | 0.00338  |
--------------------------------------
------------------------------

                                                                                                                       

MoviePy - Done !
MoviePy - video ready C:\Users\13233\Documents\Robotics Project\Dexterous-Manipulation\videos\rl-agent-step-240000-to-step-240200.mp4
---------------------------------------
| rollout/                |           |
|    success_rate         | 0         |
| time/                   |           |
|    fps                  | 322       |
|    iterations           | 118       |
|    time_elapsed         | 749       |
|    total_timesteps      | 241664    |
| train/                  |           |
|    approx_kl            | 2.7053256 |
|    clip_fraction        | 0.85      |
|    clip_range           | 0.2       |
|    entropy_loss         | -23.4     |
|    explained_variance   | 0.942     |
|    learning_rate        | 0.0003    |
|    loss                 | -0.12     |
|    n_updates            | 1170      |
|    policy_gradient_loss | -0.0987   |
|    std                  | 0.781     |
|    value_loss           | 0.00383   |
---------------------------------------
---------

                                                                                                                       

MoviePy - Done !
MoviePy - video ready C:\Users\13233\Documents\Robotics Project\Dexterous-Manipulation\videos\rl-agent-step-250000-to-step-250200.mp4
--------------------------------------
| rollout/                |          |
|    success_rate         | 0        |
| time/                   |          |
|    fps                  | 322      |
|    iterations           | 123      |
|    time_elapsed         | 780      |
|    total_timesteps      | 251904   |
| train/                  |          |
|    approx_kl            | 2.993666 |
|    clip_fraction        | 0.852    |
|    clip_range           | 0.2      |
|    entropy_loss         | -23.2    |
|    explained_variance   | 0.884    |
|    learning_rate        | 0.0003   |
|    loss                 | -0.1     |
|    n_updates            | 1220     |
|    policy_gradient_loss | -0.104   |
|    std                  | 0.774    |
|    value_loss           | 0.00553  |
--------------------------------------
------------------------------

                                                                                                                       

MoviePy - Done !
MoviePy - video ready C:\Users\13233\Documents\Robotics Project\Dexterous-Manipulation\videos\rl-agent-step-260000-to-step-260200.mp4
---------------------------------------
| rollout/                |           |
|    success_rate         | 0         |
| time/                   |           |
|    fps                  | 322       |
|    iterations           | 128       |
|    time_elapsed         | 812       |
|    total_timesteps      | 262144    |
| train/                  |           |
|    approx_kl            | 2.8896341 |
|    clip_fraction        | 0.854     |
|    clip_range           | 0.2       |
|    entropy_loss         | -23.1     |
|    explained_variance   | 0.906     |
|    learning_rate        | 0.0003    |
|    loss                 | -0.149    |
|    n_updates            | 1270      |
|    policy_gradient_loss | -0.096    |
|    std                  | 0.771     |
|    value_loss           | 0.00362   |
---------------------------------------
---------

                                                                                                                       

MoviePy - Done !
MoviePy - video ready C:\Users\13233\Documents\Robotics Project\Dexterous-Manipulation\videos\rl-agent-step-270000-to-step-270200.mp4
---------------------------------------
| rollout/                |           |
|    success_rate         | 0         |
| time/                   |           |
|    fps                  | 322       |
|    iterations           | 132       |
|    time_elapsed         | 837       |
|    total_timesteps      | 270336    |
| train/                  |           |
|    approx_kl            | 3.0948665 |
|    clip_fraction        | 0.844     |
|    clip_range           | 0.2       |
|    entropy_loss         | -23       |
|    explained_variance   | 0.95      |
|    learning_rate        | 0.0003    |
|    loss                 | -0.126    |
|    n_updates            | 1310      |
|    policy_gradient_loss | -0.0939   |
|    std                  | 0.765     |
|    value_loss           | 0.0033    |
---------------------------------------
---------

                                                                                                                       

MoviePy - Done !
MoviePy - video ready C:\Users\13233\Documents\Robotics Project\Dexterous-Manipulation\videos\rl-agent-step-280000-to-step-280200.mp4
---------------------------------------
| rollout/                |           |
|    success_rate         | 0         |
| time/                   |           |
|    fps                  | 322       |
|    iterations           | 137       |
|    time_elapsed         | 869       |
|    total_timesteps      | 280576    |
| train/                  |           |
|    approx_kl            | 4.2974167 |
|    clip_fraction        | 0.847     |
|    clip_range           | 0.2       |
|    entropy_loss         | -22.8     |
|    explained_variance   | 0.942     |
|    learning_rate        | 0.0003    |
|    loss                 | -0.149    |
|    n_updates            | 1360      |
|    policy_gradient_loss | -0.0934   |
|    std                  | 0.759     |
|    value_loss           | 0.00387   |
---------------------------------------
---------

                                                                                                                       

MoviePy - Done !
MoviePy - video ready C:\Users\13233\Documents\Robotics Project\Dexterous-Manipulation\videos\rl-agent-step-290000-to-step-290200.mp4
---------------------------------------
| rollout/                |           |
|    success_rate         | 0         |
| time/                   |           |
|    fps                  | 322       |
|    iterations           | 142       |
|    time_elapsed         | 900       |
|    total_timesteps      | 290816    |
| train/                  |           |
|    approx_kl            | 3.6681623 |
|    clip_fraction        | 0.855     |
|    clip_range           | 0.2       |
|    entropy_loss         | -22.7     |
|    explained_variance   | 0.929     |
|    learning_rate        | 0.0003    |
|    loss                 | -0.127    |
|    n_updates            | 1410      |
|    policy_gradient_loss | -0.101    |
|    std                  | 0.754     |
|    value_loss           | 0.00382   |
---------------------------------------
---------

                                                                                                                       

MoviePy - Done !
MoviePy - video ready C:\Users\13233\Documents\Robotics Project\Dexterous-Manipulation\videos\rl-agent-step-300000-to-step-300200.mp4
--------------------------------------
| rollout/                |          |
|    success_rate         | 0        |
| time/                   |          |
|    fps                  | 322      |
|    iterations           | 147      |
|    time_elapsed         | 932      |
|    total_timesteps      | 301056   |
| train/                  |          |
|    approx_kl            | 3.848617 |
|    clip_fraction        | 0.859    |
|    clip_range           | 0.2      |
|    entropy_loss         | -22.6    |
|    explained_variance   | 0.946    |
|    learning_rate        | 0.0003   |
|    loss                 | -0.151   |
|    n_updates            | 1460     |
|    policy_gradient_loss | -0.102   |
|    std                  | 0.749    |
|    value_loss           | 0.00378  |
--------------------------------------
------------------------------

                                                                                                                       

MoviePy - Done !
MoviePy - video ready C:\Users\13233\Documents\Robotics Project\Dexterous-Manipulation\videos\rl-agent-step-310000-to-step-310200.mp4
---------------------------------------
| rollout/                |           |
|    success_rate         | 0         |
| time/                   |           |
|    fps                  | 322       |
|    iterations           | 152       |
|    time_elapsed         | 963       |
|    total_timesteps      | 311296    |
| train/                  |           |
|    approx_kl            | 3.1488242 |
|    clip_fraction        | 0.855     |
|    clip_range           | 0.2       |
|    entropy_loss         | -22.5     |
|    explained_variance   | 0.949     |
|    learning_rate        | 0.0003    |
|    loss                 | -0.15     |
|    n_updates            | 1510      |
|    policy_gradient_loss | -0.0904   |
|    std                  | 0.746     |
|    value_loss           | 0.00389   |
---------------------------------------
---------

                                                                                                                       

MoviePy - Done !
MoviePy - video ready C:\Users\13233\Documents\Robotics Project\Dexterous-Manipulation\videos\rl-agent-step-320000-to-step-320200.mp4
---------------------------------------
| rollout/                |           |
|    success_rate         | 0         |
| time/                   |           |
|    fps                  | 322       |
|    iterations           | 157       |
|    time_elapsed         | 995       |
|    total_timesteps      | 321536    |
| train/                  |           |
|    approx_kl            | 5.6017423 |
|    clip_fraction        | 0.857     |
|    clip_range           | 0.2       |
|    entropy_loss         | -22.5     |
|    explained_variance   | 0.956     |
|    learning_rate        | 0.0003    |
|    loss                 | -0.143    |
|    n_updates            | 1560      |
|    policy_gradient_loss | -0.096    |
|    std                  | 0.747     |
|    value_loss           | 0.00379   |
---------------------------------------
---------

                                                                                                                       

MoviePy - Done !
MoviePy - video ready C:\Users\13233\Documents\Robotics Project\Dexterous-Manipulation\videos\rl-agent-step-330000-to-step-330200.mp4
--------------------------------------
| rollout/                |          |
|    success_rate         | 0        |
| time/                   |          |
|    fps                  | 323      |
|    iterations           | 162      |
|    time_elapsed         | 1027     |
|    total_timesteps      | 331776   |
| train/                  |          |
|    approx_kl            | 4.138023 |
|    clip_fraction        | 0.854    |
|    clip_range           | 0.2      |
|    entropy_loss         | -22.4    |
|    explained_variance   | 0.952    |
|    learning_rate        | 0.0003   |
|    loss                 | -0.145   |
|    n_updates            | 1610     |
|    policy_gradient_loss | -0.0979  |
|    std                  | 0.74     |
|    value_loss           | 0.00418  |
--------------------------------------
------------------------------

                                                                                                                       

MoviePy - Done !
MoviePy - video ready C:\Users\13233\Documents\Robotics Project\Dexterous-Manipulation\videos\rl-agent-step-340000-to-step-340200.mp4
---------------------------------------
| rollout/                |           |
|    success_rate         | 0         |
| time/                   |           |
|    fps                  | 323       |
|    iterations           | 167       |
|    time_elapsed         | 1058      |
|    total_timesteps      | 342016    |
| train/                  |           |
|    approx_kl            | 4.1398735 |
|    clip_fraction        | 0.868     |
|    clip_range           | 0.2       |
|    entropy_loss         | -22.1     |
|    explained_variance   | 0.942     |
|    learning_rate        | 0.0003    |
|    loss                 | -0.15     |
|    n_updates            | 1660      |
|    policy_gradient_loss | -0.0966   |
|    std                  | 0.733     |
|    value_loss           | 0.00418   |
---------------------------------------
---------

                                                                                                                       

MoviePy - Done !
MoviePy - video ready C:\Users\13233\Documents\Robotics Project\Dexterous-Manipulation\videos\rl-agent-step-350000-to-step-350200.mp4
--------------------------------------
| rollout/                |          |
|    success_rate         | 0        |
| time/                   |          |
|    fps                  | 322      |
|    iterations           | 171      |
|    time_elapsed         | 1084     |
|    total_timesteps      | 350208   |
| train/                  |          |
|    approx_kl            | 4.081022 |
|    clip_fraction        | 0.86     |
|    clip_range           | 0.2      |
|    entropy_loss         | -22      |
|    explained_variance   | 0.95     |
|    learning_rate        | 0.0003   |
|    loss                 | -0.152   |
|    n_updates            | 1700     |
|    policy_gradient_loss | -0.0984  |
|    std                  | 0.725    |
|    value_loss           | 0.00357  |
--------------------------------------
------------------------------

                                                                                                                       

MoviePy - Done !
MoviePy - video ready C:\Users\13233\Documents\Robotics Project\Dexterous-Manipulation\videos\rl-agent-step-360000-to-step-360200.mp4
--------------------------------------
| rollout/                |          |
|    success_rate         | 0        |
| time/                   |          |
|    fps                  | 323      |
|    iterations           | 176      |
|    time_elapsed         | 1115     |
|    total_timesteps      | 360448   |
| train/                  |          |
|    approx_kl            | 4.13359  |
|    clip_fraction        | 0.854    |
|    clip_range           | 0.2      |
|    entropy_loss         | -21.7    |
|    explained_variance   | 0.941    |
|    learning_rate        | 0.0003   |
|    loss                 | -0.14    |
|    n_updates            | 1750     |
|    policy_gradient_loss | -0.0918  |
|    std                  | 0.718    |
|    value_loss           | 0.00426  |
--------------------------------------
------------------------------

                                                                                                                       

MoviePy - Done !
MoviePy - video ready C:\Users\13233\Documents\Robotics Project\Dexterous-Manipulation\videos\rl-agent-step-370000-to-step-370200.mp4
--------------------------------------
| rollout/                |          |
|    success_rate         | 0        |
| time/                   |          |
|    fps                  | 323      |
|    iterations           | 181      |
|    time_elapsed         | 1147     |
|    total_timesteps      | 370688   |
| train/                  |          |
|    approx_kl            | 4.674803 |
|    clip_fraction        | 0.861    |
|    clip_range           | 0.2      |
|    entropy_loss         | -21.6    |
|    explained_variance   | 0.944    |
|    learning_rate        | 0.0003   |
|    loss                 | -0.13    |
|    n_updates            | 1800     |
|    policy_gradient_loss | -0.0919  |
|    std                  | 0.713    |
|    value_loss           | 0.00275  |
--------------------------------------
------------------------------

                                                                                                                       

MoviePy - Done !
MoviePy - video ready C:\Users\13233\Documents\Robotics Project\Dexterous-Manipulation\videos\rl-agent-step-380000-to-step-380200.mp4
--------------------------------------
| rollout/                |          |
|    success_rate         | 0        |
| time/                   |          |
|    fps                  | 323      |
|    iterations           | 186      |
|    time_elapsed         | 1179     |
|    total_timesteps      | 380928   |
| train/                  |          |
|    approx_kl            | 4.68264  |
|    clip_fraction        | 0.875    |
|    clip_range           | 0.2      |
|    entropy_loss         | -21.5    |
|    explained_variance   | 0.946    |
|    learning_rate        | 0.0003   |
|    loss                 | -0.118   |
|    n_updates            | 1850     |
|    policy_gradient_loss | -0.0932  |
|    std                  | 0.709    |
|    value_loss           | 0.00312  |
--------------------------------------
------------------------------

                                                                                                                       

MoviePy - Done !
MoviePy - video ready C:\Users\13233\Documents\Robotics Project\Dexterous-Manipulation\videos\rl-agent-step-390000-to-step-390200.mp4
--------------------------------------
| rollout/                |          |
|    success_rate         | 0        |
| time/                   |          |
|    fps                  | 323      |
|    iterations           | 191      |
|    time_elapsed         | 1210     |
|    total_timesteps      | 391168   |
| train/                  |          |
|    approx_kl            | 5.209869 |
|    clip_fraction        | 0.869    |
|    clip_range           | 0.2      |
|    entropy_loss         | -21.3    |
|    explained_variance   | 0.948    |
|    learning_rate        | 0.0003   |
|    loss                 | -0.119   |
|    n_updates            | 1900     |
|    policy_gradient_loss | -0.0909  |
|    std                  | 0.703    |
|    value_loss           | 0.00297  |
--------------------------------------
------------------------------

                                                                                                                       

MoviePy - Done !
MoviePy - video ready C:\Users\13233\Documents\Robotics Project\Dexterous-Manipulation\videos\rl-agent-step-400000-to-step-400200.mp4
---------------------------------------
| rollout/                |           |
|    success_rate         | 0         |
| time/                   |           |
|    fps                  | 323       |
|    iterations           | 196       |
|    time_elapsed         | 1241      |
|    total_timesteps      | 401408    |
| train/                  |           |
|    approx_kl            | 5.7396655 |
|    clip_fraction        | 0.873     |
|    clip_range           | 0.2       |
|    entropy_loss         | -21.2     |
|    explained_variance   | 0.938     |
|    learning_rate        | 0.0003    |
|    loss                 | -0.138    |
|    n_updates            | 1950      |
|    policy_gradient_loss | -0.0982   |
|    std                  | 0.698     |
|    value_loss           | 0.0037    |
---------------------------------------
---------

                                                                                                                       

MoviePy - Done !
MoviePy - video ready C:\Users\13233\Documents\Robotics Project\Dexterous-Manipulation\videos\rl-agent-step-410000-to-step-410200.mp4
--------------------------------------
| rollout/                |          |
|    success_rate         | 0        |
| time/                   |          |
|    fps                  | 323      |
|    iterations           | 201      |
|    time_elapsed         | 1273     |
|    total_timesteps      | 411648   |
| train/                  |          |
|    approx_kl            | 8.663297 |
|    clip_fraction        | 0.871    |
|    clip_range           | 0.2      |
|    entropy_loss         | -20.9    |
|    explained_variance   | 0.902    |
|    learning_rate        | 0.0003   |
|    loss                 | -0.124   |
|    n_updates            | 2000     |
|    policy_gradient_loss | -0.0896  |
|    std                  | 0.69     |
|    value_loss           | 0.00329  |
--------------------------------------
------------------------------

                                                                                                                       

MoviePy - Done !
MoviePy - video ready C:\Users\13233\Documents\Robotics Project\Dexterous-Manipulation\videos\rl-agent-step-420000-to-step-420200.mp4
---------------------------------------
| rollout/                |           |
|    success_rate         | 0         |
| time/                   |           |
|    fps                  | 323       |
|    iterations           | 206       |
|    time_elapsed         | 1304      |
|    total_timesteps      | 421888    |
| train/                  |           |
|    approx_kl            | 4.4985347 |
|    clip_fraction        | 0.877     |
|    clip_range           | 0.2       |
|    entropy_loss         | -20.8     |
|    explained_variance   | 0.941     |
|    learning_rate        | 0.0003    |
|    loss                 | -0.116    |
|    n_updates            | 2050      |
|    policy_gradient_loss | -0.086    |
|    std                  | 0.687     |
|    value_loss           | 0.00344   |
---------------------------------------
---------

                                                                                                                       

MoviePy - Done !
MoviePy - video ready C:\Users\13233\Documents\Robotics Project\Dexterous-Manipulation\videos\rl-agent-step-430000-to-step-430200.mp4
--------------------------------------
| rollout/                |          |
|    success_rate         | 0        |
| time/                   |          |
|    fps                  | 323      |
|    iterations           | 211      |
|    time_elapsed         | 1336     |
|    total_timesteps      | 432128   |
| train/                  |          |
|    approx_kl            | 5.127624 |
|    clip_fraction        | 0.864    |
|    clip_range           | 0.2      |
|    entropy_loss         | -20.7    |
|    explained_variance   | 0.935    |
|    learning_rate        | 0.0003   |
|    loss                 | -0.132   |
|    n_updates            | 2100     |
|    policy_gradient_loss | -0.0896  |
|    std                  | 0.681    |
|    value_loss           | 0.00528  |
--------------------------------------
------------------------------

                                                                                                                       

MoviePy - Done !
MoviePy - video ready C:\Users\13233\Documents\Robotics Project\Dexterous-Manipulation\videos\rl-agent-step-440000-to-step-440200.mp4
--------------------------------------
| rollout/                |          |
|    success_rate         | 0        |
| time/                   |          |
|    fps                  | 323      |
|    iterations           | 215      |
|    time_elapsed         | 1361     |
|    total_timesteps      | 440320   |
| train/                  |          |
|    approx_kl            | 5.373305 |
|    clip_fraction        | 0.862    |
|    clip_range           | 0.2      |
|    entropy_loss         | -20.5    |
|    explained_variance   | 0.976    |
|    learning_rate        | 0.0003   |
|    loss                 | -0.12    |
|    n_updates            | 2140     |
|    policy_gradient_loss | -0.0883  |
|    std                  | 0.675    |
|    value_loss           | 0.0033   |
--------------------------------------
------------------------------

                                                                                                                       

MoviePy - Done !
MoviePy - video ready C:\Users\13233\Documents\Robotics Project\Dexterous-Manipulation\videos\rl-agent-step-450000-to-step-450200.mp4
---------------------------------------
| rollout/                |           |
|    success_rate         | 0         |
| time/                   |           |
|    fps                  | 323       |
|    iterations           | 220       |
|    time_elapsed         | 1393      |
|    total_timesteps      | 450560    |
| train/                  |           |
|    approx_kl            | 57.353245 |
|    clip_fraction        | 0.876     |
|    clip_range           | 0.2       |
|    entropy_loss         | -20.4     |
|    explained_variance   | 0.967     |
|    learning_rate        | 0.0003    |
|    loss                 | -0.153    |
|    n_updates            | 2190      |
|    policy_gradient_loss | -0.0931   |
|    std                  | 0.672     |
|    value_loss           | 0.00429   |
---------------------------------------
---------

                                                                                                                       

MoviePy - Done !
MoviePy - video ready C:\Users\13233\Documents\Robotics Project\Dexterous-Manipulation\videos\rl-agent-step-460000-to-step-460200.mp4
--------------------------------------
| rollout/                |          |
|    success_rate         | 0        |
| time/                   |          |
|    fps                  | 323      |
|    iterations           | 225      |
|    time_elapsed         | 1424     |
|    total_timesteps      | 460800   |
| train/                  |          |
|    approx_kl            | 7.082454 |
|    clip_fraction        | 0.874    |
|    clip_range           | 0.2      |
|    entropy_loss         | -20.2    |
|    explained_variance   | 0.953    |
|    learning_rate        | 0.0003   |
|    loss                 | -0.117   |
|    n_updates            | 2240     |
|    policy_gradient_loss | -0.0905  |
|    std                  | 0.667    |
|    value_loss           | 0.00477  |
--------------------------------------
------------------------------

                                                                                                                       

MoviePy - Done !
MoviePy - video ready C:\Users\13233\Documents\Robotics Project\Dexterous-Manipulation\videos\rl-agent-step-470000-to-step-470200.mp4
---------------------------------------
| rollout/                |           |
|    success_rate         | 0         |
| time/                   |           |
|    fps                  | 323       |
|    iterations           | 230       |
|    time_elapsed         | 1456      |
|    total_timesteps      | 471040    |
| train/                  |           |
|    approx_kl            | 7.4801044 |
|    clip_fraction        | 0.87      |
|    clip_range           | 0.2       |
|    entropy_loss         | -20       |
|    explained_variance   | 0.926     |
|    learning_rate        | 0.0003    |
|    loss                 | -0.118    |
|    n_updates            | 2290      |
|    policy_gradient_loss | -0.0972   |
|    std                  | 0.66      |
|    value_loss           | 0.00366   |
---------------------------------------
---------

                                                                                                                       

MoviePy - Done !
MoviePy - video ready C:\Users\13233\Documents\Robotics Project\Dexterous-Manipulation\videos\rl-agent-step-480000-to-step-480200.mp4
---------------------------------------
| rollout/                |           |
|    success_rate         | 0         |
| time/                   |           |
|    fps                  | 323       |
|    iterations           | 235       |
|    time_elapsed         | 1488      |
|    total_timesteps      | 481280    |
| train/                  |           |
|    approx_kl            | 7.3245597 |
|    clip_fraction        | 0.875     |
|    clip_range           | 0.2       |
|    entropy_loss         | -19.8     |
|    explained_variance   | 0.942     |
|    learning_rate        | 0.0003    |
|    loss                 | -0.152    |
|    n_updates            | 2340      |
|    policy_gradient_loss | -0.0898   |
|    std                  | 0.654     |
|    value_loss           | 0.00289   |
---------------------------------------
---------

                                                                                                                       

MoviePy - Done !
MoviePy - video ready C:\Users\13233\Documents\Robotics Project\Dexterous-Manipulation\videos\rl-agent-step-490000-to-step-490200.mp4
--------------------------------------
| rollout/                |          |
|    success_rate         | 0        |
| time/                   |          |
|    fps                  | 323      |
|    iterations           | 240      |
|    time_elapsed         | 1519     |
|    total_timesteps      | 491520   |
| train/                  |          |
|    approx_kl            | 9.311942 |
|    clip_fraction        | 0.879    |
|    clip_range           | 0.2      |
|    entropy_loss         | -19.8    |
|    explained_variance   | 0.952    |
|    learning_rate        | 0.0003   |
|    loss                 | -0.0962  |
|    n_updates            | 2390     |
|    policy_gradient_loss | -0.095   |
|    std                  | 0.653    |
|    value_loss           | 0.00395  |
--------------------------------------
------------------------------

                                                                                                                       

MoviePy - Done !
MoviePy - video ready C:\Users\13233\Documents\Robotics Project\Dexterous-Manipulation\videos\rl-agent-step-500000-to-step-500200.mp4
--------------------------------------
| rollout/                |          |
|    success_rate         | 0        |
| time/                   |          |
|    fps                  | 323      |
|    iterations           | 245      |
|    time_elapsed         | 1551     |
|    total_timesteps      | 501760   |
| train/                  |          |
|    approx_kl            | 8.580927 |
|    clip_fraction        | 0.877    |
|    clip_range           | 0.2      |
|    entropy_loss         | -19.6    |
|    explained_variance   | 0.919    |
|    learning_rate        | 0.0003   |
|    loss                 | -0.122   |
|    n_updates            | 2440     |
|    policy_gradient_loss | -0.0906  |
|    std                  | 0.649    |
|    value_loss           | 0.00361  |
--------------------------------------
------------------------------

                                                                                                                       

MoviePy - Done !
MoviePy - video ready C:\Users\13233\Documents\Robotics Project\Dexterous-Manipulation\videos\rl-agent-step-510000-to-step-510200.mp4
---------------------------------------
| rollout/                |           |
|    success_rate         | 0         |
| time/                   |           |
|    fps                  | 323       |
|    iterations           | 250       |
|    time_elapsed         | 1583      |
|    total_timesteps      | 512000    |
| train/                  |           |
|    approx_kl            | 10.335347 |
|    clip_fraction        | 0.886     |
|    clip_range           | 0.2       |
|    entropy_loss         | -19.5     |
|    explained_variance   | 0.955     |
|    learning_rate        | 0.0003    |
|    loss                 | -0.147    |
|    n_updates            | 2490      |
|    policy_gradient_loss | -0.103    |
|    std                  | 0.643     |
|    value_loss           | 0.00385   |
---------------------------------------
---------

                                                                                                                       

MoviePy - Done !
MoviePy - video ready C:\Users\13233\Documents\Robotics Project\Dexterous-Manipulation\videos\rl-agent-step-520000-to-step-520200.mp4
--------------------------------------
| rollout/                |          |
|    success_rate         | 0        |
| time/                   |          |
|    fps                  | 323      |
|    iterations           | 255      |
|    time_elapsed         | 1615     |
|    total_timesteps      | 522240   |
| train/                  |          |
|    approx_kl            | 9.656731 |
|    clip_fraction        | 0.874    |
|    clip_range           | 0.2      |
|    entropy_loss         | -19.3    |
|    explained_variance   | 0.948    |
|    learning_rate        | 0.0003   |
|    loss                 | -0.0873  |
|    n_updates            | 2540     |
|    policy_gradient_loss | -0.0788  |
|    std                  | 0.637    |
|    value_loss           | 0.00395  |
--------------------------------------
------------------------------

                                                                                                                       

MoviePy - Done !
MoviePy - video ready C:\Users\13233\Documents\Robotics Project\Dexterous-Manipulation\videos\rl-agent-step-530000-to-step-530200.mp4
--------------------------------------
| rollout/                |          |
|    success_rate         | 0        |
| time/                   |          |
|    fps                  | 323      |
|    iterations           | 259      |
|    time_elapsed         | 1640     |
|    total_timesteps      | 530432   |
| train/                  |          |
|    approx_kl            | 9.963623 |
|    clip_fraction        | 0.879    |
|    clip_range           | 0.2      |
|    entropy_loss         | -19.2    |
|    explained_variance   | 0.956    |
|    learning_rate        | 0.0003   |
|    loss                 | -0.145   |
|    n_updates            | 2580     |
|    policy_gradient_loss | -0.093   |
|    std                  | 0.634    |
|    value_loss           | 0.0031   |
--------------------------------------
------------------------------

                                                                                                                       

MoviePy - Done !
MoviePy - video ready C:\Users\13233\Documents\Robotics Project\Dexterous-Manipulation\videos\rl-agent-step-540000-to-step-540200.mp4
--------------------------------------
| rollout/                |          |
|    success_rate         | 0        |
| time/                   |          |
|    fps                  | 323      |
|    iterations           | 264      |
|    time_elapsed         | 1671     |
|    total_timesteps      | 540672   |
| train/                  |          |
|    approx_kl            | 11.43391 |
|    clip_fraction        | 0.886    |
|    clip_range           | 0.2      |
|    entropy_loss         | -19      |
|    explained_variance   | 0.958    |
|    learning_rate        | 0.0003   |
|    loss                 | -0.143   |
|    n_updates            | 2630     |
|    policy_gradient_loss | -0.0968  |
|    std                  | 0.628    |
|    value_loss           | 0.0029   |
--------------------------------------
------------------------------

                                                                                                                       

MoviePy - Done !
MoviePy - video ready C:\Users\13233\Documents\Robotics Project\Dexterous-Manipulation\videos\rl-agent-step-550000-to-step-550200.mp4
--------------------------------------
| rollout/                |          |
|    success_rate         | 0        |
| time/                   |          |
|    fps                  | 323      |
|    iterations           | 269      |
|    time_elapsed         | 1703     |
|    total_timesteps      | 550912   |
| train/                  |          |
|    approx_kl            | 9.566885 |
|    clip_fraction        | 0.881    |
|    clip_range           | 0.2      |
|    entropy_loss         | -18.9    |
|    explained_variance   | 0.952    |
|    learning_rate        | 0.0003   |
|    loss                 | -0.137   |
|    n_updates            | 2680     |
|    policy_gradient_loss | -0.0883  |
|    std                  | 0.626    |
|    value_loss           | 0.0036   |
--------------------------------------
------------------------------

                                                                                                                       

MoviePy - Done !
MoviePy - video ready C:\Users\13233\Documents\Robotics Project\Dexterous-Manipulation\videos\rl-agent-step-560000-to-step-560200.mp4
---------------------------------------
| rollout/                |           |
|    success_rate         | 0         |
| time/                   |           |
|    fps                  | 323       |
|    iterations           | 274       |
|    time_elapsed         | 1735      |
|    total_timesteps      | 561152    |
| train/                  |           |
|    approx_kl            | 10.545723 |
|    clip_fraction        | 0.883     |
|    clip_range           | 0.2       |
|    entropy_loss         | -18.8     |
|    explained_variance   | 0.962     |
|    learning_rate        | 0.0003    |
|    loss                 | -0.12     |
|    n_updates            | 2730      |
|    policy_gradient_loss | -0.0908   |
|    std                  | 0.622     |
|    value_loss           | 0.00353   |
---------------------------------------
---------

                                                                                                                       

MoviePy - Done !
MoviePy - video ready C:\Users\13233\Documents\Robotics Project\Dexterous-Manipulation\videos\rl-agent-step-570000-to-step-570200.mp4
--------------------------------------
| rollout/                |          |
|    success_rate         | 0        |
| time/                   |          |
|    fps                  | 323      |
|    iterations           | 279      |
|    time_elapsed         | 1766     |
|    total_timesteps      | 571392   |
| train/                  |          |
|    approx_kl            | 9.776851 |
|    clip_fraction        | 0.882    |
|    clip_range           | 0.2      |
|    entropy_loss         | -18.6    |
|    explained_variance   | 0.966    |
|    learning_rate        | 0.0003   |
|    loss                 | -0.138   |
|    n_updates            | 2780     |
|    policy_gradient_loss | -0.094   |
|    std                  | 0.617    |
|    value_loss           | 0.00332  |
--------------------------------------
------------------------------

                                                                                                                       

MoviePy - Done !
MoviePy - video ready C:\Users\13233\Documents\Robotics Project\Dexterous-Manipulation\videos\rl-agent-step-580000-to-step-580200.mp4
--------------------------------------
| rollout/                |          |
|    success_rate         | 0        |
| time/                   |          |
|    fps                  | 323      |
|    iterations           | 284      |
|    time_elapsed         | 1798     |
|    total_timesteps      | 581632   |
| train/                  |          |
|    approx_kl            | 9.774224 |
|    clip_fraction        | 0.888    |
|    clip_range           | 0.2      |
|    entropy_loss         | -18.5    |
|    explained_variance   | 0.96     |
|    learning_rate        | 0.0003   |
|    loss                 | -0.13    |
|    n_updates            | 2830     |
|    policy_gradient_loss | -0.0947  |
|    std                  | 0.613    |
|    value_loss           | 0.00345  |
--------------------------------------
------------------------------

                                                                                                                       

MoviePy - Done !
MoviePy - video ready C:\Users\13233\Documents\Robotics Project\Dexterous-Manipulation\videos\rl-agent-step-590000-to-step-590200.mp4
--------------------------------------
| rollout/                |          |
|    success_rate         | 0        |
| time/                   |          |
|    fps                  | 323      |
|    iterations           | 289      |
|    time_elapsed         | 1830     |
|    total_timesteps      | 591872   |
| train/                  |          |
|    approx_kl            | 9.754068 |
|    clip_fraction        | 0.887    |
|    clip_range           | 0.2      |
|    entropy_loss         | -18.4    |
|    explained_variance   | 0.965    |
|    learning_rate        | 0.0003   |
|    loss                 | -0.148   |
|    n_updates            | 2880     |
|    policy_gradient_loss | -0.0842  |
|    std                  | 0.61     |
|    value_loss           | 0.00275  |
--------------------------------------
------------------------------

                                                                                                                       

MoviePy - Done !
MoviePy - video ready C:\Users\13233\Documents\Robotics Project\Dexterous-Manipulation\videos\rl-agent-step-600000-to-step-600200.mp4
---------------------------------------
| rollout/                |           |
|    success_rate         | 0         |
| time/                   |           |
|    fps                  | 323       |
|    iterations           | 294       |
|    time_elapsed         | 1861      |
|    total_timesteps      | 602112    |
| train/                  |           |
|    approx_kl            | 11.481815 |
|    clip_fraction        | 0.885     |
|    clip_range           | 0.2       |
|    entropy_loss         | -18.3     |
|    explained_variance   | 0.968     |
|    learning_rate        | 0.0003    |
|    loss                 | -0.139    |
|    n_updates            | 2930      |
|    policy_gradient_loss | -0.0839   |
|    std                  | 0.605     |
|    value_loss           | 0.00254   |
---------------------------------------
---------

                                                                                                                       

MoviePy - Done !
MoviePy - video ready C:\Users\13233\Documents\Robotics Project\Dexterous-Manipulation\videos\rl-agent-step-610000-to-step-610200.mp4
---------------------------------------
| rollout/                |           |
|    success_rate         | 0         |
| time/                   |           |
|    fps                  | 323       |
|    iterations           | 298       |
|    time_elapsed         | 1886      |
|    total_timesteps      | 610304    |
| train/                  |           |
|    approx_kl            | 23.399338 |
|    clip_fraction        | 0.886     |
|    clip_range           | 0.2       |
|    entropy_loss         | -18.2     |
|    explained_variance   | 0.943     |
|    learning_rate        | 0.0003    |
|    loss                 | -0.118    |
|    n_updates            | 2970      |
|    policy_gradient_loss | -0.0853   |
|    std                  | 0.602     |
|    value_loss           | 0.00372   |
---------------------------------------
---------

                                                                                                                       

MoviePy - Done !
MoviePy - video ready C:\Users\13233\Documents\Robotics Project\Dexterous-Manipulation\videos\rl-agent-step-620000-to-step-620200.mp4
---------------------------------------
| rollout/                |           |
|    success_rate         | 0         |
| time/                   |           |
|    fps                  | 323       |
|    iterations           | 303       |
|    time_elapsed         | 1918      |
|    total_timesteps      | 620544    |
| train/                  |           |
|    approx_kl            | 11.181622 |
|    clip_fraction        | 0.894     |
|    clip_range           | 0.2       |
|    entropy_loss         | -18.1     |
|    explained_variance   | 0.958     |
|    learning_rate        | 0.0003    |
|    loss                 | -0.143    |
|    n_updates            | 3020      |
|    policy_gradient_loss | -0.0836   |
|    std                  | 0.599     |
|    value_loss           | 0.00369   |
---------------------------------------
---------

                                                                                                                       

MoviePy - Done !
MoviePy - video ready C:\Users\13233\Documents\Robotics Project\Dexterous-Manipulation\videos\rl-agent-step-630000-to-step-630200.mp4
---------------------------------------
| rollout/                |           |
|    success_rate         | 0         |
| time/                   |           |
|    fps                  | 323       |
|    iterations           | 308       |
|    time_elapsed         | 1949      |
|    total_timesteps      | 630784    |
| train/                  |           |
|    approx_kl            | 48.384956 |
|    clip_fraction        | 0.895     |
|    clip_range           | 0.2       |
|    entropy_loss         | -17.9     |
|    explained_variance   | 0.962     |
|    learning_rate        | 0.0003    |
|    loss                 | -0.1      |
|    n_updates            | 3070      |
|    policy_gradient_loss | -0.0813   |
|    std                  | 0.595     |
|    value_loss           | 0.0034    |
---------------------------------------
---------

                                                                                                                       

MoviePy - Done !
MoviePy - video ready C:\Users\13233\Documents\Robotics Project\Dexterous-Manipulation\videos\rl-agent-step-640000-to-step-640200.mp4
---------------------------------------
| rollout/                |           |
|    success_rate         | 0         |
| time/                   |           |
|    fps                  | 323       |
|    iterations           | 313       |
|    time_elapsed         | 1981      |
|    total_timesteps      | 641024    |
| train/                  |           |
|    approx_kl            | 14.627535 |
|    clip_fraction        | 0.89      |
|    clip_range           | 0.2       |
|    entropy_loss         | -17.9     |
|    explained_variance   | 0.976     |
|    learning_rate        | 0.0003    |
|    loss                 | -0.111    |
|    n_updates            | 3120      |
|    policy_gradient_loss | -0.0831   |
|    std                  | 0.594     |
|    value_loss           | 0.00291   |
---------------------------------------
---------

                                                                                                                       

MoviePy - Done !
MoviePy - video ready C:\Users\13233\Documents\Robotics Project\Dexterous-Manipulation\videos\rl-agent-step-650000-to-step-650200.mp4
--------------------------------------
| rollout/                |          |
|    success_rate         | 0        |
| time/                   |          |
|    fps                  | 323      |
|    iterations           | 318      |
|    time_elapsed         | 2013     |
|    total_timesteps      | 651264   |
| train/                  |          |
|    approx_kl            | 38.69296 |
|    clip_fraction        | 0.887    |
|    clip_range           | 0.2      |
|    entropy_loss         | -17.8    |
|    explained_variance   | 0.959    |
|    learning_rate        | 0.0003   |
|    loss                 | -0.13    |
|    n_updates            | 3170     |
|    policy_gradient_loss | -0.0681  |
|    std                  | 0.592    |
|    value_loss           | 0.0037   |
--------------------------------------
------------------------------

                                                                                                                       

MoviePy - Done !
MoviePy - video ready C:\Users\13233\Documents\Robotics Project\Dexterous-Manipulation\videos\rl-agent-step-660000-to-step-660200.mp4
---------------------------------------
| rollout/                |           |
|    success_rate         | 0         |
| time/                   |           |
|    fps                  | 323       |
|    iterations           | 323       |
|    time_elapsed         | 2044      |
|    total_timesteps      | 661504    |
| train/                  |           |
|    approx_kl            | 18.584023 |
|    clip_fraction        | 0.89      |
|    clip_range           | 0.2       |
|    entropy_loss         | -17.8     |
|    explained_variance   | 0.934     |
|    learning_rate        | 0.0003    |
|    loss                 | -0.124    |
|    n_updates            | 3220      |
|    policy_gradient_loss | -0.0677   |
|    std                  | 0.592     |
|    value_loss           | 0.00369   |
---------------------------------------
---------

                                                                                                                       

MoviePy - Done !
MoviePy - video ready C:\Users\13233\Documents\Robotics Project\Dexterous-Manipulation\videos\rl-agent-step-670000-to-step-670200.mp4
---------------------------------------
| rollout/                |           |
|    success_rate         | 0         |
| time/                   |           |
|    fps                  | 323       |
|    iterations           | 328       |
|    time_elapsed         | 2076      |
|    total_timesteps      | 671744    |
| train/                  |           |
|    approx_kl            | 16.598442 |
|    clip_fraction        | 0.89      |
|    clip_range           | 0.2       |
|    entropy_loss         | -17.7     |
|    explained_variance   | 0.975     |
|    learning_rate        | 0.0003    |
|    loss                 | -0.133    |
|    n_updates            | 3270      |
|    policy_gradient_loss | -0.0864   |
|    std                  | 0.588     |
|    value_loss           | 0.00382   |
---------------------------------------
---------

                                                                                                                       

MoviePy - Done !
MoviePy - video ready C:\Users\13233\Documents\Robotics Project\Dexterous-Manipulation\videos\rl-agent-step-680000-to-step-680200.mp4
---------------------------------------
| rollout/                |           |
|    success_rate         | 0         |
| time/                   |           |
|    fps                  | 323       |
|    iterations           | 333       |
|    time_elapsed         | 2107      |
|    total_timesteps      | 681984    |
| train/                  |           |
|    approx_kl            | 25.596453 |
|    clip_fraction        | 0.894     |
|    clip_range           | 0.2       |
|    entropy_loss         | -17.6     |
|    explained_variance   | 0.961     |
|    learning_rate        | 0.0003    |
|    loss                 | -0.102    |
|    n_updates            | 3320      |
|    policy_gradient_loss | -0.0793   |
|    std                  | 0.586     |
|    value_loss           | 0.00302   |
---------------------------------------
---------

                                                                                                                       

MoviePy - Done !
MoviePy - video ready C:\Users\13233\Documents\Robotics Project\Dexterous-Manipulation\videos\rl-agent-step-690000-to-step-690200.mp4
--------------------------------------
| rollout/                |          |
|    success_rate         | 0        |
| time/                   |          |
|    fps                  | 323      |
|    iterations           | 338      |
|    time_elapsed         | 2139     |
|    total_timesteps      | 692224   |
| train/                  |          |
|    approx_kl            | 12.88732 |
|    clip_fraction        | 0.892    |
|    clip_range           | 0.2      |
|    entropy_loss         | -17.4    |
|    explained_variance   | 0.962    |
|    learning_rate        | 0.0003   |
|    loss                 | -0.119   |
|    n_updates            | 3370     |
|    policy_gradient_loss | -0.0903  |
|    std                  | 0.579    |
|    value_loss           | 0.00321  |
--------------------------------------
------------------------------

                                                                                                                       

MoviePy - Done !
MoviePy - video ready C:\Users\13233\Documents\Robotics Project\Dexterous-Manipulation\videos\rl-agent-step-700000-to-step-700200.mp4
--------------------------------------
| rollout/                |          |
|    success_rate         | 0        |
| time/                   |          |
|    fps                  | 323      |
|    iterations           | 342      |
|    time_elapsed         | 2164     |
|    total_timesteps      | 700416   |
| train/                  |          |
|    approx_kl            | 14.9775  |
|    clip_fraction        | 0.892    |
|    clip_range           | 0.2      |
|    entropy_loss         | -17.3    |
|    explained_variance   | 0.965    |
|    learning_rate        | 0.0003   |
|    loss                 | -0.118   |
|    n_updates            | 3410     |
|    policy_gradient_loss | -0.086   |
|    std                  | 0.577    |
|    value_loss           | 0.00393  |
--------------------------------------
------------------------------

                                                                                                                       

MoviePy - Done !
MoviePy - video ready C:\Users\13233\Documents\Robotics Project\Dexterous-Manipulation\videos\rl-agent-step-710000-to-step-710200.mp4
---------------------------------------
| rollout/                |           |
|    success_rate         | 0         |
| time/                   |           |
|    fps                  | 323       |
|    iterations           | 347       |
|    time_elapsed         | 2196      |
|    total_timesteps      | 710656    |
| train/                  |           |
|    approx_kl            | 11.924132 |
|    clip_fraction        | 0.888     |
|    clip_range           | 0.2       |
|    entropy_loss         | -17.3     |
|    explained_variance   | 0.955     |
|    learning_rate        | 0.0003    |
|    loss                 | -0.108    |
|    n_updates            | 3460      |
|    policy_gradient_loss | -0.0831   |
|    std                  | 0.578     |
|    value_loss           | 0.00349   |
---------------------------------------
---------

                                                                                                                       

MoviePy - Done !
MoviePy - video ready C:\Users\13233\Documents\Robotics Project\Dexterous-Manipulation\videos\rl-agent-step-720000-to-step-720200.mp4
---------------------------------------
| rollout/                |           |
|    success_rate         | 0         |
| time/                   |           |
|    fps                  | 323       |
|    iterations           | 352       |
|    time_elapsed         | 2228      |
|    total_timesteps      | 720896    |
| train/                  |           |
|    approx_kl            | 13.935592 |
|    clip_fraction        | 0.897     |
|    clip_range           | 0.2       |
|    entropy_loss         | -17.2     |
|    explained_variance   | 0.953     |
|    learning_rate        | 0.0003    |
|    loss                 | -0.126    |
|    n_updates            | 3510      |
|    policy_gradient_loss | -0.0771   |
|    std                  | 0.575     |
|    value_loss           | 0.00388   |
---------------------------------------
---------

                                                                                                                       

MoviePy - Done !
MoviePy - video ready C:\Users\13233\Documents\Robotics Project\Dexterous-Manipulation\videos\rl-agent-step-730000-to-step-730200.mp4
---------------------------------------
| rollout/                |           |
|    success_rate         | 0         |
| time/                   |           |
|    fps                  | 323       |
|    iterations           | 357       |
|    time_elapsed         | 2259      |
|    total_timesteps      | 731136    |
| train/                  |           |
|    approx_kl            | 19.888214 |
|    clip_fraction        | 0.891     |
|    clip_range           | 0.2       |
|    entropy_loss         | -17.1     |
|    explained_variance   | 0.944     |
|    learning_rate        | 0.0003    |
|    loss                 | -0.148    |
|    n_updates            | 3560      |
|    policy_gradient_loss | -0.0834   |
|    std                  | 0.572     |
|    value_loss           | 0.004     |
---------------------------------------
---------

                                                                                                                       

MoviePy - Done !
MoviePy - video ready C:\Users\13233\Documents\Robotics Project\Dexterous-Manipulation\videos\rl-agent-step-740000-to-step-740200.mp4
---------------------------------------
| rollout/                |           |
|    success_rate         | 0         |
| time/                   |           |
|    fps                  | 323       |
|    iterations           | 362       |
|    time_elapsed         | 2291      |
|    total_timesteps      | 741376    |
| train/                  |           |
|    approx_kl            | 13.183958 |
|    clip_fraction        | 0.896     |
|    clip_range           | 0.2       |
|    entropy_loss         | -17       |
|    explained_variance   | 0.952     |
|    learning_rate        | 0.0003    |
|    loss                 | -0.141    |
|    n_updates            | 3610      |
|    policy_gradient_loss | -0.0864   |
|    std                  | 0.569     |
|    value_loss           | 0.00354   |
---------------------------------------
---------

                                                                                                                       

MoviePy - Done !
MoviePy - video ready C:\Users\13233\Documents\Robotics Project\Dexterous-Manipulation\videos\rl-agent-step-750000-to-step-750200.mp4
---------------------------------------
| rollout/                |           |
|    success_rate         | 0         |
| time/                   |           |
|    fps                  | 323       |
|    iterations           | 367       |
|    time_elapsed         | 2322      |
|    total_timesteps      | 751616    |
| train/                  |           |
|    approx_kl            | 33.413227 |
|    clip_fraction        | 0.885     |
|    clip_range           | 0.2       |
|    entropy_loss         | -16.8     |
|    explained_variance   | 0.948     |
|    learning_rate        | 0.0003    |
|    loss                 | -0.124    |
|    n_updates            | 3660      |
|    policy_gradient_loss | -0.0657   |
|    std                  | 0.566     |
|    value_loss           | 0.00258   |
---------------------------------------
---------

                                                                                                                       

MoviePy - Done !
MoviePy - video ready C:\Users\13233\Documents\Robotics Project\Dexterous-Manipulation\videos\rl-agent-step-760000-to-step-760200.mp4
---------------------------------------
| rollout/                |           |
|    success_rate         | 0         |
| time/                   |           |
|    fps                  | 323       |
|    iterations           | 372       |
|    time_elapsed         | 2354      |
|    total_timesteps      | 761856    |
| train/                  |           |
|    approx_kl            | 15.004797 |
|    clip_fraction        | 0.899     |
|    clip_range           | 0.2       |
|    entropy_loss         | -16.8     |
|    explained_variance   | 0.951     |
|    learning_rate        | 0.0003    |
|    loss                 | -0.115    |
|    n_updates            | 3710      |
|    policy_gradient_loss | -0.0763   |
|    std                  | 0.562     |
|    value_loss           | 0.00335   |
---------------------------------------
---------

                                                                                                                       

MoviePy - Done !
MoviePy - video ready C:\Users\13233\Documents\Robotics Project\Dexterous-Manipulation\videos\rl-agent-step-770000-to-step-770200.mp4
--------------------------------------
| rollout/                |          |
|    success_rate         | 0        |
| time/                   |          |
|    fps                  | 323      |
|    iterations           | 377      |
|    time_elapsed         | 2385     |
|    total_timesteps      | 772096   |
| train/                  |          |
|    approx_kl            | 12.59623 |
|    clip_fraction        | 0.895    |
|    clip_range           | 0.2      |
|    entropy_loss         | -16.6    |
|    explained_variance   | 0.962    |
|    learning_rate        | 0.0003   |
|    loss                 | -0.114   |
|    n_updates            | 3760     |
|    policy_gradient_loss | -0.0741  |
|    std                  | 0.557    |
|    value_loss           | 0.00423  |
--------------------------------------
------------------------------

                                                                                                                       

MoviePy - Done !
MoviePy - video ready C:\Users\13233\Documents\Robotics Project\Dexterous-Manipulation\videos\rl-agent-step-780000-to-step-780200.mp4
---------------------------------------
| rollout/                |           |
|    success_rate         | 0         |
| time/                   |           |
|    fps                  | 323       |
|    iterations           | 381       |
|    time_elapsed         | 2410      |
|    total_timesteps      | 780288    |
| train/                  |           |
|    approx_kl            | 10.774435 |
|    clip_fraction        | 0.892     |
|    clip_range           | 0.2       |
|    entropy_loss         | -16.5     |
|    explained_variance   | 0.981     |
|    learning_rate        | 0.0003    |
|    loss                 | -0.121    |
|    n_updates            | 3800      |
|    policy_gradient_loss | -0.0816   |
|    std                  | 0.554     |
|    value_loss           | 0.0029    |
---------------------------------------
---------

                                                                                                                       

MoviePy - Done !
MoviePy - video ready C:\Users\13233\Documents\Robotics Project\Dexterous-Manipulation\videos\rl-agent-step-790000-to-step-790200.mp4
---------------------------------------
| rollout/                |           |
|    success_rate         | 0         |
| time/                   |           |
|    fps                  | 323       |
|    iterations           | 386       |
|    time_elapsed         | 2442      |
|    total_timesteps      | 790528    |
| train/                  |           |
|    approx_kl            | 22.702383 |
|    clip_fraction        | 0.895     |
|    clip_range           | 0.2       |
|    entropy_loss         | -16.4     |
|    explained_variance   | 0.944     |
|    learning_rate        | 0.0003    |
|    loss                 | -0.0762   |
|    n_updates            | 3850      |
|    policy_gradient_loss | -0.073    |
|    std                  | 0.553     |
|    value_loss           | 0.00355   |
---------------------------------------
---------

                                                                                                                       

MoviePy - Done !
MoviePy - video ready C:\Users\13233\Documents\Robotics Project\Dexterous-Manipulation\videos\rl-agent-step-800000-to-step-800200.mp4
---------------------------------------
| rollout/                |           |
|    success_rate         | 0         |
| time/                   |           |
|    fps                  | 323       |
|    iterations           | 391       |
|    time_elapsed         | 2473      |
|    total_timesteps      | 800768    |
| train/                  |           |
|    approx_kl            | 24.529465 |
|    clip_fraction        | 0.898     |
|    clip_range           | 0.2       |
|    entropy_loss         | -16.3     |
|    explained_variance   | 0.95      |
|    learning_rate        | 0.0003    |
|    loss                 | -0.137    |
|    n_updates            | 3900      |
|    policy_gradient_loss | -0.0729   |
|    std                  | 0.55      |
|    value_loss           | 0.00413   |
---------------------------------------
---------

                                                                                                                       

MoviePy - Done !
MoviePy - video ready C:\Users\13233\Documents\Robotics Project\Dexterous-Manipulation\videos\rl-agent-step-810000-to-step-810200.mp4
---------------------------------------
| rollout/                |           |
|    success_rate         | 0         |
| time/                   |           |
|    fps                  | 323       |
|    iterations           | 396       |
|    time_elapsed         | 2505      |
|    total_timesteps      | 811008    |
| train/                  |           |
|    approx_kl            | 16.274971 |
|    clip_fraction        | 0.903     |
|    clip_range           | 0.2       |
|    entropy_loss         | -16.2     |
|    explained_variance   | 0.933     |
|    learning_rate        | 0.0003    |
|    loss                 | -0.143    |
|    n_updates            | 3950      |
|    policy_gradient_loss | -0.0594   |
|    std                  | 0.546     |
|    value_loss           | 0.00477   |
---------------------------------------
---------

                                                                                                                       

MoviePy - Done !
MoviePy - video ready C:\Users\13233\Documents\Robotics Project\Dexterous-Manipulation\videos\rl-agent-step-820000-to-step-820200.mp4
---------------------------------------
| rollout/                |           |
|    success_rate         | 0         |
| time/                   |           |
|    fps                  | 323       |
|    iterations           | 401       |
|    time_elapsed         | 2536      |
|    total_timesteps      | 821248    |
| train/                  |           |
|    approx_kl            | 13.139738 |
|    clip_fraction        | 0.899     |
|    clip_range           | 0.2       |
|    entropy_loss         | -16.1     |
|    explained_variance   | 0.96      |
|    learning_rate        | 0.0003    |
|    loss                 | -0.0664   |
|    n_updates            | 4000      |
|    policy_gradient_loss | -0.0726   |
|    std                  | 0.544     |
|    value_loss           | 0.00379   |
---------------------------------------
---------

                                                                                                                       

MoviePy - Done !
MoviePy - video ready C:\Users\13233\Documents\Robotics Project\Dexterous-Manipulation\videos\rl-agent-step-830000-to-step-830200.mp4
---------------------------------------
| rollout/                |           |
|    success_rate         | 0         |
| time/                   |           |
|    fps                  | 323       |
|    iterations           | 406       |
|    time_elapsed         | 2567      |
|    total_timesteps      | 831488    |
| train/                  |           |
|    approx_kl            | 17.780554 |
|    clip_fraction        | 0.902     |
|    clip_range           | 0.2       |
|    entropy_loss         | -16       |
|    explained_variance   | 0.927     |
|    learning_rate        | 0.0003    |
|    loss                 | -0.144    |
|    n_updates            | 4050      |
|    policy_gradient_loss | -0.0702   |
|    std                  | 0.543     |
|    value_loss           | 0.00343   |
---------------------------------------
---------

                                                                                                                       

MoviePy - Done !
MoviePy - video ready C:\Users\13233\Documents\Robotics Project\Dexterous-Manipulation\videos\rl-agent-step-840000-to-step-840200.mp4
---------------------------------------
| rollout/                |           |
|    success_rate         | 0         |
| time/                   |           |
|    fps                  | 323       |
|    iterations           | 411       |
|    time_elapsed         | 2599      |
|    total_timesteps      | 841728    |
| train/                  |           |
|    approx_kl            | 12.168095 |
|    clip_fraction        | 0.896     |
|    clip_range           | 0.2       |
|    entropy_loss         | -15.9     |
|    explained_variance   | 0.961     |
|    learning_rate        | 0.0003    |
|    loss                 | -0.118    |
|    n_updates            | 4100      |
|    policy_gradient_loss | -0.057    |
|    std                  | 0.539     |
|    value_loss           | 0.00409   |
---------------------------------------
---------

                                                                                                                       

MoviePy - Done !
MoviePy - video ready C:\Users\13233\Documents\Robotics Project\Dexterous-Manipulation\videos\rl-agent-step-850000-to-step-850200.mp4
---------------------------------------
| rollout/                |           |
|    success_rate         | 0         |
| time/                   |           |
|    fps                  | 323       |
|    iterations           | 416       |
|    time_elapsed         | 2630      |
|    total_timesteps      | 851968    |
| train/                  |           |
|    approx_kl            | 15.974403 |
|    clip_fraction        | 0.904     |
|    clip_range           | 0.2       |
|    entropy_loss         | -15.8     |
|    explained_variance   | 0.977     |
|    learning_rate        | 0.0003    |
|    loss                 | -0.121    |
|    n_updates            | 4150      |
|    policy_gradient_loss | -0.0692   |
|    std                  | 0.536     |
|    value_loss           | 0.00359   |
---------------------------------------
---------

                                                                                                                       

MoviePy - Done !
MoviePy - video ready C:\Users\13233\Documents\Robotics Project\Dexterous-Manipulation\videos\rl-agent-step-860000-to-step-860200.mp4
---------------------------------------
| rollout/                |           |
|    success_rate         | 0         |
| time/                   |           |
|    fps                  | 323       |
|    iterations           | 421       |
|    time_elapsed         | 2662      |
|    total_timesteps      | 862208    |
| train/                  |           |
|    approx_kl            | 51.534576 |
|    clip_fraction        | 0.908     |
|    clip_range           | 0.2       |
|    entropy_loss         | -15.7     |
|    explained_variance   | 0.979     |
|    learning_rate        | 0.0003    |
|    loss                 | -0.0913   |
|    n_updates            | 4200      |
|    policy_gradient_loss | -0.0778   |
|    std                  | 0.535     |
|    value_loss           | 0.00302   |
---------------------------------------
---------

                                                                                                                       

MoviePy - Done !
MoviePy - video ready C:\Users\13233\Documents\Robotics Project\Dexterous-Manipulation\videos\rl-agent-step-870000-to-step-870200.mp4
---------------------------------------
| rollout/                |           |
|    success_rate         | 0         |
| time/                   |           |
|    fps                  | 323       |
|    iterations           | 425       |
|    time_elapsed         | 2687      |
|    total_timesteps      | 870400    |
| train/                  |           |
|    approx_kl            | 29.316446 |
|    clip_fraction        | 0.903     |
|    clip_range           | 0.2       |
|    entropy_loss         | -15.7     |
|    explained_variance   | 0.978     |
|    learning_rate        | 0.0003    |
|    loss                 | -0.106    |
|    n_updates            | 4240      |
|    policy_gradient_loss | -0.0544   |
|    std                  | 0.533     |
|    value_loss           | 0.00288   |
---------------------------------------
---------

                                                                                                                       

MoviePy - Done !
MoviePy - video ready C:\Users\13233\Documents\Robotics Project\Dexterous-Manipulation\videos\rl-agent-step-880000-to-step-880200.mp4
---------------------------------------
| rollout/                |           |
|    success_rate         | 0         |
| time/                   |           |
|    fps                  | 323       |
|    iterations           | 430       |
|    time_elapsed         | 2719      |
|    total_timesteps      | 880640    |
| train/                  |           |
|    approx_kl            | 21.976112 |
|    clip_fraction        | 0.901     |
|    clip_range           | 0.2       |
|    entropy_loss         | -15.7     |
|    explained_variance   | 0.976     |
|    learning_rate        | 0.0003    |
|    loss                 | -0.137    |
|    n_updates            | 4290      |
|    policy_gradient_loss | -0.0526   |
|    std                  | 0.532     |
|    value_loss           | 0.00287   |
---------------------------------------
---------

                                                                                                                       

MoviePy - Done !
MoviePy - video ready C:\Users\13233\Documents\Robotics Project\Dexterous-Manipulation\videos\rl-agent-step-890000-to-step-890200.mp4
---------------------------------------
| rollout/                |           |
|    success_rate         | 0         |
| time/                   |           |
|    fps                  | 323       |
|    iterations           | 435       |
|    time_elapsed         | 2750      |
|    total_timesteps      | 890880    |
| train/                  |           |
|    approx_kl            | 14.470791 |
|    clip_fraction        | 0.899     |
|    clip_range           | 0.2       |
|    entropy_loss         | -15.6     |
|    explained_variance   | 0.969     |
|    learning_rate        | 0.0003    |
|    loss                 | -0.089    |
|    n_updates            | 4340      |
|    policy_gradient_loss | -0.066    |
|    std                  | 0.529     |
|    value_loss           | 0.00354   |
---------------------------------------
---------

                                                                                                                       

MoviePy - Done !
MoviePy - video ready C:\Users\13233\Documents\Robotics Project\Dexterous-Manipulation\videos\rl-agent-step-900000-to-step-900200.mp4
---------------------------------------
| rollout/                |           |
|    success_rate         | 0         |
| time/                   |           |
|    fps                  | 323       |
|    iterations           | 440       |
|    time_elapsed         | 2782      |
|    total_timesteps      | 901120    |
| train/                  |           |
|    approx_kl            | 22.683617 |
|    clip_fraction        | 0.904     |
|    clip_range           | 0.2       |
|    entropy_loss         | -15.6     |
|    explained_variance   | 0.943     |
|    learning_rate        | 0.0003    |
|    loss                 | -0.121    |
|    n_updates            | 4390      |
|    policy_gradient_loss | -0.0768   |
|    std                  | 0.529     |
|    value_loss           | 0.00562   |
---------------------------------------
---------

                                                                                                                       

MoviePy - Done !
MoviePy - video ready C:\Users\13233\Documents\Robotics Project\Dexterous-Manipulation\videos\rl-agent-step-910000-to-step-910200.mp4
--------------------------------------
| rollout/                |          |
|    success_rate         | 0        |
| time/                   |          |
|    fps                  | 323      |
|    iterations           | 445      |
|    time_elapsed         | 2814     |
|    total_timesteps      | 911360   |
| train/                  |          |
|    approx_kl            | 15.17538 |
|    clip_fraction        | 0.906    |
|    clip_range           | 0.2      |
|    entropy_loss         | -15.5    |
|    explained_variance   | 0.976    |
|    learning_rate        | 0.0003   |
|    loss                 | -0.144   |
|    n_updates            | 4440     |
|    policy_gradient_loss | -0.0678  |
|    std                  | 0.527    |
|    value_loss           | 0.0041   |
--------------------------------------
------------------------------

                                                                                                                       

MoviePy - Done !
MoviePy - video ready C:\Users\13233\Documents\Robotics Project\Dexterous-Manipulation\videos\rl-agent-step-920000-to-step-920200.mp4
--------------------------------------
| rollout/                |          |
|    success_rate         | 0        |
| time/                   |          |
|    fps                  | 323      |
|    iterations           | 450      |
|    time_elapsed         | 2845     |
|    total_timesteps      | 921600   |
| train/                  |          |
|    approx_kl            | 18.01215 |
|    clip_fraction        | 0.904    |
|    clip_range           | 0.2      |
|    entropy_loss         | -15.4    |
|    explained_variance   | 0.968    |
|    learning_rate        | 0.0003   |
|    loss                 | -0.136   |
|    n_updates            | 4490     |
|    policy_gradient_loss | -0.0661  |
|    std                  | 0.526    |
|    value_loss           | 0.00428  |
--------------------------------------
------------------------------

                                                                                                                       

MoviePy - Done !
MoviePy - video ready C:\Users\13233\Documents\Robotics Project\Dexterous-Manipulation\videos\rl-agent-step-930000-to-step-930200.mp4
---------------------------------------
| rollout/                |           |
|    success_rate         | 0         |
| time/                   |           |
|    fps                  | 323       |
|    iterations           | 455       |
|    time_elapsed         | 2877      |
|    total_timesteps      | 931840    |
| train/                  |           |
|    approx_kl            | 20.015503 |
|    clip_fraction        | 0.906     |
|    clip_range           | 0.2       |
|    entropy_loss         | -15.3     |
|    explained_variance   | 0.97      |
|    learning_rate        | 0.0003    |
|    loss                 | -0.127    |
|    n_updates            | 4540      |
|    policy_gradient_loss | -0.0643   |
|    std                  | 0.523     |
|    value_loss           | 0.00349   |
---------------------------------------
---------

                                                                                                                       

MoviePy - Done !
MoviePy - video ready C:\Users\13233\Documents\Robotics Project\Dexterous-Manipulation\videos\rl-agent-step-940000-to-step-940200.mp4
---------------------------------------
| rollout/                |           |
|    success_rate         | 0         |
| time/                   |           |
|    fps                  | 323       |
|    iterations           | 460       |
|    time_elapsed         | 2908      |
|    total_timesteps      | 942080    |
| train/                  |           |
|    approx_kl            | 37.414585 |
|    clip_fraction        | 0.902     |
|    clip_range           | 0.2       |
|    entropy_loss         | -15.1     |
|    explained_variance   | 0.967     |
|    learning_rate        | 0.0003    |
|    loss                 | -0.12     |
|    n_updates            | 4590      |
|    policy_gradient_loss | -0.0612   |
|    std                  | 0.519     |
|    value_loss           | 0.00502   |
---------------------------------------
---------

                                                                                                                       

MoviePy - Done !
MoviePy - video ready C:\Users\13233\Documents\Robotics Project\Dexterous-Manipulation\videos\rl-agent-step-950000-to-step-950200.mp4
---------------------------------------
| rollout/                |           |
|    success_rate         | 0         |
| time/                   |           |
|    fps                  | 323       |
|    iterations           | 464       |
|    time_elapsed         | 2933      |
|    total_timesteps      | 950272    |
| train/                  |           |
|    approx_kl            | 38.844753 |
|    clip_fraction        | 0.901     |
|    clip_range           | 0.2       |
|    entropy_loss         | -15       |
|    explained_variance   | 0.935     |
|    learning_rate        | 0.0003    |
|    loss                 | -0.121    |
|    n_updates            | 4630      |
|    policy_gradient_loss | -0.0657   |
|    std                  | 0.515     |
|    value_loss           | 0.0033    |
---------------------------------------
---------

                                                                                                                       

MoviePy - Done !
MoviePy - video ready C:\Users\13233\Documents\Robotics Project\Dexterous-Manipulation\videos\rl-agent-step-960000-to-step-960200.mp4
---------------------------------------
| rollout/                |           |
|    success_rate         | 0         |
| time/                   |           |
|    fps                  | 323       |
|    iterations           | 469       |
|    time_elapsed         | 2965      |
|    total_timesteps      | 960512    |
| train/                  |           |
|    approx_kl            | 25.322777 |
|    clip_fraction        | 0.908     |
|    clip_range           | 0.2       |
|    entropy_loss         | -14.9     |
|    explained_variance   | 0.913     |
|    learning_rate        | 0.0003    |
|    loss                 | -0.135    |
|    n_updates            | 4680      |
|    policy_gradient_loss | -0.068    |
|    std                  | 0.513     |
|    value_loss           | 0.00438   |
---------------------------------------
---------

                                                                                                                       

MoviePy - Done !
MoviePy - video ready C:\Users\13233\Documents\Robotics Project\Dexterous-Manipulation\videos\rl-agent-step-970000-to-step-970200.mp4
---------------------------------------
| rollout/                |           |
|    success_rate         | 0         |
| time/                   |           |
|    fps                  | 323       |
|    iterations           | 474       |
|    time_elapsed         | 2996      |
|    total_timesteps      | 970752    |
| train/                  |           |
|    approx_kl            | 22.419868 |
|    clip_fraction        | 0.904     |
|    clip_range           | 0.2       |
|    entropy_loss         | -14.9     |
|    explained_variance   | 0.95      |
|    learning_rate        | 0.0003    |
|    loss                 | -0.123    |
|    n_updates            | 4730      |
|    policy_gradient_loss | -0.0638   |
|    std                  | 0.511     |
|    value_loss           | 0.00351   |
---------------------------------------
---------

                                                                                                                       

MoviePy - Done !
MoviePy - video ready C:\Users\13233\Documents\Robotics Project\Dexterous-Manipulation\videos\rl-agent-step-980000-to-step-980200.mp4
--------------------------------------
| rollout/                |          |
|    success_rate         | 0        |
| time/                   |          |
|    fps                  | 324      |
|    iterations           | 479      |
|    time_elapsed         | 3027     |
|    total_timesteps      | 980992   |
| train/                  |          |
|    approx_kl            | 20.28061 |
|    clip_fraction        | 0.904    |
|    clip_range           | 0.2      |
|    entropy_loss         | -14.9    |
|    explained_variance   | 0.923    |
|    learning_rate        | 0.0003   |
|    loss                 | -0.0965  |
|    n_updates            | 4780     |
|    policy_gradient_loss | -0.0661  |
|    std                  | 0.511    |
|    value_loss           | 0.00474  |
--------------------------------------
------------------------------

                                                                                                                       

MoviePy - Done !
MoviePy - video ready C:\Users\13233\Documents\Robotics Project\Dexterous-Manipulation\videos\rl-agent-step-990000-to-step-990200.mp4
---------------------------------------
| rollout/                |           |
|    success_rate         | 0         |
| time/                   |           |
|    fps                  | 324       |
|    iterations           | 484       |
|    time_elapsed         | 3059      |
|    total_timesteps      | 991232    |
| train/                  |           |
|    approx_kl            | 159.79828 |
|    clip_fraction        | 0.912     |
|    clip_range           | 0.2       |
|    entropy_loss         | -14.7     |
|    explained_variance   | 0.951     |
|    learning_rate        | 0.0003    |
|    loss                 | -0.12     |
|    n_updates            | 4830      |
|    policy_gradient_loss | -0.0697   |
|    std                  | 0.508     |
|    value_loss           | 0.00371   |
---------------------------------------
---------

                                                                                                                       

MoviePy - Done !
MoviePy - video ready C:\Users\13233\Documents\Robotics Project\Dexterous-Manipulation\videos\rl-agent-step-1000000-to-step-1000200.mp4
---------------------------------------
| rollout/                |           |
|    success_rate         | 0         |
| time/                   |           |
|    fps                  | 324       |
|    iterations           | 489       |
|    time_elapsed         | 3090      |
|    total_timesteps      | 1001472   |
| train/                  |           |
|    approx_kl            | 19.913387 |
|    clip_fraction        | 0.9       |
|    clip_range           | 0.2       |
|    entropy_loss         | -14.6     |
|    explained_variance   | 0.968     |
|    learning_rate        | 0.0003    |
|    loss                 | -0.119    |
|    n_updates            | 4880      |
|    policy_gradient_loss | -0.0583   |
|    std                  | 0.504     |
|    value_loss           | 0.0045    |
---------------------------------------
