# Test Recurrent Policy with Extreme Parameter Variation 

In [1]:
import numpy as np
import os,sys



sys.path.append('../../../RL_lib/Agents')
sys.path.append('../../../RL_lib/Policies/PPO')
sys.path.append('../../../RL_lib/Policies/Common')
sys.path.append('../../../RL_lib/Utils')
sys.path.append('../../../Env')
sys.path.append('../../../Imaging')


%load_ext autoreload
%load_ext autoreload
%autoreload 2
%matplotlib nbagg
import os
print(os.getcwd())

The autoreload extension is already loaded. To reload it, use:
  %reload_ext autoreload
/Users/briangaudet/Study/Subjects/MachineLearning/Projects/Asteroid_CPO_seeker-master/Experiments/Extended/Optimize_HF


In [2]:
%%html
<style>
/* Let notebook output areas grow up to a fixed maximum height. */
.output_wrapper, .output {
    height:auto !important;
    max-height:1000px;  /* your desired max-height here */
}
/* Remove the inset shadow drawn around scrolling output areas. */
.output_scroll {
    box-shadow:none !important;
    /* Vendor-prefixed properties need the leading hyphen to be recognized. */
    -webkit-box-shadow:none !important;
}
</style>

# Optimize Policy

In [3]:
from env import Env
import env_utils as envu
from dynamics_model import Dynamics_model
from lander_model import Lander_model
from ic_gen import Landing_icgen
import rl_utils
import attitude_utils as attu
import optics_utils as optu
from arch_policy_vf import Arch

from policy_ppo import Policy
from softmax_pd import Softmax_pd as PD
from value_function import Value_function

import policy_nets as policy_nets
import valfunc_nets as valfunc_nets


from agent import Agent


import torch.nn as nn

from flat_constraint import Flat_constraint
from glideslope_constraint import Glideslope_constraint
from rh_constraint import RH_constraint
from no_attitude_constraint import Attitude_constraint
from w_constraint import W_constraint
from reward_attitude import Reward
from asteroid_hfr import Asteroid

from thruster_model_cubesat import Thruster_model

from sensor import Sensor
from seeker import Seeker

# --- Landing site configuration ---------------------------------------------
# No landing-site override is supplied (a fixed-site alternative is left
# commented out); landing_site_range is forwarded to the sensor, the lander
# model and the environment below.
landing_site_range = 0.0
landing_site = None #np.asarray([-250.,0.,0.])

# NOTE(review): omega_range presumably bounds the asteroid rotation rate -- confirm in asteroid_hfr.
asteroid_model = Asteroid(landing_site_override=landing_site, omega_range=(1e-5,5e-4))

# Attitude parameterization object shared by the seeker, sensor, lander model,
# attitude constraint and initial-condition generator.
ap = attu.Quaternion_attitude()

# --- Seeker / sensor --------------------------------------------------------
# C_cb and r_cb are passed straight to the Seeker; fov is 90 converted via
# envu.deg2rad.
C_cb = optu.rotate_optical_axis(0.0, 0.0, np.pi)
r_cb = np.asarray([0,0,0])
fov=envu.deg2rad(90)
seeker = Seeker(attitude_parameterization=ap, C_cb=C_cb, r_cb=r_cb,
                radome_slope_bounds=(-0.05,0.05), range_bias=(-0.05,0.05),
                   fov=fov, debug=False)
sensor = Sensor(seeker, attitude_parameterization=ap,  use_range=True, apf_tau1=300, use_dp=False,
                      landing_site_range=landing_site_range,
                      pool_type='max', state_type=Sensor.optflow_state_range_dp1)
# Print the sensor's current tracking function, explicitly select track_func1,
# then print again to confirm which one is active.
print(sensor.track_func)
sensor.track_func = sensor.track_func1
print(sensor.track_func)

# --- Dynamics, thruster and lander models -----------------------------------
logger = rl_utils.Logger()
# NOTE(review): h=2 is presumably the integration step size -- confirm in dynamics_model.
dynamics_model = Dynamics_model(h=2)
thruster_model = Thruster_model(pulsed=True, scale=1.0, offset=0.4)
lander_model = Lander_model(asteroid_model, thruster_model, attitude_parameterization=ap, sensor=sensor, 
                             landing_site_range=landing_site_range, com_range=(-0.10,0.10),
                              attitude_bias=0.05, omega_bias=0.05)

# Select which lander-model method supplies the agent's observation.
lander_model.get_state_agent = lander_model.get_state_agent_sensor_att_w2

# --- Network dimensions -----------------------------------------------------
# obs_dim is the input width of both GRU networks; the policy network outputs
# logit_dim = action_dim * actions_per_dim values, and the same
# (action_dim, actions_per_dim) pair parameterizes the softmax PD.
obs_dim = 13
action_dim = 12
actions_per_dim = 2
logit_dim = action_dim * actions_per_dim

# Shared by the policy network, the value-function network and the agent.
recurrent_steps = 60

# --- Reward and constraints -------------------------------------------------
reward_object = Reward(landing_rlimit=2, landing_vlimit=0.1, 
                       tracking_bias=0.01, fov_coeff=-50., 
                       att_coeff=-0.20,
                       tracking_coeff=-0.5, magv_coeff=-1.0,
                       fuel_coeff=-0.10,  landing_coeff=10.0)

glideslope_constraint = Glideslope_constraint(gs_limit=-1.0)
# NOTE(review): shape_constraint is constructed here but is not referenced
# again in this cell (it is not passed to Env) -- confirm whether that is intentional.
shape_constraint = Flat_constraint()
attitude_constraint = Attitude_constraint(ap)
w_constraint = W_constraint(w_limit=(0.1,0.1,0.1), w_margin=(0.05,0.05,0.05))
rh_constraint = RH_constraint(rh_limit=150)

# --- Initial-condition generator --------------------------------------------
# wi sets symmetric lower/upper bounds (lander_wll / lander_wul) on all three
# axes. NOTE(review): presumably the initial angular-velocity range -- confirm in ic_gen.
wi=0.05
ic_gen = Landing_icgen((800,1000), 
                           p_engine_fail=0.5,
                           engine_fail_scale=(0.5,1.0),
                           lander_wll=(-wi,-wi,-wi),
                           lander_wul=(wi,wi,wi),
                           attitude_parameterization=ap,
                           position_error=(0,np.pi/4),
                           heading_error=(0,np.pi/8),
                           attitude_error=(0,np.pi/16),
                           min_mass=450, max_mass=500,
                           mag_v=(0.05,0.1),
                           debug=False,
                           inertia_uncertainty_diag=10.0,
                           inertia_uncertainty_offdiag=1.0)

# --- Environment ------------------------------------------------------------
# Ties together the IC generator, lander and dynamics models, logger, reward
# object and the glideslope / attitude / w / rh constraints.
env = Env(ic_gen, lander_model, dynamics_model, logger,
          landing_site_range=landing_site_range,
          debug_done=False,
          reward_object=reward_object,
          glideslope_constraint=glideslope_constraint,
          attitude_constraint=attitude_constraint,
          w_constraint=w_constraint,
          rh_constraint=rh_constraint,
          tf_limit=5000.0,print_every=10,nav_period=6)




# Display the initial-condition generator's configuration.
env.ic_gen.show()

# --- Policy, value function and agent ---------------------------------------
arch = Arch()

# Recurrent (GRU1) policy over a softmax action distribution; shuffle is
# disabled for both the policy and the value function.
policy = Policy(policy_nets.GRU1(obs_dim, logit_dim, recurrent_steps=recurrent_steps), 
                PD(action_dim, actions_per_dim),
                shuffle=False,
                kl_targ=0.001,epochs=20, beta=0.1, servo_kl=True, max_grad_norm=30, scale_vector_obs=True,
                init_func=rl_utils.xn_init)
value_function = Value_function(valfunc_nets.GRU1(obs_dim, recurrent_steps=recurrent_steps), scale_obs=True,
                                shuffle=False, batch_size=9999999, max_grad_norm=30, 
                                verbose=False)

# The agent uses env.rl_stats as its monitor.
# NOTE(review): the argument to train() is presumably the number of training
# episodes -- confirm in agent.Agent.train.
agent = Agent(arch, policy, value_function, None, env, logger,
              policy_episodes=30, policy_steps=3000, gamma1=0.95, gamma2=0.995, 
              recurrent_steps=recurrent_steps, monitor=env.rl_stats)
agent.train(120000)

Quaternion_attitude
Euler321 Attitude
C_cb: 
[[ 1.0000000e+00  0.0000000e+00 -0.0000000e+00]
 [ 0.0000000e+00 -1.0000000e+00  1.2246468e-16]
 [ 0.0000000e+00 -1.2246468e-16 -1.0000000e+00]]
[ 0.0000000e+00 -1.2246468e-16 -1.0000000e+00]
using max  pooling
V4: Output State type:  <function Sensor.optflow_state_range_dp1 at 0x138416488>
<bound method Sensor.track_func1 of <sensor.Sensor object at 0x1287796a0>>
<bound method Sensor.track_func1 of <sensor.Sensor object at 0x1287796a0>>
6dof dynamics model 
thruster model: 
Inertia Tensor:  [[333.33333333   0.           0.        ]
 [  0.         333.33333333   0.        ]
 [  0.           0.         333.33333333]]
Lander Model: 
Reward_terminal equator
queue fixed
Flat Constraint
Attitude Constraint
Rotational Velocity Constraint
Position Hysterises Constraint


<IPython.core.display.Javascript object>

<IPython.core.display.Javascript object>

<IPython.core.display.Javascript object>

<IPython.core.display.Javascript object>

<IPython.core.display.Javascript object>

<IPython.core.display.Javascript object>

<IPython.core.display.Javascript object>

lander env RHL
Landing_icgen:
[[-1.]
 [ 1.]]
Policy with vectorized sample
	xn_init: layer  Linear(in_features=13, out_features=130, bias=True)
	xn_init: layer  GRUCell(130, 176)
	xn_init: layer  Linear(in_features=176, out_features=240, bias=True)
	xn_init: layer  Linear(in_features=240, out_features=24, bias=True)
Policy: recurrent steps > 1, disabling shuffle
	Test Mode:          False
	Clip Param:         0.1
	Shuffle :           False
	Shuffle by Chunks:  False
	Max Grad Norm:      30
	Recurrent Steps:    60
	Rollout Limit:      1
	Advantage Func:     <advantage_utils.Adv_default object at 0x1382bd240>
	Advantage Norm:     <function Adv_normalizer.apply at 0x137671488>
	PD:                 <softmax_pd.Softmax_pd object at 0x13a4a0ba8>
	Loss Function:      <bound method Policy.calc_loss1 of <policy_ppo.Policy object at 0x13a4b30f0>>
Value Funtion
	xn_init: layer  Linear(in_features=13, out_features=130, bias=True)
	xn_init: layer  GRUCell(130, 25)
	xn_init: layer  Linear(in_feature

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.1173   0.0344   0.1774   0.1774   0.1295   0.0344
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.2206   0.0237   0.2484   5.4889   2.1784   2.1397
***** Episode 223, Mean R = -238.4  Std R = 86.7  Min R = -405.3
PolicyLoss: -0.0116
Policy_Beta: 0.0444
Policy_Entropy: 0.000332
Policy_KL: 0.000897
Policy_SD: 0.954
Policy_lr_mult: 1
Steps: 3.76e+03
TotalSteps: 2.4e+04
VF_0_ExplainedVarNew: 0.0216
VF_0_ExplainedVarOld: 0.0206
VF_0_Loss : 0.898


ADV1:  -0.06480930332305872 0.9153590236027269 0.8904466092768225 -3.4133167711511394
ADV2:  0.01713531889570456 0.8913891200205232 0.9516296862364757 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.1210   0.0292   0.1550   0.1774   0.1295   0.0344
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0896   0.0504   0.1797   5.4889   2.1784   2.1397
***** Episode 254, Mean R = -229.7  Std R = 95.6  Min R = -502.8
PolicyLoss: -0.00937
Policy_Beta: 0.0444
Policy_Entropy: 0.000332
Po

ADV1:  0.050496836482497955 0.42851568538421986 0.6234700811553036 -4.084933562738054
ADV2:  0.03046639843950102 0.6990090712037648 1.255259010702916 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0750   0.0184   0.0984   0.1874   0.1295   0.0344
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0864   0.0311   0.1306   5.4889   2.1784   2.1397
***** Episode 502, Mean R = -418.1  Std R = 166.4  Min R = -1038.6
PolicyLoss: -0.0506
Policy_Beta: 0.0444
Policy_Entropy: 0.000351
Policy_KL: 0.000503
Policy_SD: 0.956
Policy_lr_mult: 1
Steps: 9.16e+03
TotalSteps: 8.17e+04
VF_0_ExplainedVarNew: 0.179
VF_0_ExplainedVarOld: 0.153
VF_0_Loss : 0.234


*** RH VIO  CNT:  100
ADV1:  -0.0360718952531697 0.46391378911232345 0.4699704606602313 -3.9429890181086407
ADV2:  0.057209647265912794 0.6718128022659161 1.0363622504958665 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0703   0.0156   0.0966   0.1874   0.1295   0.0344
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0367

***** Episode 750, Mean R = -476.4  Std R = 204.5  Min R = -1088.9
PolicyLoss: -0.0238
Policy_Beta: 0.0667
Policy_Entropy: 0.000367
Policy_KL: 0.00105
Policy_SD: 0.956
Policy_lr_mult: 1
Steps: 1.14e+04
TotalSteps: 1.65e+05
VF_0_ExplainedVarNew: 0.551
VF_0_ExplainedVarOld: 0.504
VF_0_Loss : 0.0732


ADV1:  0.05497924290988992 0.26130705374908403 1.7616070531604533 -4.037419477105888
ADV2:  0.0018996039623441442 0.7779551676979026 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0785   0.0172   0.1082   0.1874   0.1295   0.0344
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0552   0.0307   0.1426   5.4889   2.1784   2.1397
***** Episode 781, Mean R = -490.7  Std R = 165.1  Min R = -938.1
PolicyLoss: -0.0249
Policy_Beta: 0.0667
Policy_Entropy: 0.000366
Policy_KL: 0.001
Policy_SD: 0.956
Policy_lr_mult: 1
Steps: 1.18e+04
TotalSteps: 1.77e+05
VF_0_ExplainedVarNew: 0.487
VF_0_ExplainedVarOld: 0.435
VF_0_Loss : 0.0919


ADV1:  0.01783622575165715 0.20329295196357966 1.433876

ADV1:  -0.042938198616974 0.25478460988904983 1.7742063983281453 -3.7295398362570698
ADV2:  0.04436561943401757 0.7001943556940466 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0704   0.0132   0.0880   0.1874   0.1295   0.0344
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0506   0.0242   0.1141   5.4889   2.1784   2.1397
***** Episode 1029, Mean R = -492.1  Std R = 165.5  Min R = -976.0
PolicyLoss: -0.0368
Policy_Beta: 0.0667
Policy_Entropy: 0.000375
Policy_KL: 0.000962
Policy_SD: 0.956
Policy_lr_mult: 1
Steps: 1.21e+04
TotalSteps: 2.71e+05
VF_0_ExplainedVarNew: 0.548
VF_0_ExplainedVarOld: 0.507
VF_0_Loss : 0.0861


ADV1:  0.021053795261444134 0.21061854876095842 1.907825060698836 -3.6512286953127164
ADV2:  0.003783044826511558 0.7805999172087986 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.1003   0.0295   0.1655   0.1874   0.1295   0.0344
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0277   0.0140   0.0680   5.4889   2.1784   2.1397
*****

***** Episode 1277, Mean R = -483.1  Std R = 139.0  Min R = -724.1
PolicyLoss: -0.0124
Policy_Beta: 0.0667
Policy_Entropy: 0.000386
Policy_KL: 0.000835
Policy_SD: 0.956
Policy_lr_mult: 1
Steps: 1.18e+04
TotalSteps: 3.63e+05
VF_0_ExplainedVarNew: 0.779
VF_0_ExplainedVarOld: 0.754
VF_0_Loss : 0.0473


ADV1:  -0.012732108173998318 0.17798540612003752 1.4920101737976075 -3.1437345301210993
ADV2:  0.025434869033294675 0.7809948063608423 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.1040   0.0258   0.1395   0.1874   0.1295   0.0344
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0243   0.0090   0.0451   5.4889   2.1784   2.1397
***** Episode 1308, Mean R = -490.5  Std R = 197.4  Min R = -970.0
PolicyLoss: -0.0246
Policy_Beta: 0.0667
Policy_Entropy: 0.000387
Policy_KL: 0.00108
Policy_SD: 0.956
Policy_lr_mult: 1
Steps: 1.18e+04
TotalSteps: 3.75e+05
VF_0_ExplainedVarNew: 0.741
VF_0_ExplainedVarOld: 0.715
VF_0_Loss : 0.053


*** RH VIO  CNT:  600
ADV1:  -0.005524389442559394

optical_flow |  0.0000 -0.0000 |  0.0019  0.0019 | -0.0104 -0.0226 |  0.0252  0.0115
v_err    | -0.4729 |  0.1607 | -1.1296 |  0.5220
landing_rewards |    0.00 |    0.00 |    0.00 |    0.00
landing_margin |  910.97 |  238.05 |  155.96 | 1367.56
tracking_rewards | -400.39 |  162.13 | -911.63 | -153.89
steps    |     370 |     152 |     130 |     834
***** Episode 1587, Mean R = -423.9  Std R = 178.0  Min R = -993.8
PolicyLoss: -0.0156
Policy_Beta: 0.0667
Policy_Entropy: 0.000405
Policy_KL: 0.00112
Policy_SD: 0.956
Policy_lr_mult: 1
Steps: 1.02e+04
TotalSteps: 4.77e+05
VF_0_ExplainedVarNew: 0.78
VF_0_ExplainedVarOld: 0.725
VF_0_Loss : 0.0584


ADV1:  0.03671415081683631 0.168636749930977 1.6304986487550572 -1.2378225386111676
ADV2:  0.0017295869347589133 0.8739810790384859 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.1197   0.0375   0.2072   0.2072   0.1329   0.0381
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0462   0.0246   0.1102   5.4889   2.1784   2.1397
***

attitude |   -0.04    0.01    0.02 |    1.75    0.68    1.81 |   -3.14   -1.56   -3.14 |    3.14    1.57    3.14
w        |   -0.00    0.00   -0.00 |    0.02    0.02    0.02 |   -0.08   -0.10   -0.08 |    0.08    0.09    0.08
a_f      |    0.09    0.08 |    0.69    1.84 |   -1.43   -3.14 |    1.40    3.12
w_f      |   -0.00   -0.00   -0.00 |    0.02    0.02    0.02 |   -0.07   -0.10   -0.06 |    0.05    0.05    0.06
w_rewards |   -1.31 |    1.36 |   -8.52 |    0.00
w_penalty |   -0.32 |    5.67 | -100.00 |    0.00
fov_penalty |  -30.65 |   24.35 |  -50.00 |    0.00
theta_cv |    1.49 |    0.69 |    0.01 |    3.13
seeker_angles |    0.06    0.03 |    0.34    0.35 |   -1.00   -1.00 |    1.00    1.00
cs_angles |  0.0555  0.0258 |  0.3358  0.3522 | -0.9998 -1.0000 |  1.0000  0.9999
optical_flow |  0.0007  0.0002 |  0.0029  0.0025 | -0.0484 -0.0366 |  0.1697  0.0469
v_err    | -0.3800 |  0.1955 | -1.1552 |  1.0565
landing_rewards |    0.00 |    0.00 |    0.00 |    0.00
landing_margin |  723

w        |   -0.00    0.00   -0.00 |    0.02    0.02    0.02 |   -0.08   -0.08   -0.08 |    0.08    0.08    0.09
a_f      |    0.08   -0.23 |    0.65    1.75 |   -1.39   -3.13 |    1.44    3.13
w_f      |   -0.00    0.00    0.00 |    0.02    0.02    0.02 |   -0.08   -0.07   -0.06 |    0.05    0.06    0.06
w_rewards |   -0.47 |    0.53 |   -2.70 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |  -45.16 |   14.78 |  -50.00 |    0.00
theta_cv |    1.18 |    0.62 |    0.00 |    3.13
seeker_angles |    0.06    0.03 |    0.35    0.35 |   -1.00   -1.00 |    1.00    1.00
cs_angles |  0.0554  0.0348 |  0.3479  0.3452 | -0.9999 -0.9997 |  0.9999  1.0000
optical_flow |  0.0011  0.0003 |  0.0040  0.0039 | -0.1184 -0.1441 |  0.0809  0.0542
v_err    | -0.2029 |  0.2271 | -1.1536 |  1.0051
landing_rewards |    0.00 |    0.00 |    0.00 |    0.00
landing_margin |  504.95 |  229.82 |   22.88 | 1209.52
tracking_rewards | -220.03 |   81.99 | -626.67 | -105.12
steps    |     291 |  

attitude |   -0.04   -0.02   -0.04 |    1.41    0.67    1.81 |   -3.14   -1.57   -3.14 |    3.14    1.56    3.14
w        |   -0.00    0.00    0.00 |    0.02    0.02    0.02 |   -0.08   -0.07   -0.08 |    0.07    0.07    0.07
a_f      |   -0.03   -0.04 |    0.66    1.81 |   -1.52   -3.13 |    1.46    3.13
w_f      |   -0.00    0.00    0.00 |    0.02    0.02    0.02 |   -0.06   -0.05   -0.05 |    0.05    0.05    0.05
w_rewards |   -0.13 |    0.23 |   -1.41 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |  -45.81 |   13.86 |  -50.00 |    0.00
theta_cv |    0.92 |    0.49 |    0.00 |    3.11
seeker_angles |    0.01    0.02 |    0.34    0.32 |   -1.00   -1.00 |    1.00    1.00
cs_angles |  0.0069  0.0224 |  0.3446  0.3232 | -0.9996 -0.9994 |  1.0000  0.9999
optical_flow |  0.0007  0.0001 |  0.0049  0.0043 | -0.1036 -0.0549 |  0.1179  0.0506
v_err    | -0.0917 |  0.2384 | -1.4010 |  1.0294
landing_rewards |    0.00 |    0.00 |    0.00 |    0.00
landing_margin |  418

attitude |   -0.02   -0.01   -0.09 |    1.27    0.66    1.86 |   -3.14   -1.56   -3.14 |    3.14    1.56    3.14
w        |   -0.00    0.00    0.00 |    0.02    0.02    0.02 |   -0.07   -0.07   -0.07 |    0.06    0.07    0.07
a_f      |   -0.04    0.02 |    0.67    1.88 |   -1.53   -3.12 |    1.46    3.13
w_f      |   -0.00    0.00    0.00 |    0.02    0.02    0.02 |   -0.05   -0.04   -0.04 |    0.05    0.05    0.05
w_rewards |   -0.07 |    0.12 |   -0.85 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |  -45.81 |   13.86 |  -50.00 |    0.00
theta_cv |    0.73 |    0.39 |    0.00 |    2.94
seeker_angles |    0.03    0.01 |    0.35    0.34 |   -1.00   -1.00 |    1.00    1.00
cs_angles |  0.0260  0.0125 |  0.3501  0.3375 | -0.9997 -0.9995 |  0.9998  0.9998
optical_flow |  0.0010  0.0003 |  0.0052  0.0047 | -0.0554 -0.1437 |  0.1463  0.1517
v_err    | -0.0468 |  0.2094 | -1.3324 |  0.9543
landing_rewards |    0.00 |    0.00 |    0.00 |    0.00
landing_margin |  381

attitude |    0.05   -0.05    0.00 |    1.25    0.67    1.82 |   -3.14   -1.57   -3.14 |    3.14    1.56    3.14
w        |   -0.00    0.00    0.00 |    0.02    0.02    0.02 |   -0.07   -0.06   -0.06 |    0.06    0.06    0.07
a_f      |   -0.03   -0.07 |    0.67    1.79 |   -1.47   -3.13 |    1.49    3.12
w_f      |   -0.00   -0.00    0.00 |    0.01    0.01    0.02 |   -0.05   -0.04   -0.05 |    0.04    0.04    0.04
w_rewards |   -0.03 |    0.06 |   -0.40 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |  -45.65 |   14.10 |  -50.00 |    0.00
theta_cv |    0.64 |    0.34 |    0.00 |    2.29
seeker_angles |    0.06    0.03 |    0.36    0.31 |   -1.00   -1.00 |    1.00    1.00
cs_angles |  0.0568  0.0299 |  0.3622  0.3126 | -0.9995 -1.0000 |  0.9997  0.9999
optical_flow |  0.0014  0.0003 |  0.0053  0.0049 | -0.0445 -0.1098 |  0.0679  0.0831
v_err    | -0.0261 |  0.1683 | -0.5666 |  0.7739
landing_rewards |    0.00 |    0.00 |    0.00 |    0.00
landing_margin |  359

w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |  -47.74 |   10.38 |  -50.00 |    0.00
theta_cv |    0.59 |    0.31 |    0.00 |    2.32
seeker_angles |    0.03    0.04 |    0.37    0.33 |   -1.00   -1.00 |    1.00    1.00
cs_angles |  0.0342  0.0356 |  0.3656  0.3265 | -0.9999 -0.9997 |  1.0000  0.9998
optical_flow |  0.0010  0.0003 |  0.0055  0.0048 | -0.0456 -0.1069 |  0.0688  0.0513
v_err    | -0.0253 |  0.1362 | -0.6420 |  0.6393
landing_rewards |    0.00 |    0.00 |    0.00 |    0.00
landing_margin |  332.31 |  150.88 |   14.39 |  815.15
tracking_rewards |  -96.57 |   18.89 | -149.54 |  -57.17
steps    |     238 |      39 |     140 |     355
***** Episode 3447, Mean R = -156.7  Std R = 18.6  Min R = -200.9
PolicyLoss: -0.0268
Policy_Beta: 0.0667
Policy_Entropy: 0.00123
Policy_KL: 0.00106
Policy_SD: 0.958
Policy_lr_mult: 1
Steps: 7.7e+03
TotalSteps: 9.8e+05
VF_0_ExplainedVarNew: 0.968
VF_0_ExplainedVarOld: 0.959
VF_0_Loss : 0.11


ADV1:  0.008032099744487462 0.085190

attitude |    0.05    0.05    0.08 |    1.34    0.69    1.93 |   -3.14   -1.57   -3.14 |    3.14    1.56    3.14
w        |   -0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.06   -0.05   -0.06 |    0.06    0.06    0.05
a_f      |    0.04   -0.06 |    0.71    1.89 |   -1.51   -3.14 |    1.47    3.13
w_f      |   -0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.03   -0.04   -0.04 |    0.04    0.05    0.04
w_rewards |   -0.01 |    0.02 |   -0.12 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |  -48.71 |    7.93 |  -50.00 |    0.00
theta_cv |    0.55 |    0.29 |    0.00 |    1.88
seeker_angles |    0.01   -0.00 |    0.36    0.32 |   -1.00   -1.00 |    1.00    1.00
cs_angles |  0.0098 -0.0023 |  0.3572  0.3188 | -0.9997 -1.0000 |  0.9999  0.9999
optical_flow |  0.0005  0.0000 |  0.0059  0.0056 | -0.0509 -0.0991 |  0.1790  0.1405
v_err    | -0.0246 |  0.1189 | -0.5622 |  0.6306
landing_rewards |    0.00 |    0.00 |    0.00 |    0.00
landing_margin |  283

theta_cv |    0.54 |    0.28 |    0.00 |    2.29
seeker_angles |   -0.03    0.05 |    0.34    0.32 |   -1.00   -1.00 |    1.00    1.00
cs_angles | -0.0333  0.0456 |  0.3417  0.3246 | -0.9995 -0.9995 |  1.0000  0.9999
optical_flow |  0.0004  0.0002 |  0.0068  0.0067 | -0.1586 -0.2263 |  0.1320  0.0859
v_err    | -0.0264 |  0.1078 | -0.6246 |  0.6562
landing_rewards |    0.00 |    0.00 |    0.00 |    0.00
landing_margin |  250.55 |  139.76 |    8.99 |  623.19
tracking_rewards |  -87.63 |   18.97 | -154.03 |  -49.05
steps    |     260 |      46 |     154 |     364
***** Episode 4067, Mean R = -144.1  Std R = 22.2  Min R = -202.0
PolicyLoss: 0.0175
Policy_Beta: 0.0667
Policy_Entropy: 0.00182
Policy_KL: 0.00105
Policy_SD: 0.957
Policy_lr_mult: 1
Steps: 7.92e+03
TotalSteps: 1.14e+06
VF_0_ExplainedVarNew: 0.911
VF_0_ExplainedVarOld: 0.898
VF_0_Loss : 0.112


ADV1:  0.007525228021886782 0.13449132908300948 1.9821672121683755 -0.9708150540769798
ADV2:  -0.03459221110422022 0.6286370322335948 3.

glideslope |    4.19 |   17.45 |    0.01 |  177.09
norm_af  |    1.73 |    0.87 |    0.03 |    3.24
norm_wf  |    0.02 |    0.01 |    0.00 |    0.05
rh_penalty |    0.00 |    0.00 |    0.00 |    0.00
att_rewards |    0.00 |    0.00 |    0.00 |    0.00
att_penalty |    0.00 |    0.00 |    0.00 |    0.00
attitude |    0.02   -0.03    0.08 |    1.21    0.69    1.79 |   -3.14   -1.56   -3.14 |    3.14    1.56    3.14
w        |   -0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.05   -0.06   -0.06 |    0.06    0.06    0.06
a_f      |   -0.05    0.11 |    0.67    1.81 |   -1.44   -3.14 |    1.42    3.14
w_f      |   -0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.03   -0.04   -0.04 |    0.03    0.04    0.05
w_rewards |   -0.00 |    0.02 |   -0.15 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |  -48.06 |    9.65 |  -50.00 |    0.00
theta_cv |    0.53 |    0.28 |    0.00 |    2.78
seeker_angles |   -0.04    0.03 |    0.32    0.32 |   -1.00   -1.00 |    1.

attitude |   -0.02   -0.01    0.08 |    1.11    0.64    1.79 |   -3.14   -1.57   -3.14 |    3.14    1.57    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.05   -0.05   -0.06 |    0.05    0.06    0.06
a_f      |    0.02    0.27 |    0.64    1.74 |   -1.37   -3.06 |    1.52    3.14
w_f      |    0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.04   -0.04   -0.04 |    0.04    0.04    0.04
w_rewards |   -0.00 |    0.01 |   -0.12 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |  -48.23 |    9.25 |  -50.00 |    0.00
theta_cv |    0.54 |    0.28 |    0.00 |    2.46
seeker_angles |   -0.04    0.02 |    0.33    0.33 |   -1.00   -1.00 |    1.00    1.00
cs_angles | -0.0386  0.0226 |  0.3323  0.3309 | -1.0000 -0.9999 |  1.0000  0.9998
optical_flow | -0.0002  0.0001 |  0.0086  0.0087 | -0.2605 -0.1552 |  0.2361  0.3554
v_err    | -0.0253 |  0.0989 | -0.4818 |  0.7386
landing_rewards |    0.00 |    0.00 |    0.00 |    0.00
landing_margin |  206

w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.06   -0.06   -0.05 |    0.05    0.05    0.07
a_f      |   -0.01    0.01 |    0.69    1.82 |   -1.40   -3.14 |    1.51    3.11
w_f      |   -0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.04   -0.03   -0.03 |    0.04    0.04    0.04
w_rewards |   -0.00 |    0.02 |   -0.17 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |  -47.90 |   10.02 |  -50.00 |    0.00
theta_cv |    0.55 |    0.30 |    0.00 |    2.27
seeker_angles |   -0.04    0.04 |    0.33    0.32 |   -1.00   -1.00 |    1.00    1.00
cs_angles | -0.0439  0.0355 |  0.3262  0.3181 | -0.9999 -1.0000 |  1.0000  1.0000
optical_flow | -0.0001  0.0005 |  0.0092  0.0090 | -0.1546 -0.2207 |  0.2688  0.3452
v_err    | -0.0252 |  0.0962 | -0.6675 |  0.6551
landing_rewards |    0.00 |    0.00 |    0.00 |    0.00
landing_margin |  185.64 |  125.86 |    5.51 |  563.82
tracking_rewards |  -84.80 |   18.06 | -149.89 |  -47.37
steps    |     284 |  

w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.06   -0.05   -0.06 |    0.05    0.06    0.06
a_f      |    0.00    0.02 |    0.68    1.87 |   -1.50   -3.14 |    1.56    3.14
w_f      |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.03   -0.03 |    0.03    0.04    0.04
w_rewards |   -0.00 |    0.01 |   -0.13 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |  -47.10 |   11.69 |  -50.00 |    0.00
theta_cv |    0.56 |    0.30 |    0.00 |    2.38
seeker_angles |   -0.04    0.00 |    0.32    0.33 |   -1.00   -1.00 |    1.00    1.00
cs_angles | -0.0365  0.0033 |  0.3227  0.3291 | -0.9999 -0.9998 |  0.9999  0.9997
optical_flow |  0.0001  0.0000 |  0.0092  0.0094 | -0.1857 -0.1596 |  0.3139  0.3705
v_err    | -0.0255 |  0.0944 | -0.4678 |  0.6399
landing_rewards |    0.00 |    0.00 |    0.00 |    0.00
landing_margin |  194.21 |  133.95 |    7.83 |  543.43
tracking_rewards |  -83.49 |   19.64 | -150.97 |  -44.19
steps    |     283 |  

attitude |    0.07   -0.01   -0.14 |    1.20    0.65    1.86 |   -3.14   -1.57   -3.14 |    3.14    1.56    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.02   -0.06 |    0.66    1.85 |   -1.41   -3.12 |    1.49    3.13
w_f      |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.04   -0.04   -0.03 |    0.03    0.03    0.04
w_rewards |   -0.00 |    0.01 |   -0.05 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |  -45.32 |   14.56 |  -50.00 |    0.00
theta_cv |    0.55 |    0.30 |    0.00 |    2.84
seeker_angles |   -0.03   -0.02 |    0.31    0.31 |   -1.00   -1.00 |    1.00    1.00
cs_angles | -0.0314 -0.0235 |  0.3128  0.3141 | -0.9998 -1.0000 |  0.9998  0.9997
optical_flow |  0.0002  0.0000 |  0.0094  0.0102 | -0.2366 -0.2154 |  0.1664  0.3813
v_err    | -0.0222 |  0.0935 | -0.4768 |  0.5884
landing_rewards |    0.00 |    0.00 |    0.00 |    0.00
landing_margin |  170

glideslope |    3.76 |   17.51 |    0.01 | 2204.04
norm_af  |    1.72 |    0.88 |    0.13 |    3.39
norm_wf  |    0.02 |    0.01 |    0.00 |    0.05
rh_penalty |    0.00 |    0.00 |    0.00 |    0.00
att_rewards |    0.00 |    0.00 |    0.00 |    0.00
att_penalty |    0.00 |    0.00 |    0.00 |    0.00
attitude |    0.05   -0.04   -0.03 |    1.21    0.68    1.86 |   -3.14   -1.56   -3.14 |    3.14    1.57    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.05   -0.06   -0.05 |    0.05    0.06    0.05
a_f      |   -0.03   -0.02 |    0.66    1.82 |   -1.50   -3.13 |    1.39    3.11
w_f      |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.05   -0.03 |    0.03    0.03    0.04
w_rewards |   -0.00 |    0.01 |   -0.07 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |  -45.81 |   13.86 |  -50.00 |    0.00
theta_cv |    0.58 |    0.32 |    0.00 |    2.57
seeker_angles |   -0.04   -0.03 |    0.32    0.33 |   -1.00   -1.00 |    1.

w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.05   -0.06   -0.05 |    0.05    0.05    0.05
a_f      |   -0.04    0.17 |    0.65    1.87 |   -1.43   -3.14 |    1.49    3.14
w_f      |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.05   -0.03   -0.03 |    0.03    0.04    0.03
w_rewards |   -0.00 |    0.01 |   -0.09 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |  -45.81 |   13.86 |  -50.00 |    0.00
theta_cv |    0.59 |    0.32 |    0.00 |    2.67
seeker_angles |   -0.04   -0.01 |    0.32    0.32 |   -1.00   -1.00 |    1.00    1.00
cs_angles | -0.0399 -0.0142 |  0.3162  0.3192 | -0.9993 -1.0000 |  0.9992  1.0000
optical_flow |  0.0001 -0.0000 |  0.0101  0.0106 | -0.1582 -0.1297 |  0.3484  0.7225
v_err    | -0.0219 |  0.0899 | -0.4828 |  0.8092
landing_rewards |    0.00 |    0.00 |    0.00 |    0.00
landing_margin |  150.93 |  101.52 |    1.05 |  557.23
tracking_rewards |  -84.18 |   18.09 | -138.42 |  -47.60
steps    |     304 |  

w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.05   -0.05   -0.05 |    0.05    0.06    0.05
a_f      |    0.05    0.17 |    0.67    1.86 |   -1.50   -3.14 |    1.48    3.13
w_f      |   -0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.03   -0.03   -0.03 |    0.03    0.03    0.03
w_rewards |   -0.00 |    0.01 |   -0.10 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |  -44.52 |   15.62 |  -50.00 |    0.00
theta_cv |    0.58 |    0.32 |    0.00 |    2.43
seeker_angles |   -0.04   -0.02 |    0.31    0.31 |   -1.00   -1.00 |    1.00    1.00
cs_angles | -0.0420 -0.0188 |  0.3108  0.3076 | -0.9997 -0.9993 |  0.9999  0.9997
optical_flow |  0.0001  0.0001 |  0.0103  0.0112 | -0.1915 -0.2470 |  0.2114  0.4603
v_err    | -0.0210 |  0.0886 | -0.4701 |  0.6257
landing_rewards |    0.00 |    0.00 |    0.00 |    0.00
landing_margin |  148.35 |  110.26 |   12.06 |  512.33
tracking_rewards |  -80.90 |   17.12 | -129.49 |  -45.97
steps    |     303 |  

w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.01    0.09 |    0.69    1.79 |   -1.32   -3.12 |    1.41    3.13
w_f      |   -0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.03   -0.03   -0.03 |    0.05    0.03    0.03
w_rewards |   -0.00 |    0.00 |   -0.04 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |  -45.32 |   14.56 |  -50.00 |    0.00
theta_cv |    0.60 |    0.32 |    0.00 |    2.60
seeker_angles |   -0.04   -0.03 |    0.31    0.31 |   -1.00   -1.00 |    1.00    1.00
cs_angles | -0.0416 -0.0320 |  0.3118  0.3065 | -0.9993 -0.9996 |  0.9999  0.9996
optical_flow |  0.0003 -0.0000 |  0.0110  0.0111 | -0.3499 -0.1709 |  0.3026  0.3078
v_err    | -0.0227 |  0.0879 | -1.6857 |  0.8903
landing_rewards |    0.00 |    0.00 |    0.00 |    0.00
landing_margin |  138.91 |  104.49 |    7.66 |  742.34
tracking_rewards |  -81.30 |   16.77 | -133.24 |  -43.03
steps    |     308 |  

norm_thrust |    1.58 |    0.68 |    0.00 |    3.46
fuel     |    4.46 |    0.75 |    2.08 |    5.69
rewards  | -137.50 |   20.50 | -207.38 |  -73.12
fuel_rewards |  -12.77 |    2.14 |  -16.27 |   -5.95
glideslope_rewards |    0.00 |    0.00 |    0.00 |    0.00
glideslope_penalty |    0.00 |    0.00 |    0.00 |    0.00
glideslope |    3.65 |   15.73 |    0.01 |  472.70
norm_af  |    1.69 |    0.90 |    0.06 |    3.41
norm_wf  |    0.02 |    0.01 |    0.00 |    0.05
rh_penalty |    0.00 |    0.00 |    0.00 |    0.00
att_rewards |    0.00 |    0.00 |    0.00 |    0.00
att_penalty |    0.00 |    0.00 |    0.00 |    0.00
attitude |    0.06   -0.05   -0.18 |    1.13    0.62    1.83 |   -3.14   -1.56   -3.14 |    3.14    1.55    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.05   -0.05   -0.05 |    0.06    0.05    0.05
a_f      |   -0.04   -0.15 |    0.62    1.81 |   -1.41   -3.12 |    1.49    3.13
w_f      |   -0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.

ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0247   0.0112   0.0464   5.4889   2.1784   2.1397
Update Cnt = 240    ET =    977.7   Stats:  Mean, Std, Min, Max
r_f      |  -10.36   18.67    5.93 |  235.81  210.50  269.33 | -736.46 -564.33 -716.82 |  661.93  704.99  741.12
v_f      |   -0.01    0.01   -0.02 |    0.34    0.37    0.38 |   -1.18   -1.01   -1.49 |    0.90    0.97    0.95
r_i      |   -8.52   40.68  -11.70 |  673.04  617.03  805.82 |-1306.22-1244.76-1308.35 | 1273.29 1320.11 1320.78
v_i      |    0.00   -0.00   -0.00 |    0.04    0.04    0.05 |   -0.10   -0.10   -0.10 |    0.10    0.08    0.10
norm_rf  |  134.89 |   93.43 |    4.39 |  472.01
norm_vf  |    0.59 |    0.22 |    0.22 |    1.72
gs_f     |    1.04 |    1.42 |    0.02 |   14.64
thrust   |    0.00   -0.00   -0.00 |    0.99    1.00    1.00 |   -3.42   -3.42   -3.45 |    3.46    3.39    3.43
norm_thrust |    1.59 |    0.68 |    0.00 |    3.46
fuel     |    4.52 |    0.63 |    2.23 |    5.79
rewards  | -138.23 |

ADV1:  -0.009664514660991944 0.13321188854716562 1.1112339242173688 -1.2431650177637756
ADV2:  0.016293211449341958 0.7477225920106162 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.3292   0.0698   0.4972   1.3611   0.5735   0.2833
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0206   0.0064   0.0350   5.4889   2.1784   2.1397
***** Episode 7756, Mean R = -144.3  Std R = 14.4  Min R = -168.7
PolicyLoss: -0.0146
Policy_Beta: 0.0667
Policy_Entropy: 0.00546
Policy_KL: 0.000862
Policy_SD: 0.954
Policy_lr_mult: 1
Steps: 1.01e+04
TotalSteps: 2.23e+06
VF_0_ExplainedVarNew: 0.929
VF_0_ExplainedVarOld: 0.893
VF_0_Loss : 0.119


ADV1:  0.002109026647134351 0.12044410830976678 1.376494107246399 -1.3493617200851462
ADV2:  -0.01043222875459404 0.7372354139895556 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.3807   0.1164   0.7320   1.3611   0.5735   0.2833
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0144   0.0040   0.0211   5.4889   2.1784   2.1397
Upda

ADV1:  -0.010246528790839862 0.21598402299472708 1.794432339668274 -3.7792227579424864
ADV2:  0.02324647995047948 0.6288270025309209 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.3572   0.0768   0.4880   1.3611   0.5735   0.2833
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0264   0.0082   0.0465   5.4889   2.1784   2.1397
***** Episode 8035, Mean R = -142.7  Std R = 19.6  Min R = -227.2
PolicyLoss: -0.0238
Policy_Beta: 0.0667
Policy_Entropy: 0.0061
Policy_KL: 0.00103
Policy_SD: 0.954
Policy_lr_mult: 1
Steps: 9.89e+03
TotalSteps: 2.32e+06
VF_0_ExplainedVarNew: 0.84
VF_0_ExplainedVarOld: 0.744
VF_0_Loss : 0.172


ADV1:  0.016547093871969232 0.1850462304477287 2.242373612721761 -0.8304564204045726
ADV2:  -0.048314186695548385 0.6797065614432123 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.4146   0.1248   0.6020   1.3611   0.5735   0.2833
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0431   0.0148   0.0884   5.4889   2.1784   2.1397
***** Epi

Dynamics: Max Disturbance (m/s^2):  [0.00118983 0.00181235 0.00221757] 0.003101278765112381
ADV1:  -0.0011336972180269317 0.1432971650271722 1.0844939671316352 -1.6697202870074759
ADV2:  0.012609561650323915 0.7566357138567402 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.4641   0.1194   0.7415   1.3611   0.5735   0.2833
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0236   0.0044   0.0326   5.4889   2.1784   2.1397
***** Episode 8314, Mean R = -143.3  Std R = 17.6  Min R = -191.8
PolicyLoss: -0.0163
Policy_Beta: 0.0667
Policy_Entropy: 0.00633
Policy_KL: 0.000883
Policy_SD: 0.954
Policy_lr_mult: 1
Steps: 9.79e+03
TotalSteps: 2.4e+06
VF_0_ExplainedVarNew: 0.907
VF_0_ExplainedVarOld: 0.874
VF_0_Loss : 0.208


ADV1:  0.016514085811584287 0.13811668694043255 2.1405059973398846 -1.0352607981363953
ADV2:  -0.018514915280493382 0.7505692371908878 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.4490   0.1402   0.7858   1.3611   0.5735   0.2833
ValFun  Gradie

ADV1:  0.010921004202391553 0.14197449778161425 1.9701858612906016 -1.168352009455365
ADV2:  -0.0174280314825555 0.7428699544619589 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.3460   0.0784   0.5230   1.4664   0.7138   0.2972
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0248   0.0113   0.0445   5.4889   2.1784   2.1397
***** Episode 8593, Mean R = -135.2  Std R = 14.4  Min R = -167.9
PolicyLoss: 0.00815
Policy_Beta: 0.0667
Policy_Entropy: 0.00668
Policy_KL: 0.000939
Policy_SD: 0.951
Policy_lr_mult: 1
Steps: 9.41e+03
TotalSteps: 2.49e+06
VF_0_ExplainedVarNew: 0.91
VF_0_ExplainedVarOld: 0.877
VF_0_Loss : 0.165


Dynamics: Max Disturbance (m/s^2):  [0.00118983 0.00181235 0.00221757] 0.003101278765112381
ADV1:  0.004654709176619674 0.145975134952341 1.9832707627614339 -0.7440308393988802
ADV2:  -0.029580176987212957 0.7346358133914707 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.4322   0.1415   0.8368   1.4664   0.7138   0.2972
ValFun  Gradients: 

ADV1:  0.008901278616948989 0.18980303474925275 2.393110154469808 -1.7230371260643027
ADV2:  -0.027058470217914996 0.7040580133838303 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.4983   0.1768   1.0194   1.4664   0.7138   0.2972
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0270   0.0107   0.0413   5.4889   2.1784   2.1397
***** Episode 8872, Mean R = -136.9  Std R = 26.7  Min R = -194.1
PolicyLoss: 0.0224
Policy_Beta: 0.0667
Policy_Entropy: 0.00723
Policy_KL: 0.000937
Policy_SD: 0.951
Policy_lr_mult: 1
Steps: 1.01e+04
TotalSteps: 2.58e+06
VF_0_ExplainedVarNew: 0.795
VF_0_ExplainedVarOld: 0.746
VF_0_Loss : 0.132


ADV1:  -0.044415646836580835 0.1499345587501249 0.7177829482543169 -1.8708683864275635
ADV2:  0.053278952461671095 0.7893482810291389 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.3316   0.9317   2.9177   2.9177   1.3316   0.9317
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0559   0.0262   0.1153   5.4889   2.1784   2.1397
*****

ADV1:  -0.0075925558104550294 0.13459344235086138 2.224185669673631 -1.178853098970479
ADV2:  0.017926959072329603 0.7110702883725897 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.3555   0.1071   0.6842   2.9177   1.3316   0.9317
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0158   0.0059   0.0262   5.4889   2.1784   2.1397
***** Episode 9151, Mean R = -133.1  Std R = 18.3  Min R = -188.0
PolicyLoss: -0.017
Policy_Beta: 0.0667
Policy_Entropy: 0.00744
Policy_KL: 0.00093
Policy_SD: 0.948
Policy_lr_mult: 1
Steps: 1.03e+04
TotalSteps: 2.67e+06
VF_0_ExplainedVarNew: 0.918
VF_0_ExplainedVarOld: 0.889
VF_0_Loss : 0.167


ADV1:  0.021768656267448984 0.13782735138585506 2.1774490451812745 -1.4715730571746848
ADV2:  -0.023316277507402738 0.7635659721902014 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.2780   0.0825   0.5646   2.9177   1.3316   0.9317
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0267   0.0136   0.0608   5.4889   2.1784   2.1397
*****

ADV1:  0.024161552564658142 0.199481905367531 2.1897171115875245 -1.5552342565854413
ADV2:  -0.045165378653487465 0.6896128720734863 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.4947   0.1111   0.8156   2.9177   1.3316   0.9317
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0470   0.0157   0.0881   5.4889   2.1784   2.1397
***** Episode 9430, Mean R = -130.1  Std R = 27.3  Min R = -171.2
PolicyLoss: 0.0364
Policy_Beta: 0.0667
Policy_Entropy: 0.00739
Policy_KL: 0.000959
Policy_SD: 0.947
Policy_lr_mult: 1
Steps: 1.04e+04
TotalSteps: 2.76e+06
VF_0_ExplainedVarNew: 0.819
VF_0_ExplainedVarOld: 0.723
VF_0_Loss : 0.0947


ADV1:  -0.030592977245611087 0.1865654598302092 2.24394500096639 -1.9228661318986253
ADV2:  0.019435629525198415 0.6842755004225036 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.3522   0.1104   0.5498   2.9177   1.3316   0.9317
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0547   0.0222   0.0897   5.4889   2.1784   2.1397
***** E

ADV1:  0.00761677893422157 0.17276042984984397 2.193659521629689 -1.1149161882560596
ADV2:  -0.03385660596339483 0.6921306632384583 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.3423   0.1284   0.6271   2.9177   1.3316   0.9317
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0198   0.0109   0.0615   5.4889   2.1784   2.1397
***** Episode 9709, Mean R = -129.6  Std R = 24.5  Min R = -164.6
PolicyLoss: 0.0299
Policy_Beta: 0.0667
Policy_Entropy: 0.00742
Policy_KL: 0.000893
Policy_SD: 0.947
Policy_lr_mult: 1
Steps: 1.06e+04
TotalSteps: 2.85e+06
VF_0_ExplainedVarNew: 0.844
VF_0_ExplainedVarOld: 0.796
VF_0_Loss : 0.0892


ADV1:  -0.009149495019738468 0.18047080507020324 2.1019846185048423 -1.2495057598749817
ADV2:  -0.014970231843048491 0.7297672537756725 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.5041   0.2092   1.1170   2.9177   1.3316   0.9317
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0218   0.0118   0.0536   5.4889   2.1784   2.1397
****

ADV1:  -0.02945947090522738 0.16177933449140763 1.8413206626043472 -1.503114380441076
ADV2:  0.023107173428051537 0.7565519505407078 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.6172   0.2784   1.5669   2.9177   1.3316   0.9317
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0377   0.0159   0.0761   5.4889   2.1784   2.1397
***** Episode 9988, Mean R = -130.7  Std R = 19.7  Min R = -173.7
PolicyLoss: -0.0109
Policy_Beta: 0.0667
Policy_Entropy: 0.00832
Policy_KL: 0.00121
Policy_SD: 0.944
Policy_lr_mult: 1
Steps: 1.01e+04
TotalSteps: 2.94e+06
VF_0_ExplainedVarNew: 0.887
VF_0_ExplainedVarOld: 0.828
VF_0_Loss : 0.147


ADV1:  0.007307035319397753 0.1362777081977229 1.9140640179316202 -1.7104740166664145
ADV2:  -0.004424778404236587 0.7319578778499497 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.3697   0.1131   0.6609   2.9177   1.3316   0.9317
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0144   0.0049   0.0258   5.4889   2.1784   2.1397
***** 

optical_flow | -0.0003  0.0001 |  0.0158  0.0143 | -0.5562 -0.4668 |  0.8107  0.5902
v_err    | -0.0174 |  0.0774 | -0.5053 |  0.6918
landing_rewards |    0.00 |    0.00 |    0.00 |    0.00
landing_margin |   80.22 |   91.45 |    0.04 |  493.89
tracking_rewards |  -74.25 |   14.72 | -121.73 |  -40.06
steps    |     329 |      40 |     160 |     406
***** Episode 10267, Mean R = -131.0  Std R = 25.4  Min R = -174.3
PolicyLoss: -0.00332
Policy_Beta: 0.0667
Policy_Entropy: 0.00838
Policy_KL: 0.00109
Policy_SD: 0.941
Policy_lr_mult: 1
Steps: 1.02e+04
TotalSteps: 3.03e+06
VF_0_ExplainedVarNew: 0.854
VF_0_ExplainedVarOld: 0.818
VF_0_Loss : 0.152


ADV1:  -0.00278094700954348 0.15960128900244147 1.5487270339330037 -1.2289792770184689
ADV2:  -0.013505420364101045 0.7435129327548263 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.4740   0.1371   0.7882   2.9177   1.3316   0.9317
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0166   0.0033   0.0205   5.4889   2.1784   2.1397


w        |   -0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.07   -0.05   -0.05 |    0.06    0.05    0.05
a_f      |   -0.00   -0.07 |    0.63    1.81 |   -1.46   -3.13 |    1.35    3.14
w_f      |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.05   -0.03   -0.03 |    0.05    0.05    0.03
w_rewards |   -0.00 |    0.05 |   -0.80 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |  -43.55 |   16.76 |  -50.00 |    0.00
theta_cv |    0.60 |    0.31 |    0.00 |    3.06
seeker_angles |   -0.05   -0.01 |    0.29    0.27 |   -1.00   -1.00 |    1.00    1.00
cs_angles | -0.0495 -0.0133 |  0.2866  0.2700 | -1.0000 -0.9996 |  0.9994  0.9999
optical_flow | -0.0005  0.0003 |  0.0160  0.0155 | -0.3777 -0.5521 |  0.8935  0.5853
v_err    | -0.0169 |  0.0770 | -0.5180 |  0.7024
landing_rewards |    0.06 |    0.80 |    0.00 |   10.00
landing_margin |   75.62 |   94.23 |   -0.05 |  511.21
tracking_rewards |  -73.12 |   15.88 | -141.92 |  -39.60
steps    |     328 |  

w        |   -0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.08   -0.05   -0.05 |    0.06    0.05    0.05
a_f      |   -0.01    0.02 |    0.64    1.82 |   -1.50   -3.13 |    1.46    3.14
w_f      |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.08   -0.03   -0.03 |    0.06    0.04    0.02
w_rewards |   -0.00 |    0.03 |   -0.47 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |  -42.58 |   17.77 |  -50.00 |    0.00
theta_cv |    0.59 |    0.30 |    0.00 |    2.89
seeker_angles |   -0.04   -0.01 |    0.28    0.27 |   -1.00   -1.00 |    1.00    1.00
cs_angles | -0.0386 -0.0148 |  0.2813  0.2689 | -0.9998 -0.9992 |  0.9997  0.9995
optical_flow | -0.0003 -0.0001 |  0.0167  0.0157 | -0.3726 -0.6268 |  0.7333  0.5771
v_err    | -0.0156 |  0.0751 | -0.5006 |  0.5293
landing_rewards |    0.06 |    0.80 |    0.00 |   10.00
landing_margin |   64.83 |   85.29 |   -0.04 |  523.05
tracking_rewards |  -72.99 |   13.90 | -113.62 |  -41.51
steps    |     333 |  

attitude |    0.05   -0.05   -0.15 |    1.23    0.65    1.86 |   -3.14   -1.57   -3.14 |    3.14    1.57    3.14
w        |   -0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.08   -0.05   -0.05 |    0.06    0.05    0.05
a_f      |   -0.03   -0.14 |    0.67    1.87 |   -1.51   -3.12 |    1.37    3.11
w_f      |    0.00    0.00    0.00 |    0.02    0.01    0.01 |   -0.08   -0.04   -0.03 |    0.06    0.04    0.04
w_rewards |   -0.00 |    0.04 |   -0.53 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |  -40.16 |   19.88 |  -50.00 |    0.00
theta_cv |    0.57 |    0.30 |    0.00 |    3.12
seeker_angles |   -0.03   -0.01 |    0.26    0.25 |   -1.00   -1.00 |    1.00    1.00
cs_angles | -0.0345 -0.0086 |  0.2643  0.2549 | -0.9998 -0.9995 |  0.9988  0.9997
optical_flow | -0.0002  0.0002 |  0.0180  0.0179 | -0.5262 -0.7218 |  1.4888  0.7432
v_err    | -0.0147 |  0.0739 | -0.4986 |  0.4855
landing_rewards |    0.23 |    1.49 |    0.00 |   10.00
landing_margin |   47

w        |   -0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.05   -0.07   -0.07 |    0.07    0.07    0.05
a_f      |    0.09   -0.06 |    0.63    1.87 |   -1.38   -3.13 |    1.47    3.12
w_f      |    0.00    0.00    0.00 |    0.02    0.01    0.01 |   -0.05   -0.03   -0.03 |    0.07    0.04    0.04
w_rewards |   -0.02 |    0.21 |   -3.16 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |  -37.74 |   21.51 |  -50.00 |    0.00
theta_cv |    0.59 |    0.30 |    0.00 |    2.90
seeker_angles |   -0.03    0.00 |    0.27    0.26 |   -1.00   -1.00 |    1.00    1.00
cs_angles | -0.0347  0.0036 |  0.2676  0.2610 | -0.9993 -0.9991 |  1.0000  0.9995
optical_flow | -0.0006  0.0000 |  0.0175  0.0179 | -0.4745 -0.5207 |  1.0013  0.6453
v_err    | -0.0139 |  0.0783 | -0.5046 |  1.3972
landing_rewards |    0.32 |    1.77 |    0.00 |   10.00
landing_margin |   43.92 |   62.00 |   -0.05 |  461.21
tracking_rewards |  -72.33 |   16.27 | -139.76 |  -34.46
steps    |     342 |  

w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.06   -0.05   -0.05 |    0.07    0.05    0.05
a_f      |    0.01    0.05 |    0.67    1.82 |   -1.40   -3.13 |    1.54    3.12
w_f      |    0.00    0.00    0.00 |    0.02    0.01    0.01 |   -0.06   -0.03   -0.05 |    0.07    0.05    0.04
w_rewards |   -0.00 |    0.01 |   -0.21 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |  -36.61 |   22.14 |  -50.00 |    0.00
theta_cv |    0.57 |    0.29 |    0.00 |    2.66
seeker_angles |   -0.04    0.00 |    0.26    0.25 |   -1.00   -1.00 |    1.00    1.00
cs_angles | -0.0389  0.0032 |  0.2606  0.2550 | -0.9995 -1.0000 |  0.9998  0.9995
optical_flow | -0.0002  0.0001 |  0.0197  0.0193 | -0.8781 -1.2316 |  0.7395  1.2442
v_err    | -0.0158 |  0.0747 | -0.4982 |  1.1839
landing_rewards |    0.48 |    2.15 |    0.00 |   10.00
landing_margin |   39.92 |   62.25 |   -0.07 |  520.28
tracking_rewards |  -71.90 |   15.06 | -116.25 |  -40.03
steps    |     348 |  

attitude |    0.05   -0.04   -0.06 |    1.09    0.67    1.76 |   -3.14   -1.57   -3.14 |    3.14    1.56    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.07   -0.05   -0.05 |    0.06    0.05    0.05
a_f      |   -0.00   -0.05 |    0.69    1.76 |   -1.57   -3.12 |    1.50    3.12
w_f      |   -0.00    0.00    0.00 |    0.02    0.01    0.01 |   -0.07   -0.03   -0.04 |    0.06    0.04    0.04
w_rewards |   -0.00 |    0.02 |   -0.27 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |  -32.58 |   23.82 |  -50.00 |    0.00
theta_cv |    0.57 |    0.29 |    0.00 |    2.99
seeker_angles |   -0.04   -0.01 |    0.26    0.24 |   -1.00   -1.00 |    1.00    1.00
cs_angles | -0.0441 -0.0094 |  0.2603  0.2425 | -0.9994 -0.9999 |  0.9995  0.9966
optical_flow | -0.0004 -0.0001 |  0.0205  0.0208 | -0.8585 -0.7948 |  0.8054  1.1798
v_err    | -0.0167 |  0.0730 | -0.5283 |  0.5802
landing_rewards |    1.00 |    3.00 |    0.00 |   10.00
landing_margin |   31

thrust   |    0.01   -0.00   -0.00 |    0.99    0.98    0.99 |   -3.39   -3.46   -3.32 |    3.37    3.44    3.46
norm_thrust |    1.56 |    0.69 |    0.00 |    3.46
fuel     |    4.49 |    0.44 |    2.25 |    5.44
rewards  | -111.14 |   36.57 | -184.53 |  -36.94
fuel_rewards |  -12.85 |    1.26 |  -15.57 |   -6.42
glideslope_rewards |    0.00 |    0.00 |    0.00 |    0.00
glideslope_penalty |    0.00 |    0.00 |    0.00 |    0.00
glideslope |    3.14 |   14.20 |    0.01 |  438.16
norm_af  |    1.73 |    0.90 |    0.08 |    3.30
norm_wf  |    0.02 |    0.01 |    0.00 |    0.09
rh_penalty |    0.00 |    0.00 |    0.00 |    0.00
att_rewards |    0.00 |    0.00 |    0.00 |    0.00
att_penalty |    0.00 |    0.00 |    0.00 |    0.00
attitude |   -0.05   -0.01   -0.03 |    1.16    0.67    1.81 |   -3.14   -1.57   -3.14 |    3.14    1.57    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.09   -0.05   -0.05 |    0.06    0.05    0.05
a_f      |   -0.02    0.06 |    0.68

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.5629   0.1422   1.0241   2.9177   1.3316   0.9317
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0479   0.0234   0.0982   5.4889   2.1784   2.1397
Update Cnt = 410    ET =    922.6   Stats:  Mean, Std, Min, Max
r_f      |  -13.78   15.51   -3.88 |  191.24  183.20  210.99 | -404.20 -394.47 -719.34 |  435.49  573.72  397.05
v_f      |    0.01   -0.00    0.01 |    0.20    0.22    0.21 |   -0.72   -0.85   -0.58 |    0.86    0.91    0.81
r_i      |  -20.01   56.77   -1.48 |  652.20  667.86  786.19 |-1283.37-1261.24-1326.81 | 1211.88 1325.44 1378.60
v_i      |    0.00   -0.00    0.00 |    0.04    0.04    0.05 |   -0.09   -0.08   -0.09 |    0.09    0.09    0.09
norm_rf  |   22.29 |   45.75 |    0.09 |  394.16
norm_vf  |    0.28 |    0.22 |    0.02 |    1.17
gs_f     |    1.09 |    1.26 |    0.04 |    9.22
thrust   |   -0.00   -0.00    0.00 |    0.99    0.97    0.98 |   -3.39   -3.46   -3.45 |    3.36    3.46    3.44
norm_thrust |    1

ADV1:  -0.0029260612823961366 0.15323709841369088 1.4635890726668417 -2.152265104452771
ADV2:  0.006192955857013673 0.6714561445756452 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.4664   0.1400   0.6984   2.9177   1.3316   0.9317
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0167   0.0054   0.0309   5.4889   2.1784   2.1397
***** Episode 13026, Mean R = -96.3  Std R = 41.2  Min R = -155.5
PolicyLoss: -0.00782
Policy_Beta: 0.0667
Policy_Entropy: 0.0111
Policy_KL: 0.000868
Policy_SD: 0.926
Policy_lr_mult: 1
Steps: 1.12e+04
TotalSteps: 3.99e+06
VF_0_ExplainedVarNew: 0.773
VF_0_ExplainedVarOld: 0.697
VF_0_Loss : 0.0912


Dynamics: Max Disturbance (m/s^2):  [0.00118983 0.00181235 0.00221757] 0.003101278765112381
ADV1:  0.029782127571469717 0.17004930343294997 2.1610727534761374 -1.7730684892336548
ADV2:  -0.032750226296116014 0.7145074237383583 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.3839   0.1502   0.6630   2.9177   1.3316   0.9317
ValFun  Grad

ADV1:  0.014462453291739879 0.15589374056795563 1.5983593319369536 -1.8261169185212025
ADV2:  -0.004837337054134051 0.6991981463654344 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.4842   0.2046   0.8468   2.9177   1.3316   0.9317
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0208   0.0117   0.0476   5.4889   2.1784   2.1397
***** Episode 13305, Mean R = -88.2  Std R = 36.8  Min R = -160.1
PolicyLoss: -0.00499
Policy_Beta: 0.0667
Policy_Entropy: 0.0114
Policy_KL: 0.000896
Policy_SD: 0.923
Policy_lr_mult: 1
Steps: 1.12e+04
TotalSteps: 4.09e+06
VF_0_ExplainedVarNew: 0.752
VF_0_ExplainedVarOld: 0.591
VF_0_Loss : 0.083


Dynamics: Max Disturbance (m/s^2):  [0.00118983 0.00181235 0.00221757] 0.003101278765112381
ADV1:  0.028115742248173044 0.14688524497718014 1.9088916923042667 -1.4679823541641257
ADV2:  -0.020438054815115604 0.6585037605943143 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.3862   0.1549   0.7180   2.9177   1.3316   0.9317
ValFun  Gradi

ADV1:  -0.01884062002903821 0.15129413382041096 2.17240511697688 -2.316451417009038
ADV2:  0.034484405176549986 0.6540156684215553 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.5999   0.2848   1.4663   2.9177   1.4655   0.9317
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0291   0.0147   0.0583   5.4889   2.1784   2.1397
***** Episode 13584, Mean R = -90.4  Std R = 41.7  Min R = -169.9
PolicyLoss: -0.0298
Policy_Beta: 0.0667
Policy_Entropy: 0.0124
Policy_KL: 0.00101
Policy_SD: 0.92
Policy_lr_mult: 1
Steps: 1.11e+04
TotalSteps: 4.19e+06
VF_0_ExplainedVarNew: 0.757
VF_0_ExplainedVarOld: 0.676
VF_0_Loss : 0.0706


Dynamics: Max Disturbance (m/s^2):  [0.00118983 0.00181235 0.00221757] 0.003101278765112381
ADV1:  0.009498994142395514 0.12267326198526554 1.1111698180541043 -1.343793709153258
ADV2:  -0.010956371943338438 0.730287367994185 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.4929   0.1544   0.7794   2.9177   1.4655   0.9317
ValFun  Gradients: u/

ADV1:  0.010363668570990098 0.10412743265944582 0.8597822652593705 -2.272327627080086
ADV2:  0.0009292675710620431 0.6477576978599293 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.5282   0.1613   0.9912   2.9177   1.4655   0.9317
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0210   0.0073   0.0332   5.4889   2.1784   2.1397
***** Episode 13863, Mean R = -74.5  Std R = 36.2  Min R = -160.2
PolicyLoss: -0.012
Policy_Beta: 0.0667
Policy_Entropy: 0.013
Policy_KL: 0.000816
Policy_SD: 0.913
Policy_lr_mult: 1
Steps: 1.16e+04
TotalSteps: 4.29e+06
VF_0_ExplainedVarNew: 0.754
VF_0_ExplainedVarOld: 0.668
VF_0_Loss : 0.136


Dynamics: Max Disturbance (m/s^2):  [0.00118983 0.00181235 0.00221757] 0.003101278765112381
ADV1:  -0.02731902996568427 0.15848665846881024 1.2820605514533159 -2.441724431412556
ADV2:  0.0569585696399431 0.5379206368751858 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.4054   0.1471   0.7885   2.9177   1.4655   0.9317
ValFun  Gradients: u/

ADV1:  -0.011290642161011598 0.09814139594889236 0.9753072295474693 -1.9286898096402507
ADV2:  0.022363549650014903 0.55353796131693 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.3383   0.1326   0.6783   2.9177   1.4655   0.9317
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0158   0.0079   0.0351   5.4889   2.1784   2.1397
***** Episode 14142, Mean R = -69.3  Std R = 32.3  Min R = -165.8
PolicyLoss: -0.017
Policy_Beta: 0.0667
Policy_Entropy: 0.0137
Policy_KL: 0.000685
Policy_SD: 0.907
Policy_lr_mult: 1
Steps: 1.17e+04
TotalSteps: 4.4e+06
VF_0_ExplainedVarNew: 0.732
VF_0_ExplainedVarOld: 0.553
VF_0_Loss : 0.144


Dynamics: Max Disturbance (m/s^2):  [0.00118983 0.00181235 0.00221757] 0.003101278765112381
ADV1:  -0.0023749895137474305 0.08782342435350463 1.062311795307207 -1.9443154064814272
ADV2:  0.037410617058653846 0.5660068875534775 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.3699   0.1406   0.8465   2.9177   1.4655   0.9317
ValFun  Gradients:

Dynamics: Max Disturbance (m/s^2):  [0.00118983 0.00181235 0.00221757] 0.003101278765112381
ADV1:  0.008816962045102636 0.0718279757887702 2.414636580149333 -0.849777879714968
ADV2:  -0.03901513991489198 0.5844453192866469 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.5137   0.2183   1.2482   6.0107   2.9524   1.5640
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0154   0.0070   0.0260   5.4889   2.1784   2.1397
***** Episode 14421, Mean R = -59.3  Std R = 20.8  Min R = -132.7
PolicyLoss: 0.0303
Policy_Beta: 0.0667
Policy_Entropy: 0.014
Policy_KL: 0.000725
Policy_SD: 0.897
Policy_lr_mult: 1
Steps: 1.16e+04
TotalSteps: 4.5e+06
VF_0_ExplainedVarNew: 0.651
VF_0_ExplainedVarOld: 0.472
VF_0_Loss : 0.119


ADV1:  0.001713402345798289 0.03176318042935722 0.23198674027697752 -0.31179774243948527
ADV2:  -0.010790353773738662 0.9203418642315147 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.6884   0.2574   1.2219   6.0107   2.9524   1.5640
ValFun  Gradients: 

Dynamics: Max Disturbance (m/s^2):  [0.00118983 0.00181235 0.00221757] 0.003101278765112381
ADV1:  -0.00571816097448397 0.028638710618207747 0.5633023938322677 -0.1577147296116634
ADV2:  -0.002113422602576423 0.8088971040759617 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.4368   0.7118   2.7917   6.0107   2.9524   1.5640
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0063   0.0040   0.0148   5.4889   2.1784   2.1397
***** Episode 14700, Mean R = -49.8  Std R = 9.8  Min R = -79.9
PolicyLoss: 0.0112
Policy_Beta: 0.0667
Policy_Entropy: 0.0152
Policy_KL: 0.000934
Policy_SD: 0.887
Policy_lr_mult: 1
Steps: 1.16e+04
TotalSteps: 4.6e+06
VF_0_ExplainedVarNew: 0.747
VF_0_ExplainedVarOld: 0.668
VF_0_Loss : 0.107


ADV1:  -0.0025680016706889188 0.0457907072022719 0.20284633398056034 -1.2021033947194826
ADV2:  0.03549631978938596 0.5436902226634562 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.5091   0.2169   1.2345   6.0107   2.9524   1.5640
ValFun  Gradients

Dynamics: Max Disturbance (m/s^2):  [0.00118983 0.00181235 0.00221757] 0.003101278765112381
ADV1:  -0.0009258376026626041 0.022906368062291186 0.15550235937686613 -0.14517038396900375
ADV2:  0.0034623742956770144 0.9328053731487608 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.9430   0.5200   2.6384   6.0107   2.9524   1.5640
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0012   0.0005   0.0022   5.4889   2.1784   2.1397
***** Episode 14979, Mean R = -49.6  Std R = 13.5  Min R = -78.4
PolicyLoss: -0.00474
Policy_Beta: 0.0667
Policy_Entropy: 0.0169
Policy_KL: 0.000917
Policy_SD: 0.882
Policy_lr_mult: 1
Steps: 1.18e+04
TotalSteps: 4.71e+06
VF_0_ExplainedVarNew: 0.847
VF_0_ExplainedVarOld: 0.841
VF_0_Loss : 0.0807


ADV1:  -0.0015731080643252473 0.07362032657256264 0.15911865190191812 -2.1061314670244875
ADV2:  0.03728568166946625 0.3617418906862468 2.1163151751280025 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.2557   0.0970   0.5522   6.0107   2.9524  

***** Episode 15227, Mean R = -48.5  Std R = 12.7  Min R = -72.4
PolicyLoss: -0.0093
Policy_Beta: 0.0667
Policy_Entropy: 0.0184
Policy_KL: 0.001
Policy_SD: 0.871
Policy_lr_mult: 1
Steps: 1.17e+04
TotalSteps: 4.8e+06
VF_0_ExplainedVarNew: 0.772
VF_0_ExplainedVarOld: 0.761
VF_0_Loss : 0.129


ADV1:  0.007419847884653837 0.022676914580612273 0.13965387036403024 -0.09674179534117378
ADV2:  -0.02815429735871409 0.9408112642822777 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.7322   0.2799   1.6018   6.0107   2.9557   1.6711
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0080   0.0052   0.0195   5.4889   2.1784   2.1397
***** Episode 15258, Mean R = -47.8  Std R = 13.6  Min R = -83.4
PolicyLoss: 0.001
Policy_Beta: 0.0667
Policy_Entropy: 0.0183
Policy_KL: 0.000836
Policy_SD: 0.871
Policy_lr_mult: 1
Steps: 1.18e+04
TotalSteps: 4.81e+06
VF_0_ExplainedVarNew: 0.834
VF_0_ExplainedVarOld: 0.829
VF_0_Loss : 0.105


ADV1:  0.0018568970031879806 0.01979658437162304 0.14437707533

cs_angles | -0.0052 -0.0017 |  0.1300  0.1257 | -0.9976 -0.9994 |  0.9916  0.9990
optical_flow | -0.0001 -0.0000 |  0.0263  0.0292 | -1.4232 -1.2716 |  1.0633  1.1411
v_err    | -0.0100 |  0.0642 | -0.5003 |  0.2225
landing_rewards |    7.55 |    4.30 |    0.00 |   10.00
landing_margin |    0.06 |    1.25 |   -0.07 |   22.03
tracking_rewards |  -40.88 |   10.71 |  -81.29 |  -24.15
steps    |     377 |      20 |     333 |     420
***** Episode 15537, Mean R = -38.0  Std R = 8.9  Min R = -63.5
PolicyLoss: -0.0065
Policy_Beta: 0.0667
Policy_Entropy: 0.02
Policy_KL: 0.000762
Policy_SD: 0.85
Policy_lr_mult: 1
Steps: 1.17e+04
TotalSteps: 4.92e+06
VF_0_ExplainedVarNew: 0.832
VF_0_ExplainedVarOld: 0.824
VF_0_Loss : 0.102


ADV1:  -0.005502097175622141 0.020236707060015496 0.13838556177735384 -0.14914340512006713
ADV2:  0.023163791687970732 0.9212133349301502 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.1363   1.8073   5.6268   6.0107   2.9557   1.8073
ValFun  Gradients: u/sd/M

w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.07   -0.05   -0.05 |    0.06    0.05    0.05
a_f      |   -0.05    0.08 |    0.63    1.84 |   -1.44   -3.11 |    1.31    3.13
w_f      |   -0.00    0.00    0.00 |    0.03    0.01    0.01 |   -0.07   -0.03   -0.04 |    0.05    0.04    0.04
w_rewards |   -0.00 |    0.02 |   -0.19 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.38 |    0.24 |    0.00 |    1.68
seeker_angles |   -0.01   -0.00 |    0.12    0.12 |   -1.00   -1.00 |    1.00    0.99
cs_angles | -0.0080 -0.0020 |  0.1210  0.1203 | -0.9995 -0.9961 |  0.9996  0.9943
optical_flow | -0.0001  0.0001 |  0.0265  0.0299 | -0.9536 -1.2112 |  1.6935  1.6469
v_err    | -0.0110 |  0.0641 | -0.5000 |  0.1636
landing_rewards |    7.19 |    4.49 |    0.00 |   10.00
landing_margin |   -0.01 |    0.03 |   -0.09 |    0.11
tracking_rewards |  -38.40 |    9.85 |  -96.17 |  -20.72
steps    |     376 |  

w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.07   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.02    0.01 |    0.65    1.85 |   -1.40   -3.13 |    1.42    3.14
w_f      |   -0.00   -0.00    0.00 |    0.03    0.01    0.01 |   -0.07   -0.03   -0.04 |    0.05    0.04    0.05
w_rewards |   -0.00 |    0.02 |   -0.19 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |   -0.16 |    2.84 |  -50.00 |    0.00
theta_cv |    0.37 |    0.24 |    0.00 |    1.80
seeker_angles |   -0.00    0.00 |    0.11    0.12 |   -0.99   -1.00 |    1.00    0.99
cs_angles | -0.0038  0.0009 |  0.1142  0.1162 | -0.9929 -0.9990 |  0.9964  0.9863
optical_flow | -0.0002  0.0003 |  0.0258  0.0279 | -1.1385 -1.0230 |  1.0627  1.2779
v_err    | -0.0104 |  0.0639 | -0.4917 |  0.4316
landing_rewards |    7.39 |    4.39 |    0.00 |   10.00
landing_margin |    1.53 |   27.21 |   -0.08 |  479.79
tracking_rewards |  -36.11 |    8.95 |  -84.08 |  -19.97
steps    |     376 |  

attitude |   -0.04    0.03   -0.15 |    1.20    0.66    1.82 |   -3.14   -1.57   -3.14 |    3.14    1.57    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.07   -0.05   -0.05 |    0.06    0.05    0.05
a_f      |    0.01   -0.26 |    0.65    1.77 |   -1.42   -3.13 |    1.46    3.06
w_f      |   -0.00    0.00    0.00 |    0.03    0.01    0.01 |   -0.07   -0.03   -0.03 |    0.06    0.04    0.05
w_rewards |   -0.00 |    0.02 |   -0.29 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.37 |    0.25 |    0.00 |    1.85
seeker_angles |    0.00    0.00 |    0.11    0.11 |   -0.99   -0.99 |    1.00    1.00
cs_angles |  0.0042  0.0005 |  0.1111  0.1121 | -0.9909 -0.9926 |  0.9973  0.9998
optical_flow |  0.0000  0.0001 |  0.0272  0.0281 | -1.1533 -1.1617 |  1.2894  1.0404
v_err    | -0.0103 |  0.0633 | -0.5003 |  0.1889
landing_rewards |    7.16 |    4.51 |    0.00 |   10.00
landing_margin |   -0

w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.06   -0.05   -0.05 |    0.06    0.05    0.05
a_f      |    0.01    0.00 |    0.67    1.90 |   -1.49   -3.14 |    1.50    3.13
w_f      |   -0.00   -0.00    0.00 |    0.03    0.01    0.01 |   -0.06   -0.04   -0.03 |    0.06    0.03    0.04
w_rewards |   -0.00 |    0.02 |   -0.25 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.36 |    0.25 |    0.00 |    1.91
seeker_angles |    0.01    0.00 |    0.11    0.11 |   -0.99   -0.99 |    1.00    0.99
cs_angles |  0.0051  0.0027 |  0.1085  0.1076 | -0.9923 -0.9889 |  0.9973  0.9933
optical_flow | -0.0002  0.0001 |  0.0276  0.0291 | -1.5326 -1.6223 |  1.4270  1.2846
v_err    | -0.0100 |  0.0628 | -0.5003 |  0.1817
landing_rewards |    6.97 |    4.60 |    0.00 |   10.00
landing_margin |   -0.00 |    0.17 |   -0.07 |    2.97
tracking_rewards |  -32.70 |    8.78 |  -93.05 |  -17.81
steps    |     373 |  

w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.07   -0.05   -0.05 |    0.06    0.05    0.05
a_f      |   -0.01    0.15 |    0.67    1.82 |   -1.56   -3.14 |    1.51    3.14
w_f      |   -0.00   -0.00    0.00 |    0.03    0.01    0.01 |   -0.07   -0.04   -0.04 |    0.06    0.03    0.03
w_rewards |   -0.00 |    0.02 |   -0.23 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |   -0.16 |    2.84 |  -50.00 |    0.00
theta_cv |    0.35 |    0.25 |    0.00 |    1.65
seeker_angles |    0.01    0.00 |    0.11    0.11 |   -0.99   -1.00 |    1.00    0.99
cs_angles |  0.0100  0.0047 |  0.1057  0.1095 | -0.9937 -0.9988 |  0.9995  0.9924
optical_flow |  0.0001  0.0000 |  0.0265  0.0281 | -1.1538 -1.2784 |  1.1667  1.2427
v_err    | -0.0097 |  0.0625 | -0.5000 |  0.4777
landing_rewards |    6.74 |    4.69 |    0.00 |   10.00
landing_margin |    1.20 |   21.32 |   -0.07 |  376.02
tracking_rewards |  -31.86 |    8.08 |  -61.56 |  -17.74
steps    |     371 |  

w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.07   -0.05   -0.05 |    0.06    0.05    0.05
a_f      |   -0.10    0.05 |    0.64    1.78 |   -1.47   -3.09 |    1.31    3.05
w_f      |   -0.00    0.00    0.00 |    0.03    0.01    0.01 |   -0.07   -0.04   -0.04 |    0.06    0.03    0.03
w_rewards |   -0.01 |    0.02 |   -0.23 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.35 |    0.25 |    0.00 |    1.77
seeker_angles |    0.01    0.00 |    0.10    0.11 |   -0.99   -0.99 |    0.97    1.00
cs_angles |  0.0078  0.0015 |  0.1032  0.1053 | -0.9925 -0.9945 |  0.9731  0.9987
optical_flow |  0.0001  0.0002 |  0.0276  0.0278 | -1.1017 -1.3481 |  1.2416  1.0468
v_err    | -0.0103 |  0.0613 | -0.4955 |  0.1714
landing_rewards |    7.06 |    4.55 |    0.00 |   10.00
landing_margin |   -0.01 |    0.02 |   -0.08 |    0.09
tracking_rewards |  -30.65 |    8.52 |  -69.37 |  -16.86
steps    |     378 |  

w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.07   -0.05   -0.05 |    0.06    0.05    0.05
a_f      |    0.06   -0.04 |    0.66    1.84 |   -1.53   -3.13 |    1.49    3.14
w_f      |   -0.01   -0.00    0.00 |    0.03    0.01    0.01 |   -0.06   -0.03   -0.03 |    0.06    0.04    0.04
w_rewards |   -0.01 |    0.03 |   -0.31 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.35 |    0.26 |    0.00 |    1.89
seeker_angles |    0.02   -0.00 |    0.10    0.11 |   -0.98   -1.00 |    1.00    0.99
cs_angles |  0.0153 -0.0029 |  0.1006  0.1076 | -0.9764 -0.9997 |  0.9965  0.9885
optical_flow |  0.0000  0.0003 |  0.0262  0.0288 | -1.2359 -1.2857 |  0.9314  1.0819
v_err    | -0.0104 |  0.0612 | -0.4985 |  0.1815
landing_rewards |    6.94 |    4.61 |    0.00 |   10.00
landing_margin |   -0.01 |    0.02 |   -0.06 |    0.10
tracking_rewards |  -30.65 |    7.78 |  -79.30 |  -17.43
steps    |     377 |  

w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.06   -0.05   -0.05 |    0.07    0.05    0.05
a_f      |   -0.02   -0.11 |    0.68    1.88 |   -1.53   -3.14 |    1.51    3.13
w_f      |   -0.00    0.00    0.00 |    0.03    0.01    0.01 |   -0.06   -0.04   -0.04 |    0.07    0.04    0.04
w_rewards |   -0.00 |    0.01 |   -0.16 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.34 |    0.26 |    0.00 |    1.55
seeker_angles |    0.02    0.00 |    0.10    0.10 |   -1.00   -0.98 |    1.00    1.00
cs_angles |  0.0176  0.0009 |  0.1011  0.1019 | -0.9984 -0.9816 |  0.9976  0.9997
optical_flow | -0.0001  0.0002 |  0.0274  0.0285 | -1.5733 -1.4955 |  1.1098  1.2893
v_err    | -0.0101 |  0.0613 | -0.4963 |  0.1493
landing_rewards |    7.03 |    4.57 |    0.00 |   10.00
landing_margin |   -0.01 |    0.03 |   -0.07 |    0.07
tracking_rewards |  -29.70 |    7.87 |  -59.43 |  -15.40
steps    |     375 |  

w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.06   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.01   -0.01 |    0.63    1.77 |   -1.50   -3.13 |    1.37    3.12
w_f      |   -0.00    0.00   -0.00 |    0.03    0.01    0.01 |   -0.06   -0.03   -0.04 |    0.05    0.04    0.03
w_rewards |   -0.00 |    0.01 |   -0.14 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.36 |    0.27 |    0.00 |    1.51
seeker_angles |    0.01    0.00 |    0.10    0.10 |   -0.99   -0.99 |    0.97    1.00
cs_angles |  0.0077  0.0040 |  0.1045  0.1036 | -0.9879 -0.9947 |  0.9750  0.9997
optical_flow |  0.0001  0.0000 |  0.0269  0.0274 | -1.0935 -1.3344 |  1.2811  1.5094
v_err    | -0.0103 |  0.0612 | -0.4705 |  0.1612
landing_rewards |    7.03 |    4.57 |    0.00 |   10.00
landing_margin |   -0.01 |    0.02 |   -0.06 |    0.09
tracking_rewards |  -29.92 |    7.56 |  -52.05 |  -16.50
steps    |     375 |  

w        |   -0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.06   -0.05   -0.05 |    0.06    0.05    0.05
a_f      |    0.03    0.08 |    0.69    1.77 |   -1.36   -3.13 |    1.51    3.12
w_f      |   -0.00    0.00    0.00 |    0.03    0.01    0.01 |   -0.06   -0.05   -0.03 |    0.06    0.04    0.04
w_rewards |   -0.00 |    0.01 |   -0.17 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.34 |    0.26 |    0.00 |    1.50
seeker_angles |    0.01    0.00 |    0.10    0.10 |   -0.99   -1.00 |    0.99    0.99
cs_angles |  0.0060  0.0022 |  0.0998  0.1029 | -0.9871 -0.9990 |  0.9920  0.9948
optical_flow |  0.0000  0.0000 |  0.0284  0.0295 | -1.2768 -1.5853 |  1.7079  1.3246
v_err    | -0.0097 |  0.0612 | -0.4714 |  0.1399
landing_rewards |    7.55 |    4.30 |    0.00 |   10.00
landing_margin |   -0.01 |    0.02 |   -0.08 |    0.06
tracking_rewards |  -28.56 |    7.15 |  -55.01 |  -16.03
steps    |     376 |  

attitude |   -0.06   -0.02   -0.17 |    1.20    0.62    1.88 |   -3.14   -1.55   -3.14 |    3.14    1.53    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.07   -0.05   -0.05 |    0.07    0.05    0.05
a_f      |   -0.02   -0.08 |    0.65    1.87 |   -1.54   -3.12 |    1.37    3.14
w_f      |   -0.00    0.00    0.00 |    0.03    0.01    0.01 |   -0.07   -0.03   -0.04 |    0.07    0.04    0.04
w_rewards |   -0.01 |    0.03 |   -0.29 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.33 |    0.26 |    0.00 |    1.55
seeker_angles |    0.00   -0.00 |    0.09    0.10 |   -1.00   -0.99 |    1.00    1.00
cs_angles |  0.0019 -0.0024 |  0.0942  0.1016 | -0.9968 -0.9913 |  0.9989  0.9991
optical_flow |  0.0001  0.0001 |  0.0269  0.0277 | -1.1495 -1.0405 |  1.0931  1.3540
v_err    | -0.0094 |  0.0605 | -0.4527 |  0.1612
landing_rewards |    7.26 |    4.46 |    0.00 |   10.00
landing_margin |   -0

attitude |   -0.09    0.00   -0.12 |    1.15    0.66    1.84 |   -3.14   -1.56   -3.14 |    3.14    1.55    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.01   -0.18 |    0.66    1.83 |   -1.48   -3.13 |    1.40    3.12
w_f      |   -0.00    0.00   -0.00 |    0.03    0.01    0.01 |   -0.05   -0.03   -0.04 |    0.05    0.04    0.04
w_rewards |   -0.00 |    0.00 |   -0.04 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.34 |    0.26 |    0.00 |    2.04
seeker_angles |    0.00   -0.00 |    0.10    0.10 |   -1.00   -1.00 |    1.00    0.97
cs_angles |  0.0044 -0.0008 |  0.0993  0.1005 | -0.9981 -0.9954 |  1.0000  0.9695
optical_flow | -0.0000  0.0000 |  0.0288  0.0262 | -1.2442 -1.0571 |  1.3180  0.9541
v_err    | -0.0094 |  0.0602 | -0.4999 |  0.1470
landing_rewards |    7.42 |    4.38 |    0.00 |   10.00
landing_margin |   -0

attitude |   -0.07    0.04   -0.09 |    1.17    0.63    1.87 |   -3.14   -1.55   -3.14 |    3.14    1.55    3.14
w        |   -0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.06   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.03   -0.23 |    0.64    1.85 |   -1.50   -3.12 |    1.44    3.14
w_f      |   -0.00    0.00    0.00 |    0.03    0.01    0.01 |   -0.06   -0.03   -0.03 |    0.05    0.04    0.04
w_rewards |   -0.00 |    0.01 |   -0.14 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.33 |    0.26 |    0.00 |    1.47
seeker_angles |    0.00    0.00 |    0.09    0.10 |   -1.00   -1.00 |    0.99    0.98
cs_angles |  0.0036  0.0008 |  0.0948  0.0965 | -0.9997 -0.9995 |  0.9915  0.9778
optical_flow |  0.0000 -0.0001 |  0.0267  0.0268 | -1.0893 -1.1728 |  1.3898  1.2732
v_err    | -0.0096 |  0.0603 | -0.4989 |  0.1666
landing_rewards |    7.16 |    4.51 |    0.00 |   10.00
landing_margin |   -0

attitude |   -0.02   -0.04   -0.08 |    1.23    0.66    1.87 |   -3.14   -1.57   -3.14 |    3.14    1.57    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.06   -0.05   -0.05 |    0.06    0.05    0.05
a_f      |   -0.03    0.01 |    0.68    1.87 |   -1.49   -3.14 |    1.52    3.12
w_f      |   -0.00    0.00    0.00 |    0.03    0.01    0.01 |   -0.06   -0.04   -0.03 |    0.06    0.04    0.04
w_rewards |   -0.00 |    0.01 |   -0.16 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.32 |    0.26 |    0.00 |    1.44
seeker_angles |    0.00   -0.00 |    0.09    0.10 |   -0.99   -1.00 |    1.00    1.00
cs_angles |  0.0001 -0.0023 |  0.0933  0.0981 | -0.9884 -0.9952 |  0.9989  0.9973
optical_flow | -0.0001  0.0001 |  0.0267  0.0272 | -1.1593 -1.1193 |  1.0637  0.9590
v_err    | -0.0094 |  0.0600 | -0.5001 |  0.1470
landing_rewards |    7.45 |    4.36 |    0.00 |   10.00
landing_margin |   -0

attitude |   -0.10    0.03    0.07 |    1.10    0.65    1.80 |   -3.14   -1.57   -3.14 |    3.14    1.57    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.07   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.03    0.06 |    0.65    1.83 |   -1.55   -3.12 |    1.53    3.11
w_f      |   -0.00    0.00    0.00 |    0.03    0.01    0.01 |   -0.07   -0.03   -0.04 |    0.05    0.04    0.04
w_rewards |   -0.00 |    0.02 |   -0.28 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.33 |    0.26 |    0.00 |    1.69
seeker_angles |    0.00   -0.00 |    0.09    0.10 |   -0.99   -1.00 |    1.00    0.99
cs_angles |  0.0015 -0.0004 |  0.0921  0.1004 | -0.9944 -0.9973 |  0.9990  0.9891
optical_flow |  0.0003  0.0000 |  0.0264  0.0266 | -1.2914 -1.4305 |  1.1734  1.4172
v_err    | -0.0096 |  0.0596 | -0.4531 |  0.1537
landing_rewards |    7.29 |    4.44 |    0.00 |   10.00
landing_margin |   -0

w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.08   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.06    0.17 |    0.64    1.84 |   -1.55   -3.13 |    1.39    3.14
w_f      |   -0.00    0.00    0.00 |    0.03    0.01    0.01 |   -0.08   -0.04   -0.03 |    0.05    0.04    0.03
w_rewards |   -0.00 |    0.02 |   -0.34 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.32 |    0.26 |    0.00 |    1.59
seeker_angles |    0.01    0.00 |    0.09    0.10 |   -0.99   -1.00 |    0.99    0.99
cs_angles |  0.0080  0.0023 |  0.0911  0.0979 | -0.9944 -0.9975 |  0.9863  0.9900
optical_flow | -0.0001  0.0001 |  0.0275  0.0267 | -1.2421 -1.1078 |  1.1647  1.4275
v_err    | -0.0100 |  0.0598 | -0.4771 |  0.1548
landing_rewards |    7.65 |    4.24 |    0.00 |   10.00
landing_margin |   -0.01 |    0.02 |   -0.06 |    0.07
tracking_rewards |  -26.01 |    6.76 |  -64.25 |  -14.19
steps    |     377 |  

w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.06   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.01   -0.03 |    0.67    1.86 |   -1.43   -3.09 |    1.46    3.14
w_f      |    0.00    0.00    0.00 |    0.03    0.01    0.01 |   -0.06   -0.03   -0.03 |    0.05    0.03    0.04
w_rewards |   -0.00 |    0.01 |   -0.08 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.31 |    0.26 |    0.00 |    1.39
seeker_angles |    0.01   -0.00 |    0.09    0.10 |   -1.00   -1.00 |    0.99    1.00
cs_angles |  0.0054 -0.0023 |  0.0916  0.0959 | -0.9973 -0.9977 |  0.9927  0.9986
optical_flow | -0.0000 -0.0001 |  0.0275  0.0264 | -1.2668 -1.0487 |  0.9448  0.9495
v_err    | -0.0101 |  0.0599 | -0.4530 |  0.1577
landing_rewards |    7.61 |    4.26 |    0.00 |   10.00
landing_margin |   -0.01 |    0.02 |   -0.08 |    0.10
tracking_rewards |  -25.60 |    6.55 |  -54.79 |  -14.96
steps    |     376 |  

w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.07   -0.05   -0.05 |    0.06    0.05    0.05
a_f      |    0.02    0.03 |    0.66    1.87 |   -1.53   -3.12 |    1.55    3.12
w_f      |   -0.00    0.00    0.00 |    0.03    0.01    0.01 |   -0.07   -0.04   -0.03 |    0.06    0.04    0.03
w_rewards |   -0.00 |    0.02 |   -0.19 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.31 |    0.26 |    0.00 |    1.75
seeker_angles |    0.01    0.00 |    0.09    0.10 |   -0.99   -1.00 |    1.00    0.98
cs_angles |  0.0095  0.0005 |  0.0885  0.0974 | -0.9905 -0.9976 |  0.9956  0.9770
optical_flow |  0.0001  0.0000 |  0.0282  0.0257 | -1.3792 -1.1015 |  1.2467  0.9182
v_err    | -0.0100 |  0.0589 | -0.4897 |  0.1458
landing_rewards |    7.81 |    4.14 |    0.00 |   10.00
landing_margin |   -0.01 |    0.02 |   -0.07 |    0.06
tracking_rewards |  -25.14 |    6.29 |  -50.94 |  -14.40
steps    |     377 |  

w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.06   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.05   -0.01 |    0.66    1.90 |   -1.51   -3.11 |    1.45    3.14
w_f      |   -0.00    0.00    0.00 |    0.02    0.01    0.01 |   -0.06   -0.03   -0.04 |    0.05    0.04    0.05
w_rewards |   -0.00 |    0.01 |   -0.12 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.31 |    0.26 |    0.00 |    1.43
seeker_angles |    0.01    0.00 |    0.09    0.09 |   -0.99   -1.00 |    1.00    1.00
cs_angles |  0.0099  0.0007 |  0.0921  0.0936 | -0.9911 -0.9971 |  0.9982  0.9984
optical_flow |  0.0000 -0.0000 |  0.0268  0.0264 | -1.0320 -1.2222 |  1.1426  1.3794
v_err    | -0.0101 |  0.0590 | -0.4534 |  0.1534
landing_rewards |    7.77 |    4.16 |    0.00 |   10.00
landing_margin |   -0.02 |    0.02 |   -0.07 |    0.08
tracking_rewards |  -24.92 |    6.58 |  -59.78 |  -14.93
steps    |     375 |  

attitude |   -0.00    0.00   -0.01 |    1.22    0.67    1.91 |   -3.14   -1.57   -3.14 |    3.14    1.57    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.07   -0.05   -0.05 |    0.06    0.05    0.05
a_f      |   -0.01   -0.09 |    0.67    1.94 |   -1.46   -3.13 |    1.51    3.14
w_f      |   -0.00    0.00    0.00 |    0.03    0.01    0.01 |   -0.07   -0.04   -0.04 |    0.06    0.04    0.03
w_rewards |   -0.00 |    0.01 |   -0.18 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.31 |    0.26 |    0.00 |    1.56
seeker_angles |    0.02   -0.00 |    0.09    0.09 |   -1.00   -0.99 |    0.99    1.00
cs_angles |  0.0163 -0.0004 |  0.0916  0.0912 | -0.9970 -0.9933 |  0.9876  0.9987
optical_flow |  0.0001  0.0001 |  0.0275  0.0270 | -1.1713 -0.9124 |  1.0311  0.9690
v_err    | -0.0101 |  0.0590 | -0.4528 |  0.1378
landing_rewards |    8.52 |    3.55 |    0.00 |   10.00
landing_margin |   -0

attitude |   -0.11    0.03   -0.02 |    1.19    0.67    1.80 |   -3.14   -1.56   -3.14 |    3.14    1.56    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.06   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.04   -0.14 |    0.68    1.80 |   -1.49   -3.13 |    1.49    3.14
w_f      |   -0.00    0.00   -0.00 |    0.03    0.01    0.01 |   -0.06   -0.03   -0.03 |    0.05    0.05    0.04
w_rewards |   -0.00 |    0.01 |   -0.22 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.30 |    0.26 |    0.00 |    1.40
seeker_angles |    0.01    0.00 |    0.09    0.10 |   -1.00   -0.98 |    0.98    0.98
cs_angles |  0.0111  0.0026 |  0.0879  0.0951 | -0.9998 -0.9771 |  0.9813  0.9756
optical_flow | -0.0000 -0.0001 |  0.0265  0.0261 | -1.0993 -0.9466 |  1.2278  1.3413
v_err    | -0.0099 |  0.0591 | -0.5000 |  0.1314
landing_rewards |    8.06 |    3.95 |    0.00 |   10.00
landing_margin |   -0

w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.06   -0.05   -0.05 |    0.06    0.05    0.05
a_f      |   -0.06    0.02 |    0.66    1.83 |   -1.51   -3.11 |    1.42    3.14
w_f      |   -0.00    0.00    0.00 |    0.03    0.01    0.01 |   -0.06   -0.03   -0.03 |    0.06    0.03    0.03
w_rewards |   -0.00 |    0.01 |   -0.15 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.30 |    0.26 |    0.00 |    1.33
seeker_angles |    0.01    0.00 |    0.09    0.09 |   -0.99   -0.98 |    0.99    0.99
cs_angles |  0.0055  0.0032 |  0.0899  0.0937 | -0.9939 -0.9809 |  0.9925  0.9903
optical_flow |  0.0001  0.0001 |  0.0273  0.0256 | -0.9838 -1.1530 |  1.2858  0.9284
v_err    | -0.0097 |  0.0599 | -0.4528 |  0.1633
landing_rewards |    7.94 |    4.05 |    0.00 |   10.00
landing_margin |   -0.02 |    0.02 |   -0.07 |    0.07
tracking_rewards |  -24.50 |    5.53 |  -44.38 |  -14.55
steps    |     374 |  

w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.07   -0.05   -0.05 |    0.06    0.05    0.05
a_f      |    0.01   -0.27 |    0.68    1.84 |   -1.55   -3.12 |    1.55    3.10
w_f      |   -0.00    0.00    0.00 |    0.03    0.01    0.01 |   -0.07   -0.04   -0.04 |    0.06    0.03    0.04
w_rewards |   -0.00 |    0.02 |   -0.29 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.31 |    0.27 |    0.00 |    1.43
seeker_angles |    0.01    0.00 |    0.09    0.09 |   -1.00   -1.00 |    1.00    1.00
cs_angles |  0.0059  0.0050 |  0.0947  0.0948 | -0.9963 -0.9987 |  0.9977  0.9986
optical_flow | -0.0000  0.0001 |  0.0268  0.0262 | -1.1060 -1.1838 |  1.1225  1.2444
v_err    | -0.0097 |  0.0592 | -0.4532 |  0.1754
landing_rewards |    7.81 |    4.14 |    0.00 |   10.00
landing_margin |   -0.01 |    0.02 |   -0.05 |    0.12
tracking_rewards |  -24.90 |    6.48 |  -61.46 |  -13.43
steps    |     375 |  

w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.06   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.05   -0.01 |    0.70    1.86 |   -1.53   -3.14 |    1.48    3.14
w_f      |   -0.00    0.00    0.00 |    0.03    0.01    0.01 |   -0.06   -0.04   -0.03 |    0.05    0.03    0.02
w_rewards |   -0.00 |    0.01 |   -0.11 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.30 |    0.25 |    0.00 |    1.42
seeker_angles |    0.01    0.00 |    0.09    0.09 |   -1.00   -0.99 |    0.97    1.00
cs_angles |  0.0075  0.0042 |  0.0866  0.0931 | -0.9994 -0.9928 |  0.9682  0.9968
optical_flow | -0.0000  0.0001 |  0.0256  0.0271 | -1.2375 -1.1434 |  1.1268  1.0001
v_err    | -0.0100 |  0.0594 | -0.4586 |  0.1396
landing_rewards |    7.77 |    4.16 |    0.00 |   10.00
landing_margin |   -0.01 |    0.02 |   -0.08 |    0.08
tracking_rewards |  -23.84 |    6.10 |  -51.64 |  -13.50
steps    |     376 |  

attitude |   -0.03    0.01    0.00 |    1.13    0.65    1.80 |   -3.14   -1.57   -3.14 |    3.14    1.57    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.06   -0.05   -0.05 |    0.06    0.05    0.05
a_f      |    0.01    0.05 |    0.66    1.78 |   -1.42   -3.13 |    1.43    3.09
w_f      |   -0.00    0.00    0.00 |    0.03    0.01    0.01 |   -0.06   -0.04   -0.03 |    0.06    0.04    0.03
w_rewards |   -0.00 |    0.01 |   -0.08 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.29 |    0.25 |    0.00 |    1.49
seeker_angles |    0.01    0.00 |    0.09    0.09 |   -1.00   -1.00 |    0.99    0.99
cs_angles |  0.0055  0.0048 |  0.0872  0.0894 | -0.9972 -0.9988 |  0.9925  0.9875
optical_flow |  0.0002  0.0001 |  0.0267  0.0273 | -1.1822 -1.4371 |  1.1900  1.0668
v_err    | -0.0098 |  0.0591 | -0.4574 |  0.1506
landing_rewards |    7.71 |    4.20 |    0.00 |   10.00
landing_margin |   -0

w        |   -0.00   -0.00    0.00 |    0.01    0.01    0.01 |   -0.06   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.09   -0.20 |    0.67    1.72 |   -1.31   -3.10 |    1.47    3.14
w_f      |   -0.00    0.00    0.00 |    0.02    0.01    0.01 |   -0.06   -0.04   -0.04 |    0.04    0.03    0.03
w_rewards |   -0.00 |    0.01 |   -0.08 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.30 |    0.26 |    0.00 |    1.40
seeker_angles |    0.00    0.00 |    0.09    0.09 |   -1.00   -0.99 |    1.00    0.99
cs_angles |  0.0014  0.0043 |  0.0911  0.0891 | -0.9981 -0.9898 |  0.9978  0.9947
optical_flow |  0.0001 -0.0000 |  0.0262  0.0266 | -0.9331 -1.0852 |  1.3795  1.0357
v_err    | -0.0098 |  0.0593 | -0.4529 |  0.1614
landing_rewards |    7.97 |    4.02 |    0.00 |   10.00
landing_margin |   -0.02 |    0.02 |   -0.07 |    0.08
tracking_rewards |  -23.72 |    5.72 |  -64.38 |  -13.02
steps    |     374 |  

w        |   -0.00   -0.00    0.00 |    0.01    0.01    0.01 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.00   -0.01 |    0.66    1.84 |   -1.51   -3.13 |    1.53    3.14
w_f      |   -0.00    0.00    0.00 |    0.02    0.01    0.01 |   -0.05   -0.03   -0.03 |    0.05    0.04    0.03
w_rewards |   -0.00 |    0.00 |   -0.05 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.30 |    0.26 |    0.00 |    1.34
seeker_angles |    0.00    0.00 |    0.09    0.09 |   -0.99   -0.98 |    1.00    0.98
cs_angles |  0.0034  0.0027 |  0.0887  0.0913 | -0.9935 -0.9769 |  0.9978  0.9843
optical_flow |  0.0002  0.0001 |  0.0261  0.0268 | -0.9723 -1.1650 |  1.3404  1.1064
v_err    | -0.0096 |  0.0590 | -0.4530 |  0.1387
landing_rewards |    8.32 |    3.74 |    0.00 |   10.00
landing_margin |   -0.02 |    0.02 |   -0.06 |    0.06
tracking_rewards |  -23.46 |    5.54 |  -47.63 |  -13.28
steps    |     375 |  

w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.01    0.01 |    0.65    1.95 |   -1.55   -3.12 |    1.49    3.14
w_f      |   -0.00    0.00    0.00 |    0.02    0.01    0.01 |   -0.05   -0.03   -0.02 |    0.05    0.03    0.03
w_rewards |   -0.00 |    0.00 |   -0.04 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.30 |    0.26 |    0.00 |    1.50
seeker_angles |    0.00    0.00 |    0.09    0.09 |   -0.99   -0.98 |    1.00    1.00
cs_angles |  0.0044  0.0025 |  0.0883  0.0929 | -0.9887 -0.9834 |  0.9998  0.9970
optical_flow |  0.0001 -0.0000 |  0.0268  0.0265 | -1.3032 -1.2284 |  1.0782  1.3522
v_err    | -0.0091 |  0.0586 | -0.4999 |  0.1370
landing_rewards |    7.90 |    4.07 |    0.00 |   10.00
landing_margin |   -0.02 |    0.02 |   -0.06 |    0.06
tracking_rewards |  -23.62 |    6.04 |  -59.49 |  -13.80
steps    |     377 |  

w        |   -0.00   -0.00   -0.00 |    0.01    0.01    0.01 |   -0.07   -0.05   -0.05 |    0.06    0.05    0.05
a_f      |    0.03   -0.04 |    0.63    1.90 |   -1.37   -3.13 |    1.49    3.12
w_f      |   -0.00    0.00    0.00 |    0.02    0.01    0.01 |   -0.07   -0.03   -0.04 |    0.06    0.04    0.04
w_rewards |   -0.00 |    0.01 |   -0.17 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.29 |    0.25 |    0.00 |    1.43
seeker_angles |    0.00    0.00 |    0.09    0.09 |   -1.00   -1.00 |    0.99    1.00
cs_angles |  0.0013  0.0043 |  0.0858  0.0869 | -0.9981 -0.9987 |  0.9942  0.9967
optical_flow |  0.0000  0.0000 |  0.0266  0.0265 | -1.2597 -0.9524 |  1.2819  1.1669
v_err    | -0.0092 |  0.0592 | -0.4504 |  0.1389
landing_rewards |    7.94 |    4.05 |    0.00 |   10.00
landing_margin |   -0.01 |    0.02 |   -0.06 |    0.05
tracking_rewards |  -22.76 |    4.95 |  -43.07 |  -13.27
steps    |     375 |  

w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.06   -0.05   -0.05 |    0.06    0.05    0.05
a_f      |    0.01    0.16 |    0.66    1.87 |   -1.54   -3.11 |    1.55    3.12
w_f      |   -0.00    0.00    0.00 |    0.02    0.01    0.01 |   -0.06   -0.03   -0.02 |    0.06    0.03    0.03
w_rewards |   -0.00 |    0.01 |   -0.08 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.29 |    0.25 |    0.00 |    1.47
seeker_angles |   -0.00    0.00 |    0.09    0.08 |   -0.99   -0.98 |    1.00    1.00
cs_angles | -0.0000  0.0028 |  0.0881  0.0849 | -0.9902 -0.9841 |  0.9955  0.9969
optical_flow |  0.0001  0.0001 |  0.0279  0.0269 | -1.3422 -1.3306 |  1.5288  1.2603
v_err    | -0.0093 |  0.0586 | -0.4533 |  0.1506
landing_rewards |    8.35 |    3.71 |    0.00 |   10.00
landing_margin |   -0.02 |    0.02 |   -0.06 |    0.06
tracking_rewards |  -22.67 |    5.30 |  -55.37 |  -13.47
steps    |     376 |  

w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.06   -0.05   -0.05 |    0.06    0.05    0.05
a_f      |   -0.03   -0.13 |    0.66    1.77 |   -1.43   -3.10 |    1.46    3.13
w_f      |   -0.00    0.00    0.00 |    0.02    0.01    0.01 |   -0.06   -0.03   -0.04 |    0.06    0.03    0.03
w_rewards |   -0.00 |    0.01 |   -0.07 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.29 |    0.25 |    0.00 |    1.41
seeker_angles |    0.00    0.00 |    0.09    0.09 |   -0.98   -1.00 |    1.00    0.99
cs_angles |  0.0031  0.0039 |  0.0860  0.0864 | -0.9845 -0.9978 |  0.9985  0.9892
optical_flow |  0.0001  0.0001 |  0.0270  0.0264 | -1.0056 -1.0123 |  1.1744  1.3642
v_err    | -0.0092 |  0.0587 | -0.4526 |  0.1529
landing_rewards |    8.06 |    3.95 |    0.00 |   10.00
landing_margin |   -0.02 |    0.02 |   -0.06 |    0.07
tracking_rewards |  -22.53 |    4.95 |  -39.07 |  -13.34
steps    |     375 |  

w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.06   -0.05   -0.05 |    0.06    0.05    0.05
a_f      |   -0.01   -0.02 |    0.67    1.87 |   -1.45   -3.11 |    1.48    3.14
w_f      |   -0.01    0.00    0.00 |    0.02    0.01    0.01 |   -0.06   -0.03   -0.03 |    0.06    0.03    0.03
w_rewards |   -0.00 |    0.01 |   -0.07 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.29 |    0.26 |    0.00 |    1.41
seeker_angles |    0.00    0.00 |    0.09    0.09 |   -0.99   -1.00 |    0.99    1.00
cs_angles |  0.0041  0.0020 |  0.0900  0.0891 | -0.9905 -0.9981 |  0.9935  0.9989
optical_flow |  0.0002  0.0001 |  0.0281  0.0258 | -1.7895 -1.3442 |  1.2739  1.3388
v_err    | -0.0090 |  0.0586 | -0.4525 |  0.1381
landing_rewards |    8.06 |    3.95 |    0.00 |   10.00
landing_margin |   -0.02 |    0.02 |   -0.07 |    0.06
tracking_rewards |  -22.88 |    5.32 |  -41.18 |  -12.88
steps    |     374 |  

attitude |    0.03    0.07    0.19 |    1.20    0.66    1.85 |   -3.14   -1.56   -3.14 |    3.14    1.57    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.06   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.07    0.26 |    0.65    1.84 |   -1.49   -3.13 |    1.43    3.14
w_f      |   -0.00    0.00    0.00 |    0.02    0.01    0.01 |   -0.06   -0.02   -0.03 |    0.05    0.04    0.03
w_rewards |   -0.00 |    0.00 |   -0.07 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.29 |    0.26 |    0.00 |    1.45
seeker_angles |    0.00    0.00 |    0.09    0.09 |   -1.00   -0.97 |    1.00    1.00
cs_angles |  0.0024  0.0017 |  0.0864  0.0867 | -0.9964 -0.9660 |  0.9982  1.0000
optical_flow | -0.0000  0.0000 |  0.0258  0.0268 | -1.0499 -1.0982 |  0.9792  1.1208
v_err    | -0.0092 |  0.0590 | -0.4537 |  0.1469
landing_rewards |    8.03 |    3.98 |    0.00 |   10.00
landing_margin |   -0

attitude |   -0.04    0.00   -0.13 |    1.18    0.69    1.84 |   -3.14   -1.57   -3.14 |    3.14    1.56    3.14
w        |   -0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.06   -0.05   -0.05 |    0.06    0.05    0.05
a_f      |    0.00   -0.19 |    0.68    1.82 |   -1.53   -3.13 |    1.52    3.14
w_f      |   -0.00    0.00   -0.00 |    0.02    0.01    0.01 |   -0.06   -0.04   -0.03 |    0.06    0.03    0.03
w_rewards |   -0.00 |    0.00 |   -0.06 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.28 |    0.25 |    0.00 |    1.56
seeker_angles |    0.00    0.00 |    0.08    0.09 |   -1.00   -0.99 |    1.00    0.99
cs_angles |  0.0010  0.0034 |  0.0837  0.0882 | -0.9963 -0.9873 |  0.9980  0.9926
optical_flow | -0.0000 -0.0000 |  0.0272  0.0260 | -1.1845 -1.0704 |  1.1229  1.2976
v_err    | -0.0089 |  0.0587 | -0.4521 |  0.1284
landing_rewards |    8.13 |    3.90 |    0.00 |   10.00
landing_margin |   -0

w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.00    0.06 |    0.69    1.78 |   -1.54   -3.14 |    1.44    3.11
w_f      |   -0.00    0.00    0.00 |    0.02    0.01    0.01 |   -0.05   -0.03   -0.02 |    0.05    0.04    0.03
w_rewards |   -0.00 |    0.00 |   -0.02 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.29 |    0.26 |    0.00 |    1.48
seeker_angles |    0.00    0.00 |    0.09    0.09 |   -0.99   -1.00 |    0.99    0.98
cs_angles |  0.0009  0.0028 |  0.0887  0.0885 | -0.9948 -0.9991 |  0.9923  0.9814
optical_flow |  0.0002 -0.0001 |  0.0266  0.0263 | -1.0732 -1.1593 |  1.3220  1.2072
v_err    | -0.0092 |  0.0584 | -0.4526 |  0.1434
landing_rewards |    8.06 |    3.95 |    0.00 |   10.00
landing_margin |   -0.02 |    0.02 |   -0.07 |    0.05
tracking_rewards |  -22.63 |    5.19 |  -45.62 |  -13.24
steps    |     375 |  

attitude |    0.04    0.02    0.04 |    1.17    0.63    1.82 |   -3.14   -1.57   -3.14 |    3.14    1.47    3.14
w        |   -0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.06   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.01   -0.04 |    0.63    1.83 |   -1.51   -3.13 |    1.40    3.09
w_f      |    0.00    0.00    0.00 |    0.02    0.01    0.01 |   -0.06   -0.02   -0.03 |    0.05    0.03    0.04
w_rewards |   -0.00 |    0.01 |   -0.09 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.28 |    0.25 |    0.00 |    1.48
seeker_angles |    0.00    0.01 |    0.09    0.08 |   -0.99   -1.00 |    0.99    0.99
cs_angles |  0.0050  0.0059 |  0.0855  0.0835 | -0.9924 -0.9985 |  0.9911  0.9942
optical_flow | -0.0000 -0.0001 |  0.0259  0.0256 | -1.1279 -0.9841 |  1.2242  1.1016
v_err    | -0.0093 |  0.0584 | -0.4536 |  0.1516
landing_rewards |    8.42 |    3.65 |    0.00 |   10.00
landing_margin |   -0

w        |   -0.00    0.00   -0.00 |    0.01    0.00    0.01 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.02    0.12 |    0.68    1.92 |   -1.45   -3.14 |    1.52    3.12
w_f      |   -0.00    0.00    0.00 |    0.02    0.01    0.01 |   -0.05   -0.02   -0.03 |    0.05    0.04    0.04
w_rewards |   -0.00 |    0.00 |   -0.04 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.28 |    0.25 |    0.00 |    1.57
seeker_angles |    0.00    0.00 |    0.08    0.09 |   -1.00   -0.96 |    1.00    0.99
cs_angles |  0.0021  0.0034 |  0.0815  0.0898 | -0.9950 -0.9575 |  0.9983  0.9930
optical_flow |  0.0001 -0.0000 |  0.0268  0.0263 | -1.3602 -1.0347 |  1.5118  1.2775
v_err    | -0.0097 |  0.0587 | -0.4524 |  0.1424
landing_rewards |    8.77 |    3.28 |    0.00 |   10.00
landing_margin |   -0.02 |    0.02 |   -0.06 |    0.05
tracking_rewards |  -22.08 |    5.19 |  -49.92 |  -13.06
steps    |     376 |  

attitude |    0.04   -0.06    0.06 |    1.26    0.68    1.91 |   -3.14   -1.55   -3.14 |    3.14    1.56    3.14
w        |   -0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.06   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.05    0.01 |    0.67    1.87 |   -1.43   -3.14 |    1.49    3.14
w_f      |   -0.00    0.00    0.00 |    0.02    0.01    0.01 |   -0.06   -0.03   -0.03 |    0.04    0.03    0.02
w_rewards |   -0.00 |    0.01 |   -0.09 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.28 |    0.25 |    0.00 |    1.65
seeker_angles |    0.00    0.01 |    0.09    0.09 |   -0.98   -0.99 |    0.99    0.99
cs_angles |  0.0033  0.0050 |  0.0862  0.0869 | -0.9819 -0.9883 |  0.9925  0.9928
optical_flow |  0.0001  0.0002 |  0.0265  0.0254 | -1.1946 -0.8617 |  1.1697  1.3774
v_err    | -0.0093 |  0.0587 | -0.4961 |  0.1379
landing_rewards |    8.48 |    3.59 |    0.00 |   10.00
landing_margin |   -0

attitude |   -0.09   -0.01   -0.05 |    1.22    0.64    1.94 |   -3.14   -1.51   -3.14 |    3.14    1.57    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.06   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.03   -0.04 |    0.63    1.93 |   -1.46   -3.14 |    1.49    3.14
w_f      |   -0.00    0.00    0.00 |    0.02    0.01    0.01 |   -0.06   -0.03   -0.02 |    0.05    0.03    0.03
w_rewards |   -0.00 |    0.00 |   -0.07 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.29 |    0.26 |    0.00 |    1.64
seeker_angles |    0.01    0.01 |    0.09    0.09 |   -0.99   -0.99 |    0.99    0.99
cs_angles |  0.0067  0.0050 |  0.0865  0.0915 | -0.9931 -0.9932 |  0.9927  0.9902
optical_flow |  0.0001  0.0000 |  0.0264  0.0258 | -1.0916 -1.1771 |  1.1623  1.0745
v_err    | -0.0092 |  0.0586 | -0.4517 |  0.1605
landing_rewards |    8.55 |    3.52 |    0.00 |   10.00
landing_margin |   -0

attitude |   -0.15    0.01    0.02 |    1.15    0.65    1.85 |   -3.14   -1.57   -3.14 |    3.14    1.57    3.14
w        |   -0.00    0.00   -0.00 |    0.01    0.01    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.01   -0.00 |    0.65    1.85 |   -1.52   -3.14 |    1.45    3.14
w_f      |   -0.00    0.00    0.00 |    0.02    0.01    0.01 |   -0.05   -0.02   -0.03 |    0.05    0.03    0.03
w_rewards |   -0.00 |    0.00 |   -0.05 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.29 |    0.26 |    0.00 |    1.45
seeker_angles |    0.01    0.00 |    0.08    0.09 |   -1.00   -1.00 |    1.00    0.99
cs_angles |  0.0088  0.0037 |  0.0834  0.0927 | -0.9961 -0.9993 |  0.9965  0.9947
optical_flow | -0.0001  0.0001 |  0.0252  0.0249 | -1.1330 -0.9737 |  1.2557  1.2074
v_err    | -0.0090 |  0.0582 | -0.4523 |  0.1549
landing_rewards |    8.32 |    3.74 |    0.00 |   10.00
landing_margin |   -0

w        |   -0.00    0.00   -0.00 |    0.01    0.00    0.01 |   -0.06   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.01   -0.01 |    0.67    1.92 |   -1.46   -3.13 |    1.42    3.10
w_f      |   -0.00    0.00    0.00 |    0.02    0.01    0.01 |   -0.06   -0.03   -0.03 |    0.05    0.03    0.03
w_rewards |   -0.00 |    0.00 |   -0.05 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.29 |    0.25 |    0.00 |    1.47
seeker_angles |    0.01    0.00 |    0.08    0.09 |   -0.99   -1.00 |    0.99    0.98
cs_angles |  0.0079  0.0020 |  0.0849  0.0899 | -0.9905 -0.9985 |  0.9863  0.9796
optical_flow |  0.0001 -0.0001 |  0.0255  0.0245 | -0.9691 -1.0724 |  1.0694  0.9489
v_err    | -0.0091 |  0.0581 | -0.4521 |  0.1236
landing_rewards |    9.16 |    2.77 |    0.00 |   10.00
landing_margin |   -0.02 |    0.02 |   -0.07 |    0.03
tracking_rewards |  -22.62 |    5.15 |  -47.66 |  -14.15
steps    |     377 |  

glideslope |    2.80 |   12.84 |    0.01 |  346.60
norm_af  |    1.73 |    0.89 |    0.11 |    3.37
norm_wf  |    0.02 |    0.01 |    0.00 |    0.06
rh_penalty |    0.00 |    0.00 |    0.00 |    0.00
att_rewards |    0.00 |    0.00 |    0.00 |    0.00
att_penalty |    0.00 |    0.00 |    0.00 |    0.00
attitude |    0.19   -0.05    0.11 |    1.13    0.67    1.81 |   -3.14   -1.57   -3.14 |    3.14    1.55    3.14
w        |   -0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.05    0.10 |    0.68    1.82 |   -1.47   -3.09 |    1.50    3.13
w_f      |   -0.00    0.00   -0.00 |    0.02    0.01    0.01 |   -0.05   -0.03   -0.04 |    0.05    0.02    0.03
w_rewards |   -0.00 |    0.00 |   -0.05 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.29 |    0.26 |    0.00 |    1.48
seeker_angles |    0.00    0.00 |    0.09    0.09 |   -0.99   -1.00 |    0.

attitude |   -0.08    0.05    0.05 |    1.17    0.67    1.82 |   -3.14   -1.56   -3.14 |    3.14    1.52    3.14
w        |   -0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.04    0.07 |    0.66    1.83 |   -1.44   -3.14 |    1.50    3.13
w_f      |    0.00    0.00    0.00 |    0.02    0.01    0.01 |   -0.05   -0.04   -0.03 |    0.05    0.03    0.04
w_rewards |   -0.00 |    0.00 |   -0.04 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.29 |    0.25 |    0.00 |    1.46
seeker_angles |    0.00    0.00 |    0.08    0.09 |   -1.00   -0.98 |    0.99    1.00
cs_angles |  0.0048  0.0028 |  0.0839  0.0890 | -0.9958 -0.9824 |  0.9881  0.9988
optical_flow |  0.0000  0.0000 |  0.0269  0.0251 | -1.0901 -1.3198 |  1.1566  1.0486
v_err    | -0.0101 |  0.0585 | -0.4549 |  0.1429
landing_rewards |    8.55 |    3.52 |    0.00 |   10.00
landing_margin |   -0

attitude |    0.01    0.02   -0.07 |    1.15    0.66    1.89 |   -3.14   -1.55   -3.14 |    3.14    1.57    3.14
w        |   -0.00    0.00   -0.00 |    0.01    0.00    0.01 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.03   -0.16 |    0.67    1.88 |   -1.48   -3.14 |    1.46    3.14
w_f      |   -0.00    0.00    0.00 |    0.02    0.01    0.01 |   -0.05   -0.02   -0.04 |    0.04    0.03    0.03
w_rewards |   -0.00 |    0.00 |   -0.04 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.28 |    0.24 |    0.00 |    1.36
seeker_angles |    0.01    0.00 |    0.08    0.09 |   -0.99   -1.00 |    0.96    1.00
cs_angles |  0.0058  0.0013 |  0.0804  0.0859 | -0.9903 -0.9992 |  0.9615  0.9953
optical_flow | -0.0000  0.0001 |  0.0270  0.0253 | -1.0646 -1.1682 |  1.1456  1.1044
v_err    | -0.0100 |  0.0581 | -0.4533 |  0.1328
landing_rewards |    8.87 |    3.16 |    0.00 |   10.00
landing_margin |   -0

thrust   |    0.01    0.00   -0.00 |    0.70    0.71    0.70 |   -3.44   -3.34   -3.45 |    3.44    3.39    3.40
norm_thrust |    0.95 |    0.75 |    0.00 |    3.46
fuel     |    1.66 |    0.23 |    1.16 |    2.71
rewards  |  -18.10 |    6.77 |  -61.11 |   -7.54
fuel_rewards |   -4.77 |    0.66 |   -7.74 |   -3.34
glideslope_rewards |    0.00 |    0.00 |    0.00 |    0.00
glideslope_penalty |    0.00 |    0.00 |    0.00 |    0.00
glideslope |    2.86 |   13.14 |    0.01 |  190.65
norm_af  |    1.72 |    0.89 |    0.10 |    3.35
norm_wf  |    0.02 |    0.01 |    0.00 |    0.05
rh_penalty |    0.00 |    0.00 |    0.00 |    0.00
att_rewards |    0.00 |    0.00 |    0.00 |    0.00
att_penalty |    0.00 |    0.00 |    0.00 |    0.00
attitude |    0.06   -0.01   -0.13 |    1.20    0.68    1.81 |   -3.14   -1.57   -3.14 |    3.14    1.57    3.14
w        |   -0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.01   -0.15 |    0.67

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.0381   0.4732   2.1608  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0028   0.0016   0.0059   5.4889   2.1784   2.1397
Update Cnt = 960    ET =   1149.6   Stats:  Mean, Std, Min, Max
r_f      |   -8.62   -0.26  -12.55 |  187.49  162.68  200.75 | -361.77 -383.28 -389.98 |  392.71  376.35  395.96
v_f      |    0.00    0.00    0.00 |    0.05    0.04    0.05 |   -0.12   -0.10   -0.11 |    0.12    0.11    0.10
r_i      |  -61.44  -22.33  -51.41 |  723.97  632.35  739.56 |-1371.70-1330.87-1281.60 | 1379.18 1239.91 1226.85
v_i      |    0.00    0.00    0.00 |    0.04    0.04    0.05 |   -0.09   -0.09   -0.09 |    0.09    0.10    0.09
norm_rf  |    0.29 |    0.12 |    0.04 |    0.79
norm_vf  |    0.08 |    0.02 |    0.03 |    0.14
gs_f     |    1.09 |    1.37 |    0.01 |   12.01
thrust   |   -0.00   -0.00    0.01 |    0.69    0.70    0.69 |   -3.36   -3.45   -3.46 |    3.31    3.24    3.43
norm_thrust |    0

ADV1:  0.0026100828779043366 0.011769305950691955 0.04912156486481903 -0.09519641503587098
ADV2:  0.0027418303698143257 0.8876796111598277 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.8396   0.9226   4.7373  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0044   0.0024   0.0080   5.4889   2.1784   2.1397
***** Episode 30076, Mean R = -18.6  Std R = 7.1  Min R = -39.6
PolicyLoss: -0.0221
Policy_Beta: 0.1
Policy_Entropy: 0.132
Policy_KL: 0.00102
Policy_SD: 0.557
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 1.04e+07
VF_0_ExplainedVarNew: 0.954
VF_0_ExplainedVarOld: 0.947
VF_0_Loss : 0.0354


ADV1:  -0.0014721489843254995 0.011450369390062427 0.07647498335845898 -0.07984999228208733
ADV2:  0.019794635927425253 0.9122896144463202 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.8458   1.3052   6.8141  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0028   0.0016   0.0052   5.4889   2.1784   2.13

ADV1:  0.003962562848748418 0.010003609752135012 0.08224753903672777 -0.07965024776080334
ADV2:  -0.002661651855317265 0.8646166532083028 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.7376   0.8485   3.6199  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0044   0.0028   0.0102   5.4889   2.1784   2.1397
***** Episode 30355, Mean R = -16.8  Std R = 7.4  Min R = -39.2
PolicyLoss: -0.0228
Policy_Beta: 0.1
Policy_Entropy: 0.133
Policy_KL: 0.00134
Policy_SD: 0.553
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 1.05e+07
VF_0_ExplainedVarNew: 0.965
VF_0_ExplainedVarOld: 0.961
VF_0_Loss : 0.0365


ADV1:  -0.0018392415451420666 0.007818208725826692 0.055186431133465164 -0.05676994958982334
ADV2:  0.028620990030515953 0.8782149887996249 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.1497   0.5011   2.5344  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0019   0.0012   0.0047   5.4889   2.1784   2.13

ADV1:  0.0016700906583214346 0.010629931418685602 0.05546911856411224 -0.07491934230503972
ADV2:  -0.003288271371975254 0.9130275441505589 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.8274   0.3370   1.7635  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0027   0.0014   0.0055   5.4889   2.1784   2.1397
***** Episode 30634, Mean R = -18.9  Std R = 6.1  Min R = -31.6
PolicyLoss: -0.0126
Policy_Beta: 0.1
Policy_Entropy: 0.133
Policy_KL: 0.000904
Policy_SD: 0.568
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 1.06e+07
VF_0_ExplainedVarNew: 0.964
VF_0_ExplainedVarOld: 0.957
VF_0_Loss : 0.0324


Dynamics: Max Disturbance (m/s^2):  [0.00138293 0.00181235 0.00221757] 0.0031803638227355514
ADV1:  -0.0006778726933408992 0.011455410424918731 0.07644343641202783 -0.06631581688359324
ADV2:  0.01613426045350999 0.8981564312723811 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.1168   0.7202   3.5254  24.0260  15.5251  10.0673
ValFun 

ADV1:  -0.0032560332692238452 0.010196044170423135 0.05205683469772343 -0.14235062915238111
ADV2:  0.04217283678265055 0.8536509256953508 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.9576   0.5502   2.1345  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0044   0.0025   0.0094   5.4889   2.1784   2.1397
***** Episode 30913, Mean R = -16.0  Std R = 6.0  Min R = -32.2
PolicyLoss: -0.0257
Policy_Beta: 0.1
Policy_Entropy: 0.134
Policy_KL: 0.000944
Policy_SD: 0.56
Policy_lr_mult: 0.198
Steps: 1.15e+04
TotalSteps: 1.07e+07
VF_0_ExplainedVarNew: 0.96
VF_0_ExplainedVarOld: 0.953
VF_0_Loss : 0.0265


Dynamics: Max Disturbance (m/s^2):  [0.00138293 0.00181235 0.00221757] 0.0031803638227355514
ADV1:  -0.0006679080092027652 0.009239605593067395 0.08258271596399314 -0.06429750157663588
ADV2:  0.009562781872532703 0.9193927354986534 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.0029   0.4230   2.2124  24.0260  15.5251  10.0673
ValFun  G

ADV1:  3.642180504973736e-05 0.011611371091479016 0.05573905001667456 -0.07496805228662676
ADV2:  0.014929260358352792 0.8951310954071947 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.8993   1.5391   7.6275  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0005   0.0004   0.0015   5.4889   2.1784   2.1397
***** Episode 31192, Mean R = -16.7  Std R = 5.8  Min R = -30.2
PolicyLoss: -0.0189
Policy_Beta: 0.1
Policy_Entropy: 0.134
Policy_KL: 0.000823
Policy_SD: 0.555
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 1.08e+07
VF_0_ExplainedVarNew: 0.938
VF_0_ExplainedVarOld: 0.932
VF_0_Loss : 0.00753


Dynamics: Max Disturbance (m/s^2):  [0.00138293 0.00181235 0.00221757] 0.0031803638227355514
ADV1:  0.0016858972322046073 0.009528235328127719 0.058590113869350986 -0.04787716209888454
ADV2:  -0.009045502155251456 0.9149115780488138 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.3029   0.6292   3.2827  24.0260  15.5251  10.0673
ValFu

Dynamics: Max Disturbance (m/s^2):  [0.00138293 0.00181235 0.00221757] 0.0031803638227355514
ADV1:  0.0006063207531955129 0.010703759312326167 0.06228257456542585 -0.08026496677541783
ADV2:  0.004624795923384376 0.9292712380063193 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.3092   0.8585   4.5391  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0008   0.0005   0.0017   5.4889   2.1784   2.1397
***** Episode 31471, Mean R = -16.6  Std R = 5.8  Min R = -30.1
PolicyLoss: -0.0112
Policy_Beta: 0.1
Policy_Entropy: 0.132
Policy_KL: 0.00089
Policy_SD: 0.555
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 1.09e+07
VF_0_ExplainedVarNew: 0.953
VF_0_ExplainedVarOld: 0.945
VF_0_Loss : 0.0221


ADV1:  -0.0024725119216469573 0.012229083036332614 0.10169214786766118 -0.07244607959701947
ADV2:  0.029563973949789164 0.8859265387806294 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.1498   0.7782   3.5615  24.0260  15.5251  10.0673
ValFun  

Dynamics: Max Disturbance (m/s^2):  [0.00138293 0.00181235 0.00221757] 0.0031803638227355514
ADV1:  -0.0006550634660720763 0.01087920147527504 0.0644259801334241 -0.07534709836913084
ADV2:  0.020761564214499685 0.8929142192357705 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.8801   1.0034   4.7484  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0007   0.0004   0.0017   5.4889   2.1784   2.1397
***** Episode 31750, Mean R = -16.7  Std R = 6.2  Min R = -38.5
PolicyLoss: -0.0214
Policy_Beta: 0.1
Policy_Entropy: 0.131
Policy_KL: 0.0012
Policy_SD: 0.562
Policy_lr_mult: 0.198
Steps: 1.15e+04
TotalSteps: 1.1e+07
VF_0_ExplainedVarNew: 0.952
VF_0_ExplainedVarOld: 0.949
VF_0_Loss : 0.0222


ADV1:  -0.0006414631397738757 0.01103827894382343 0.0391200506009258 -0.0718944239758843
ADV2:  0.019876377382400345 0.9047551426239904 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.7781   0.9481   4.2540  24.0260  15.5251  10.0673
ValFun  Gradie

***** Episode 31998, Mean R = -16.3  Std R = 4.7  Min R = -29.1
PolicyLoss: -0.0239
Policy_Beta: 0.1
Policy_Entropy: 0.133
Policy_KL: 0.000716
Policy_SD: 0.568
Policy_lr_mult: 0.198
Steps: 1.18e+04
TotalSteps: 1.11e+07
VF_0_ExplainedVarNew: 0.968
VF_0_ExplainedVarOld: 0.957
VF_0_Loss : 0.0219


ADV1:  -0.001857359139607832 0.009687806371260065 0.04892208669928041 -0.08453443186241336
ADV2:  0.03439341553775644 0.8355345677325282 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.4340   0.7671   4.0829  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0036   0.0019   0.0070   5.4889   2.1784   2.1397
***** Episode 32029, Mean R = -15.9  Std R = 5.4  Min R = -29.4
PolicyLoss: -0.0246
Policy_Beta: 0.1
Policy_Entropy: 0.133
Policy_KL: 0.00104
Policy_SD: 0.57
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 1.11e+07
VF_0_ExplainedVarNew: 0.96
VF_0_ExplainedVarOld: 0.955
VF_0_Loss : 0.0213


ADV1:  -0.0033615229998188744 0.011386303738808834 0.075785

***** Episode 32277, Mean R = -18.0  Std R = 13.0  Min R = -76.5
PolicyLoss: 0.046
Policy_Beta: 0.1
Policy_Entropy: 0.134
Policy_KL: 0.00113
Policy_SD: 0.576
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 1.12e+07
VF_0_ExplainedVarNew: 0.964
VF_0_ExplainedVarOld: 0.784
VF_0_Loss : 0.0228


ADV1:  -0.0036351919515241362 0.01211244262826504 0.07115444721862357 -0.0632092759092126
ADV2:  0.023739662403155618 0.9441189942319352 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.1233   1.4464   6.2410  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0043   0.0025   0.0095   5.4889   2.1784   2.1397
***** Episode 32308, Mean R = -17.0  Std R = 6.0  Min R = -35.7
PolicyLoss: -0.00446
Policy_Beta: 0.1
Policy_Entropy: 0.133
Policy_KL: 0.000918
Policy_SD: 0.568
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 1.12e+07
VF_0_ExplainedVarNew: 0.941
VF_0_ExplainedVarOld: 0.932
VF_0_Loss : 0.0172


ADV1:  -0.0016496167538138887 0.013281179477750406 0.0923

seeker_angles |    0.00    0.00 |    0.09    0.09 |   -1.00   -0.99 |    0.99    0.99
cs_angles |  0.0041  0.0023 |  0.0860  0.0894 | -0.9991 -0.9910 |  0.9875  0.9853
optical_flow |  0.0001  0.0001 |  0.0258  0.0253 | -0.8694 -1.3846 |  1.1095  0.9705
v_err    | -0.0094 |  0.0578 | -0.4542 |  0.1170
landing_rewards |    8.65 |    3.42 |    0.00 |   10.00
landing_margin |   -0.02 |    0.02 |   -0.07 |    0.07
tracking_rewards |  -21.46 |    4.67 |  -48.45 |  -13.69
steps    |     377 |      21 |     334 |     418
***** Episode 32587, Mean R = -17.5  Std R = 5.2  Min R = -28.0
PolicyLoss: -0.0117
Policy_Beta: 0.1
Policy_Entropy: 0.133
Policy_KL: 0.00122
Policy_SD: 0.564
Policy_lr_mult: 0.198
Steps: 1.18e+04
TotalSteps: 1.13e+07
VF_0_ExplainedVarNew: 0.945
VF_0_ExplainedVarOld: 0.941
VF_0_Loss : 0.0326


ADV1:  0.0016302011916623435 0.010548813052561667 0.06264440056984771 -0.056157108873915784
ADV2:  0.0007990811855541424 0.9164822561536674 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max

attitude |   -0.07    0.03   -0.07 |    1.22    0.68    1.92 |   -3.14   -1.57   -3.14 |    3.14    1.57    3.14
w        |   -0.00    0.00   -0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.02   -0.03 |    0.66    1.93 |   -1.51   -3.14 |    1.47    3.13
w_f      |   -0.00    0.00    0.00 |    0.02    0.01    0.01 |   -0.05   -0.02   -0.03 |    0.05    0.03    0.03
w_rewards |    0.00 |    0.00 |    0.00 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.26 |    0.25 |    0.00 |    1.48
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -1.00   -1.00 |    0.98    0.98
cs_angles |  0.0027  0.0010 |  0.0845  0.0845 | -0.9999 -0.9989 |  0.9805  0.9766
optical_flow |  0.0002 -0.0000 |  0.0277  0.0272 | -1.1064 -1.4101 |  1.2092  1.2903
v_err    | -0.0100 |  0.0582 | -0.4528 |  0.1271
landing_rewards |    8.84 |    3.20 |    0.00 |   10.00
landing_margin |   -0

attitude |   -0.01    0.06    0.02 |    1.12    0.68    1.79 |   -3.14   -1.55   -3.14 |    3.14    1.55    3.14
w        |   -0.00    0.00   -0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.06    0.13 |    0.68    1.79 |   -1.51   -3.14 |    1.46    3.13
w_f      |   -0.00    0.00    0.00 |    0.02    0.01    0.01 |   -0.05   -0.02   -0.03 |    0.05    0.03    0.04
w_rewards |   -0.00 |    0.00 |   -0.02 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.27 |    0.25 |    0.00 |    1.57
seeker_angles |    0.00    0.00 |    0.08    0.09 |   -0.98   -1.00 |    1.00    1.00
cs_angles |  0.0019  0.0026 |  0.0831  0.0862 | -0.9835 -0.9953 |  0.9965  0.9977
optical_flow |  0.0001 -0.0001 |  0.0260  0.0252 | -1.1167 -1.2995 |  1.1703  0.9269
v_err    | -0.0097 |  0.0583 | -0.5000 |  0.1330
landing_rewards |    8.97 |    3.04 |    0.00 |   10.00
landing_margin |   -0

thrust   |    0.00    0.00    0.00 |    0.69    0.69    0.70 |   -3.22   -3.45   -3.44 |    3.35    3.39    3.45
norm_thrust |    0.94 |    0.75 |    0.00 |    3.46
fuel     |    1.67 |    0.20 |    1.25 |    2.27
rewards  |  -16.23 |    6.00 |  -43.96 |   -4.88
fuel_rewards |   -4.77 |    0.57 |   -6.48 |   -3.57
glideslope_rewards |    0.00 |    0.00 |    0.00 |    0.00
glideslope_penalty |    0.00 |    0.00 |    0.00 |    0.00
glideslope |    2.91 |   13.03 |    0.01 |  720.62
norm_af  |    1.62 |    0.89 |    0.03 |    3.27
norm_wf  |    0.02 |    0.01 |    0.00 |    0.06
rh_penalty |    0.00 |    0.00 |    0.00 |    0.00
att_rewards |    0.00 |    0.00 |    0.00 |    0.00
att_penalty |    0.00 |    0.00 |    0.00 |    0.00
attitude |    0.02   -0.02    0.07 |    1.06    0.66    1.72 |   -3.14   -1.57   -3.14 |    3.14    1.56    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.00    0.01 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.02    0.14 |    0.66

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.2967   1.5819   8.1673  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0057   0.0036   0.0124   5.4889   2.1784   2.1397
Update Cnt = 1090    ET =   1169.0   Stats:  Mean, Std, Min, Max
r_f      |    4.27   -0.34   -8.98 |  179.28  169.56  207.32 | -390.90 -397.09 -382.95 |  398.48  397.20  387.01
v_f      |   -0.00   -0.00    0.00 |    0.04    0.05    0.05 |   -0.11   -0.11   -0.12 |    0.11    0.13    0.12
r_i      |    3.45   19.31  -43.94 |  670.63  646.09  783.40 |-1313.92-1290.43-1292.83 | 1338.60 1313.65 1344.44
v_i      |    0.00   -0.00    0.00 |    0.04    0.04    0.05 |   -0.10   -0.09   -0.09 |    0.09    0.09    0.09
norm_rf  |    0.27 |    0.11 |    0.03 |    0.65
norm_vf  |    0.08 |    0.02 |    0.04 |    0.13
gs_f     |    1.52 |    2.45 |    0.01 |   27.60
thrust   |   -0.00    0.01   -0.00 |    0.69    0.71    0.69 |   -3.36   -3.45   -3.44 |    3.45    3.45    3.39
norm_thrust |    

ADV1:  0.0007495651611409971 0.010939821442262217 0.05241093510920031 -0.06669405589456347
ADV2:  0.01506795447698454 0.8754065795023586 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.8815   0.7980   4.3593  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0016   0.0010   0.0035   5.4889   2.1784   2.1397
***** Episode 34106, Mean R = -16.4  Std R = 6.4  Min R = -29.3
PolicyLoss: -0.0241
Policy_Beta: 0.1
Policy_Entropy: 0.135
Policy_KL: 0.000883
Policy_SD: 0.568
Policy_lr_mult: 0.198
Steps: 1.18e+04
TotalSteps: 1.19e+07
VF_0_ExplainedVarNew: 0.945
VF_0_ExplainedVarOld: 0.943
VF_0_Loss : 0.0163


Dynamics: Max Disturbance (m/s^2):  [0.00138293 0.00181235 0.00221757] 0.0031803638227355514
ADV1:  -0.000838656300754582 0.010539196900649743 0.07299144399891672 -0.06027771094157759
ADV2:  0.012324195123391507 0.903436681828369 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.1658   0.7903   4.2538  24.0260  15.5251  10.0673
ValFun  Gr

ADV1:  -0.00010309294105067533 0.010711285926835826 0.037887471132239156 -0.1152771285627206
ADV2:  0.02406258274568919 0.8654891860794279 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.0507   0.4525   2.6282  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0002   0.0001   0.0004   5.4889   2.1784   2.1397
***** Episode 34385, Mean R = -16.4  Std R = 6.3  Min R = -31.3
PolicyLoss: -0.0275
Policy_Beta: 0.1
Policy_Entropy: 0.134
Policy_KL: 0.000948
Policy_SD: 0.563
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 1.2e+07
VF_0_ExplainedVarNew: 0.955
VF_0_ExplainedVarOld: 0.95
VF_0_Loss : 0.0117


Dynamics: Max Disturbance (m/s^2):  [0.00138293 0.00181235 0.00221757] 0.0031803638227355514
ADV1:  -0.00280633117620589 0.012545484369855845 0.0662121925414732 -0.0710274059537975
ADV2:  0.020383264927915347 0.9267811672349294 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.0322   0.7804   4.0619  24.0260  15.5251  10.0673
ValFun  Grad

Dynamics: Max Disturbance (m/s^2):  [0.00138293 0.00181235 0.00221757] 0.0031803638227355514
ADV1:  0.0024109430927308504 0.006694254954323108 0.05256553103708017 -0.06620723523982336
ADV2:  -0.033519471904099166 0.9074172140104566 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.0318   1.6457   7.9537  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0027   0.0018   0.0064   5.4889   2.1784   2.1397
***** Episode 34664, Mean R = -14.7  Std R = 4.5  Min R = -24.3
PolicyLoss: 0.000645
Policy_Beta: 0.1
Policy_Entropy: 0.136
Policy_KL: 0.000789
Policy_SD: 0.564
Policy_lr_mult: 0.198
Steps: 1.18e+04
TotalSteps: 1.21e+07
VF_0_ExplainedVarNew: 0.983
VF_0_ExplainedVarOld: 0.979
VF_0_Loss : 0.0179


ADV1:  -0.005698084039107571 0.012739576003941419 0.03975593470597466 -0.09294775375082033
ADV2:  0.05097701478353547 0.8743260978931511 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.3111   0.7568   4.1213  24.0260  15.5251  10.0673
ValFun 

Dynamics: Max Disturbance (m/s^2):  [0.00138293 0.00181235 0.00221757] 0.0031803638227355514
ADV1:  0.0010518998839997944 0.007859353237391674 0.08070984550207905 -0.0590263005920961
ADV2:  0.0035205326942584114 0.8861938968637149 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.4180   1.3256   7.3795  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0013   0.0007   0.0027   5.4889   2.1784   2.1397
***** Episode 34943, Mean R = -15.4  Std R = 5.3  Min R = -26.6
PolicyLoss: -0.0156
Policy_Beta: 0.1
Policy_Entropy: 0.137
Policy_KL: 0.000844
Policy_SD: 0.558
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 1.22e+07
VF_0_ExplainedVarNew: 0.978
VF_0_ExplainedVarOld: 0.974
VF_0_Loss : 0.0325


ADV1:  5.034708079869482e-05 0.006999865954044616 0.04019562065673282 -0.05013658744011807
ADV2:  0.01087957950302669 0.8934711803022083 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.8762   0.3208   1.9839  24.0260  15.5251  10.0673
ValFun  G

***** Episode 35191, Mean R = -15.1  Std R = 4.8  Min R = -25.7
PolicyLoss: -0.0209
Policy_Beta: 0.1
Policy_Entropy: 0.138
Policy_KL: 0.000941
Policy_SD: 0.551
Policy_lr_mult: 0.198
Steps: 1.19e+04
TotalSteps: 1.23e+07
VF_0_ExplainedVarNew: 0.977
VF_0_ExplainedVarOld: 0.974
VF_0_Loss : 0.0113


ADV1:  -0.0019165884178479215 0.00960540567291063 0.050805510083834375 -0.08405282344892283
ADV2:  0.035619436378549654 0.8495550222444589 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.1040   1.2910   6.6201  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0024   0.0014   0.0050   5.4889   2.1784   2.1397
***** Episode 35222, Mean R = -15.6  Std R = 5.4  Min R = -31.5
PolicyLoss: -0.0289
Policy_Beta: 0.1
Policy_Entropy: 0.136
Policy_KL: 0.00092
Policy_SD: 0.552
Policy_lr_mult: 0.198
Steps: 1.19e+04
TotalSteps: 1.23e+07
VF_0_ExplainedVarNew: 0.96
VF_0_ExplainedVarOld: 0.955
VF_0_Loss : 0.0105


ADV1:  0.001772880764845282 0.008800513671170445 0.05861

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.8264   1.0421   4.3964  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0031   0.0020   0.0066   5.4889   2.1784   2.1397
***** Episode 35470, Mean R = -15.2  Std R = 5.3  Min R = -28.7
PolicyLoss: -0.00191
Policy_Beta: 0.1
Policy_Entropy: 0.138
Policy_KL: 0.00084
Policy_SD: 0.551
Policy_lr_mult: 0.198
Steps: 1.18e+04
TotalSteps: 1.24e+07
VF_0_ExplainedVarNew: 0.98
VF_0_ExplainedVarOld: 0.975
VF_0_Loss : 0.0163


ADV1:  -0.004367474420278841 0.010792858634172809 0.060419155457762386 -0.07591289137832874
ADV2:  0.04133058367971157 0.9203959785087356 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   3.2802   2.1064  10.8740  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0054   0.0033   0.0120   5.4889   2.1784   2.1397
***** Episode 35501, Mean R = -17.1  Std R = 6.6  Min R = -37.4
PolicyLoss: -0.0145
Policy_Beta: 0.1
Policy_Entropy: 0.137
Policy_KL: 0.00107
Poli

ADV1:  -0.0018819128996736825 0.011104163477773592 0.06206687981383244 -0.08170952158114259
ADV2:  0.025582934494806673 0.9037245299177888 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.0635   1.1048   5.8328  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0029   0.0016   0.0068   5.4889   2.1784   2.1397
***** Episode 35749, Mean R = -16.6  Std R = 5.6  Min R = -28.3
PolicyLoss: -0.0173
Policy_Beta: 0.1
Policy_Entropy: 0.137
Policy_KL: 0.00116
Policy_SD: 0.557
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 1.25e+07
VF_0_ExplainedVarNew: 0.941
VF_0_ExplainedVarOld: 0.937
VF_0_Loss : 0.0146


ADV1:  0.002148357667780524 0.008296561082592423 0.06001703254835228 -0.055326070968271274
ADV2:  -0.0033905445886170584 0.8916620257377631 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.2911   1.5026   8.1942  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0032   0.0017   0.0068   5.4889   2.1784   2.1

ADV1:  0.0017385372520850118 0.007833736915038789 0.04631139068598589 -0.04842039460094777
ADV2:  -0.0024864449542031423 0.9034717894994038 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.3965   0.5805   3.4238  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0019   0.0011   0.0046   5.4889   2.1784   2.1397
***** Episode 36028, Mean R = -16.2  Std R = 6.4  Min R = -30.1
PolicyLoss: -0.017
Policy_Beta: 0.1
Policy_Entropy: 0.139
Policy_KL: 0.00101
Policy_SD: 0.564
Policy_lr_mult: 0.198
Steps: 1.15e+04
TotalSteps: 1.26e+07
VF_0_ExplainedVarNew: 0.979
VF_0_ExplainedVarOld: 0.976
VF_0_Loss : 0.0121


ADV1:  -0.0029179977191443815 0.009174164098981585 0.04435639313888107 -0.06123809040554286
ADV2:  0.041533111792128 0.8844704161028395 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.1623   0.4576   2.5870  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0029   0.0019   0.0077   5.4889   2.1784   2.1397


optical_flow |  0.0001 -0.0001 |  0.0262  0.0253 | -1.2298 -1.2954 |  1.2272  1.4616
v_err    | -0.0102 |  0.0587 | -0.4530 |  0.1205
landing_rewards |    9.06 |    2.91 |    0.00 |   10.00
landing_margin |   -0.02 |    0.02 |   -0.06 |    0.04
tracking_rewards |  -20.63 |    4.47 |  -34.11 |  -11.07
steps    |     376 |      20 |     332 |     416
***** Episode 36307, Mean R = -15.9  Std R = 6.9  Min R = -27.8
PolicyLoss: -0.0263
Policy_Beta: 0.1
Policy_Entropy: 0.139
Policy_KL: 0.000952
Policy_SD: 0.567
Policy_lr_mult: 0.198
Steps: 1.15e+04
TotalSteps: 1.27e+07
VF_0_ExplainedVarNew: 0.964
VF_0_ExplainedVarOld: 0.962
VF_0_Loss : 0.0121


ADV1:  -0.0018077795086502923 0.01116495962423709 0.06910626399826136 -0.06613138568827746
ADV2:  0.027798556425938977 0.8896261321886436 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.2529   0.7936   4.1713  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0022   0.0014   0.0049   5.4889   2.1784   2.1397


w        |   -0.00    0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.00   -0.00 |    0.64    1.81 |   -1.45   -3.14 |    1.52    3.06
w_f      |   -0.00    0.00    0.00 |    0.02    0.01    0.01 |   -0.05   -0.03   -0.02 |    0.05    0.03    0.03
w_rewards |    0.00 |    0.00 |    0.00 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.26 |    0.25 |    0.00 |    1.35
seeker_angles |    0.00   -0.00 |    0.08    0.08 |   -1.00   -0.98 |    0.98    1.00
cs_angles |  0.0036 -0.0007 |  0.0802  0.0832 | -0.9982 -0.9840 |  0.9846  0.9980
optical_flow |  0.0001 -0.0001 |  0.0250  0.0253 | -0.9467 -1.0732 |  0.9448  1.1535
v_err    | -0.0094 |  0.0582 | -0.4997 |  0.1199
landing_rewards |    9.23 |    2.67 |    0.00 |   10.00
landing_margin |   -0.02 |    0.02 |   -0.06 |    0.03
tracking_rewards |  -19.85 |    4.74 |  -49.53 |  -11.24
steps    |     378 |  

attitude |    0.03   -0.05   -0.06 |    1.12    0.63    1.83 |   -3.14   -1.57   -3.14 |    3.14    1.48    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.05   -0.07 |    0.64    1.83 |   -1.47   -3.14 |    1.45    3.13
w_f      |   -0.00    0.00    0.00 |    0.02    0.01    0.01 |   -0.04   -0.03   -0.02 |    0.05    0.03    0.02
w_rewards |   -0.00 |    0.00 |   -0.02 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.27 |    0.25 |    0.00 |    1.45
seeker_angles |    0.01    0.00 |    0.08    0.08 |   -0.97   -1.00 |    0.99    1.00
cs_angles |  0.0061  0.0026 |  0.0821  0.0842 | -0.9700 -0.9986 |  0.9926  0.9953
optical_flow | -0.0000 -0.0001 |  0.0270  0.0263 | -1.0117 -1.2044 |  1.4370  0.9330
v_err    | -0.0095 |  0.0588 | -0.4513 |  0.1170
landing_rewards |    9.06 |    2.91 |    0.00 |   10.00
landing_margin |   -0

attitude |    0.10    0.10    0.19 |    1.13    0.63    1.84 |   -3.14   -1.55   -3.14 |    3.14    1.56    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.09    0.24 |    0.64    1.82 |   -1.45   -3.14 |    1.45    3.13
w_f      |   -0.00    0.00   -0.00 |    0.02    0.01    0.01 |   -0.05   -0.02   -0.02 |    0.04    0.03    0.03
w_rewards |   -0.00 |    0.00 |   -0.04 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.26 |    0.25 |    0.00 |    1.50
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -0.99   -0.96 |    0.98    0.98
cs_angles |  0.0036  0.0042 |  0.0828  0.0827 | -0.9942 -0.9643 |  0.9840  0.9808
optical_flow |  0.0001 -0.0001 |  0.0278  0.0247 | -1.3587 -1.0014 |  1.0821  1.1375
v_err    | -0.0096 |  0.0579 | -0.4529 |  0.1167
landing_rewards |    9.16 |    2.77 |    0.00 |   10.00
landing_margin |   -0

thrust   |    0.00   -0.00    0.00 |    0.68    0.68    0.68 |   -3.44   -3.40   -3.41 |    3.42    3.46    3.43
norm_thrust |    0.91 |    0.75 |    0.00 |    3.46
fuel     |    1.58 |    0.21 |    1.12 |    2.29
rewards  |  -15.55 |    5.93 |  -37.08 |   -6.46
fuel_rewards |   -4.52 |    0.61 |   -6.56 |   -3.20
glideslope_rewards |    0.00 |    0.00 |    0.00 |    0.00
glideslope_penalty |    0.00 |    0.00 |    0.00 |    0.00
glideslope |    2.96 |   12.83 |    0.00 |  534.50
norm_af  |    1.72 |    0.90 |    0.12 |    3.28
norm_wf  |    0.02 |    0.01 |    0.00 |    0.05
rh_penalty |    0.00 |    0.00 |    0.00 |    0.00
att_rewards |    0.00 |    0.00 |    0.00 |    0.00
att_penalty |    0.00 |    0.00 |    0.00 |    0.00
attitude |    0.05   -0.01    0.02 |    1.15    0.64    1.83 |   -3.14   -1.56   -3.14 |    3.14    1.55    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.02    0.03 |    0.64

ADV1:  -0.000253444550646023 0.007275060728249799 0.03816225433326508 -0.09554265522296002
ADV2:  0.022124544786647608 0.8377096787570737 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.1108   1.4540   6.9472  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0011   0.0005   0.0021   5.4889   2.1784   2.1397
Update Cnt = 1220    ET =   1117.1   Stats:  Mean, Std, Min, Max
r_f      |  -10.54   -0.48   -0.66 |  184.74  168.87  200.23 | -382.25 -367.41 -389.03 |  378.41  386.83  395.76
v_f      |   -0.00    0.00    0.00 |    0.04    0.04    0.05 |   -0.13   -0.09   -0.10 |    0.12    0.11    0.11
r_i      |  -12.64   -2.14  -41.45 |  700.65  635.16  759.48 |-1280.63-1360.03-1332.07 | 1303.41 1319.87 1291.97
v_i      |    0.00   -0.00    0.00 |    0.04    0.04    0.05 |   -0.10   -0.10   -0.10 |    0.09    0.09    0.10
norm_rf  |    0.26 |    0.11 |    0.04 |    0.67
norm_vf  |    0.08 |    0.02 |    0.04 |    0.13
gs_f     |    1.37 |    2.06 |  

Dynamics: Max Disturbance (m/s^2):  [0.00138293 0.00181235 0.00221757] 0.0031803638227355514
ADV1:  0.0018236754913149745 0.00957262240300396 0.06281485572230248 -0.05592145630053247
ADV2:  0.0005525874758827841 0.8888518321799068 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.4216   0.8276   4.1968  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0020   0.0012   0.0048   5.4889   2.1784   2.1397
***** Episode 38136, Mean R = -15.1  Std R = 4.5  Min R = -25.8
PolicyLoss: -0.0178
Policy_Beta: 0.1
Policy_Entropy: 0.141
Policy_KL: 0.000858
Policy_SD: 0.555
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 1.34e+07
VF_0_ExplainedVarNew: 0.956
VF_0_ExplainedVarOld: 0.954
VF_0_Loss : 0.00549


ADV1:  0.00013640782808346615 0.01001359581787697 0.05093882592655222 -0.08716375677541793
ADV2:  0.01569534196377626 0.8864269111018397 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.2714   0.7876   4.3033  24.0260  15.5251  10.0673
ValFun  

***** Episode 38384, Mean R = -14.7  Std R = 4.7  Min R = -31.5
PolicyLoss: -0.0329
Policy_Beta: 0.1
Policy_Entropy: 0.137
Policy_KL: 0.00102
Policy_SD: 0.553
Policy_lr_mult: 0.198
Steps: 1.18e+04
TotalSteps: 1.35e+07
VF_0_ExplainedVarNew: 0.966
VF_0_ExplainedVarOld: 0.961
VF_0_Loss : 0.00353


ADV1:  -0.000157368457803008 0.008870096447925163 0.05769443715557854 -0.059182125901860456
ADV2:  0.01674726895534657 0.8638649389560652 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.8643   0.9725   4.0636  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0002   0.0001   0.0005   5.4889   2.1784   2.1397
***** Episode 38415, Mean R = -16.8  Std R = 5.0  Min R = -30.0
PolicyLoss: -0.0192
Policy_Beta: 0.1
Policy_Entropy: 0.141
Policy_KL: 0.00072
Policy_SD: 0.559
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 1.35e+07
VF_0_ExplainedVarNew: 0.972
VF_0_ExplainedVarOld: 0.968
VF_0_Loss : 0.00403


ADV1:  -0.0011428383200478137 0.009898872661509487 0.06

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.9715   1.1383   5.7888  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0004   0.0003   0.0017   5.4889   2.1784   2.1397
***** Episode 38663, Mean R = -14.3  Std R = 5.1  Min R = -32.3
PolicyLoss: -0.0277
Policy_Beta: 0.1
Policy_Entropy: 0.141
Policy_KL: 0.00103
Policy_SD: 0.547
Policy_lr_mult: 0.198
Steps: 1.18e+04
TotalSteps: 1.36e+07
VF_0_ExplainedVarNew: 0.96
VF_0_ExplainedVarOld: 0.955
VF_0_Loss : 0.00728


ADV1:  -0.0009386458560317118 0.00965783059256799 0.06934950979911808 -0.07003866989300533
ADV2:  0.02917220005909458 0.8592964695884161 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.5576   0.9884   5.2604  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0012   0.0007   0.0025   5.4889   2.1784   2.1397
***** Episode 38694, Mean R = -15.8  Std R = 5.5  Min R = -26.8
PolicyLoss: -0.026
Policy_Beta: 0.1
Policy_Entropy: 0.14
Policy_KL: 0.000901
Policy

ADV1:  -0.00028468269362805194 0.00960199977125028 0.042163655757904095 -0.07967481255531311
ADV2:  0.023882069599667714 0.8734205884800302 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.7662   1.3286   7.5381  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0020   0.0011   0.0042   5.4889   2.1784   2.1397
***** Episode 38942, Mean R = -16.6  Std R = 6.1  Min R = -30.3
PolicyLoss: -0.0262
Policy_Beta: 0.1
Policy_Entropy: 0.138
Policy_KL: 0.000804
Policy_SD: 0.572
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 1.37e+07
VF_0_ExplainedVarNew: 0.968
VF_0_ExplainedVarOld: 0.965
VF_0_Loss : 0.00768


ADV1:  0.002888596461708544 0.006835121856040049 0.10155069811848938 -0.06654109105632372
ADV2:  -0.029843996535690503 0.8592521684923449 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.0932   0.8748   4.1249  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0030   0.0020   0.0076   5.4889   2.1784   2.

ADV1:  -0.001755112100733849 0.00968370899876015 0.0830392979010543 -0.08158323875178758
ADV2:  0.030221489582946043 0.8427701582182698 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.2032   0.7161   3.9536  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0018   0.0011   0.0046   5.4889   2.1784   2.1397
***** Episode 39221, Mean R = -15.8  Std R = 5.6  Min R = -26.2
PolicyLoss: -0.0211
Policy_Beta: 0.1
Policy_Entropy: 0.142
Policy_KL: 0.000977
Policy_SD: 0.567
Policy_lr_mult: 0.198
Steps: 1.15e+04
TotalSteps: 1.38e+07
VF_0_ExplainedVarNew: 0.968
VF_0_ExplainedVarOld: 0.962
VF_0_Loss : 0.00998


ADV1:  0.0004529064600099551 0.010342777718096092 0.06620956696304658 -0.06893791696632641
ADV2:  0.011599998162230202 0.8857393874434172 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.8726   1.4893   7.6547  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0007   0.0004   0.0015   5.4889   2.1784   2.1397

ADV1:  0.0006975515930954282 0.009031880167775785 0.07002214279785829 -0.06839671853421561
ADV2:  0.00549704026105005 0.8622044859871973 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.9165   1.9877   9.9667  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0014   0.0008   0.0031   5.4889   2.1784   2.1397
***** Episode 39500, Mean R = -15.0  Std R = 5.0  Min R = -26.7
PolicyLoss: -0.0146
Policy_Beta: 0.1
Policy_Entropy: 0.141
Policy_KL: 0.000661
Policy_SD: 0.559
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 1.39e+07
VF_0_ExplainedVarNew: 0.967
VF_0_ExplainedVarOld: 0.962
VF_0_Loss : 0.0163


ADV1:  0.000492825091450402 0.008606764652309747 0.03880972322704096 -0.07521003436976792
ADV2:  0.020399351479650794 0.8526988017035062 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.7547   0.7045   3.3785  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0012   0.0006   0.0023   5.4889   2.1784   2.1397


ADV1:  -0.0001441605372768524 0.009083571753191605 0.05768276430194125 -0.0854066157341003
ADV2:  0.020179139760453796 0.8655737917034557 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.0847   0.9409   4.2034  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0006   0.0004   0.0014   5.4889   2.1784   2.1397
***** Episode 39779, Mean R = -14.6  Std R = 5.0  Min R = -29.2
PolicyLoss: -0.0233
Policy_Beta: 0.1
Policy_Entropy: 0.146
Policy_KL: 0.00092
Policy_SD: 0.538
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 1.4e+07
VF_0_ExplainedVarNew: 0.962
VF_0_ExplainedVarOld: 0.957
VF_0_Loss : 0.0172


ADV1:  -0.0008975881312643073 0.010473803773450651 0.0432838732587974 -0.07687757568587705
ADV2:  0.027585996110474492 0.8655842793538018 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.4578   1.6743   6.7641  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0012   0.0007   0.0026   5.4889   2.1784   2.1397


ADV1:  0.0018020136827838016 0.007731090831353366 0.05850318595921583 -0.0964545885126521
ADV2:  0.005296539746148485 0.8144674270152303 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.4732   0.5817   3.4017  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0014   0.0010   0.0048   5.4889   2.1784   2.1397
***** Episode 40058, Mean R = -16.4  Std R = 6.4  Min R = -37.0
PolicyLoss: -0.024
Policy_Beta: 0.1
Policy_Entropy: 0.145
Policy_KL: 0.000977
Policy_SD: 0.557
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 1.41e+07
VF_0_ExplainedVarNew: 0.986
VF_0_ExplainedVarOld: 0.981
VF_0_Loss : 0.0146


ADV1:  -0.0025395602074690313 0.008754790862487972 0.06311718225067459 -0.06874956479959046
ADV2:  0.039185464670540154 0.8388217383718559 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.2299   1.2169   6.7719  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0031   0.0019   0.0067   5.4889   2.1784   2.1397

seeker_angles |    0.00    0.00 |    0.08    0.09 |   -1.00   -1.00 |    0.98    0.99
cs_angles |  0.0049  0.0029 |  0.0808  0.0856 | -0.9957 -0.9959 |  0.9791  0.9902
optical_flow | -0.0000 -0.0001 |  0.0279  0.0262 | -1.0635 -1.1212 |  1.2584  1.1424
v_err    | -0.0098 |  0.0587 | -0.4878 |  0.1125
landing_rewards |    9.29 |    2.57 |    0.00 |   10.00
landing_margin |   -0.02 |    0.02 |   -0.06 |    0.03
tracking_rewards |  -19.84 |    4.43 |  -41.00 |  -10.91
steps    |     376 |      21 |     331 |     417
***** Episode 40337, Mean R = -15.1  Std R = 5.7  Min R = -33.4
PolicyLoss: -0.012
Policy_Beta: 0.1
Policy_Entropy: 0.145
Policy_KL: 0.00091
Policy_SD: 0.549
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 1.42e+07
VF_0_ExplainedVarNew: 0.944
VF_0_ExplainedVarOld: 0.941
VF_0_Loss : 0.0218


ADV1:  0.0024846911615900363 0.010084646382399707 0.05059975562129665 -0.05814612907592276
ADV2:  -0.0003313994383667352 0.8776350150223388 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max 

attitude |   -0.03    0.01    0.06 |    1.15    0.66    1.79 |   -3.14   -1.56   -3.14 |    3.14    1.57    3.14
w        |    0.00    0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.02    0.01 |    0.65    1.77 |   -1.39   -3.13 |    1.51    3.14
w_f      |   -0.00    0.00    0.00 |    0.02    0.01    0.01 |   -0.05   -0.02   -0.03 |    0.04    0.02    0.02
w_rewards |   -0.00 |    0.00 |   -0.04 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.25 |    0.24 |    0.00 |    1.58
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -1.00   -1.00 |    0.99    1.00
cs_angles |  0.0039  0.0026 |  0.0798  0.0804 | -0.9954 -0.9983 |  0.9898  0.9977
optical_flow | -0.0000 -0.0001 |  0.0275  0.0260 | -1.1196 -1.4415 |  1.3104  0.9234
v_err    | -0.0099 |  0.0585 | -0.4533 |  0.1086
landing_rewards |    9.39 |    2.40 |    0.00 |   10.00
landing_margin |   -0

glideslope |    2.89 |   13.43 |    0.01 | 1391.24
norm_af  |    1.74 |    0.91 |    0.10 |    3.38
norm_wf  |    0.02 |    0.01 |    0.00 |    0.05
rh_penalty |    0.00 |    0.00 |    0.00 |    0.00
att_rewards |    0.00 |    0.00 |    0.00 |    0.00
att_penalty |    0.00 |    0.00 |    0.00 |    0.00
attitude |    0.08   -0.03   -0.12 |    1.14    0.64    1.84 |   -3.14   -1.57   -3.14 |    3.14    1.56    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.02   -0.01 |    0.64    1.86 |   -1.49   -3.09 |    1.45    3.13
w_f      |   -0.00    0.00    0.00 |    0.02    0.01    0.01 |   -0.05   -0.03   -0.03 |    0.05    0.03    0.02
w_rewards |   -0.00 |    0.00 |   -0.00 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.26 |    0.26 |    0.00 |    1.48
seeker_angles |    0.01    0.01 |    0.08    0.09 |   -0.98   -0.99 |    1.

attitude |    0.06    0.07    0.07 |    1.24    0.66    1.82 |   -3.14   -1.56   -3.14 |    3.14    1.57    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.07    0.03 |    0.66    1.82 |   -1.40   -3.13 |    1.54    3.14
w_f      |   -0.00    0.00    0.00 |    0.02    0.01    0.01 |   -0.04   -0.02   -0.02 |    0.04    0.02    0.03
w_rewards |   -0.00 |    0.00 |   -0.02 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.26 |    0.25 |    0.00 |    1.46
seeker_angles |    0.00    0.01 |    0.08    0.08 |   -0.99   -1.00 |    0.98    1.00
cs_angles |  0.0039  0.0054 |  0.0802  0.0821 | -0.9918 -0.9986 |  0.9846  0.9982
optical_flow |  0.0000  0.0000 |  0.0271  0.0263 | -1.1227 -1.2011 |  1.1330  1.3361
v_err    | -0.0097 |  0.0589 | -0.4522 |  0.1328
landing_rewards |    9.23 |    2.67 |    0.00 |   10.00
landing_margin |   -0

attitude |    0.08    0.02   -0.03 |    1.09    0.64    1.80 |   -3.14   -1.54   -3.14 |    3.14    1.57    3.14
w        |    0.00    0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.03   -0.05 |    0.64    1.79 |   -1.45   -3.14 |    1.56    3.12
w_f      |   -0.00    0.00    0.00 |    0.02    0.01    0.01 |   -0.04   -0.03   -0.03 |    0.04    0.03    0.03
w_rewards |   -0.00 |    0.00 |   -0.01 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.26 |    0.25 |    0.00 |    1.40
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -1.00   -1.00 |    0.99    1.00
cs_angles |  0.0027  0.0043 |  0.0840  0.0820 | -0.9965 -0.9960 |  0.9863  0.9990
optical_flow |  0.0001 -0.0001 |  0.0270  0.0257 | -1.1739 -1.0493 |  1.1988  1.1871
v_err    | -0.0097 |  0.0587 | -0.4949 |  0.1343
landing_rewards |    9.29 |    2.57 |    0.00 |   10.00
landing_margin |   -0

w        |   -0.00    0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.04   -0.09 |    0.68    1.90 |   -1.50   -3.14 |    1.48    3.14
w_f      |   -0.00    0.00    0.00 |    0.02    0.01    0.01 |   -0.05   -0.02   -0.03 |    0.05    0.03    0.02
w_rewards |   -0.00 |    0.00 |   -0.02 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.25 |    0.24 |    0.00 |    1.49
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -0.97   -1.00 |    1.00    0.98
cs_angles |  0.0042  0.0018 |  0.0781  0.0815 | -0.9713 -0.9961 |  0.9978  0.9775
optical_flow | -0.0000  0.0000 |  0.0282  0.0258 | -1.3105 -1.1256 |  1.3835  1.2651
v_err    | -0.0098 |  0.0583 | -0.4527 |  0.1249
landing_rewards |    9.35 |    2.46 |    0.00 |   10.00
landing_margin |   -0.03 |    0.02 |   -0.06 |    0.03
tracking_rewards |  -19.08 |    4.28 |  -34.53 |  -10.61
steps    |     377 |  

w        |   -0.00    0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.08    0.00 |    0.68    1.84 |   -1.51   -3.14 |    1.50    3.11
w_f      |   -0.00    0.00    0.00 |    0.02    0.01    0.01 |   -0.04   -0.02   -0.03 |    0.03    0.02    0.02
w_rewards |    0.00 |    0.00 |    0.00 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.26 |    0.25 |    0.00 |    1.51
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -1.00   -0.99 |    1.00    1.00
cs_angles |  0.0020  0.0037 |  0.0828  0.0841 | -0.9989 -0.9944 |  0.9986  0.9975
optical_flow |  0.0001  0.0002 |  0.0273  0.0257 | -1.1193 -1.1471 |  1.5757  1.3157
v_err    | -0.0103 |  0.0582 | -0.4557 |  0.1219
landing_rewards |    9.16 |    2.77 |    0.00 |   10.00
landing_margin |   -0.02 |    0.02 |   -0.06 |    0.04
tracking_rewards |  -19.96 |    5.31 |  -71.72 |  -11.61
steps    |     378 |  

attitude |   -0.04   -0.01   -0.07 |    1.20    0.68    1.86 |   -3.14   -1.53   -3.14 |    3.14    1.57    3.14
w        |    0.00    0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.00   -0.14 |    0.68    1.85 |   -1.43   -3.12 |    1.51    3.12
w_f      |   -0.00    0.00    0.00 |    0.02    0.01    0.01 |   -0.04   -0.03   -0.03 |    0.04    0.03    0.03
w_rewards |   -0.00 |    0.00 |   -0.02 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.27 |    0.26 |    0.00 |    1.46
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -0.94   -0.99 |    0.98    0.99
cs_angles |  0.0015  0.0027 |  0.0850  0.0846 | -0.9415 -0.9864 |  0.9792  0.9889
optical_flow |  0.0000 -0.0000 |  0.0255  0.0236 | -1.2453 -1.1520 |  0.9309  1.1037
v_err    | -0.0097 |  0.0581 | -0.4528 |  0.1233
landing_rewards |    9.39 |    2.40 |    0.00 |   10.00
landing_margin |   -0

attitude |   -0.05   -0.04   -0.01 |    1.11    0.64    1.84 |   -3.14   -1.56   -3.14 |    3.14    1.57    3.14
w        |    0.00    0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.04   -0.10 |    0.65    1.84 |   -1.54   -3.14 |    1.52    3.14
w_f      |   -0.00    0.00   -0.00 |    0.02    0.01    0.01 |   -0.05   -0.02   -0.03 |    0.05    0.03    0.03
w_rewards |   -0.00 |    0.00 |   -0.01 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.26 |    0.25 |    0.00 |    1.55
seeker_angles |    0.00    0.00 |    0.08    0.09 |   -0.99   -0.99 |    1.00    0.97
cs_angles |  0.0029  0.0008 |  0.0806  0.0850 | -0.9873 -0.9922 |  0.9992  0.9694
optical_flow | -0.0001 -0.0000 |  0.0265  0.0265 | -1.0774 -1.2157 |  1.1213  1.1754
v_err    | -0.0099 |  0.0585 | -0.4955 |  0.1067
landing_rewards |    9.42 |    2.34 |    0.00 |   10.00
landing_margin |   -0

thrust   |   -0.00    0.00   -0.00 |    0.68    0.69    0.68 |   -3.45   -3.34   -3.43 |    3.39    3.38    3.35
norm_thrust |    0.91 |    0.75 |    0.00 |    3.46
fuel     |    1.59 |    0.20 |    1.08 |    2.29
rewards  |  -14.45 |    5.61 |  -35.84 |   -5.05
fuel_rewards |   -4.56 |    0.57 |   -6.56 |   -3.08
glideslope_rewards |    0.00 |    0.00 |    0.00 |    0.00
glideslope_penalty |    0.00 |    0.00 |    0.00 |    0.00
glideslope |    2.82 |   12.84 |    0.01 |  463.81
norm_af  |    1.74 |    0.91 |    0.03 |    3.36
norm_wf  |    0.02 |    0.01 |    0.00 |    0.05
rh_penalty |    0.00 |    0.00 |    0.00 |    0.00
att_rewards |    0.00 |    0.00 |    0.00 |    0.00
att_penalty |    0.00 |    0.00 |    0.00 |    0.00
attitude |   -0.11   -0.03   -0.08 |    1.21    0.69    1.85 |   -3.14   -1.51   -3.14 |    3.14    1.56    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.03   -0.02 |    0.68

ADV1:  -0.0006253646602384243 0.008848610445945187 0.04572998650374396 -0.04729670652466872
ADV2:  0.01901708640216508 0.8823950029475365 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.6020   1.1134   5.9187  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0008   0.0005   0.0017   5.4889   2.1784   2.1397
Update Cnt = 1400    ET =   1018.2   Stats:  Mean, Std, Min, Max
r_f      |    8.22   -4.24   14.57 |  179.35  170.16  205.38 | -381.29 -381.71 -374.64 |  380.71  371.51  394.59
v_f      |   -0.00    0.00   -0.00 |    0.04    0.04    0.05 |   -0.12   -0.10   -0.10 |    0.09    0.12    0.10
r_i      |   60.17  -34.61   42.68 |  659.26  658.54  782.55 |-1289.88-1316.68-1307.30 | 1290.40 1322.22 1377.37
v_i      |   -0.00    0.00   -0.00 |    0.04    0.04    0.05 |   -0.09   -0.09   -0.10 |    0.10    0.10    0.09
norm_rf  |    0.25 |    0.10 |    0.02 |    0.58
norm_vf  |    0.07 |    0.02 |    0.04 |    0.14
gs_f     |    1.66 |    4.88 |  

ADV1:  -0.0014899586793537232 0.011121243670277286 0.03651313821964974 -0.13324374561391517
ADV2:  0.029111210163485404 0.8706697279473115 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.9284   0.8692   4.6096  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0023   0.0012   0.0045   5.4889   2.1784   2.1397
***** Episode 43716, Mean R = -16.4  Std R = 6.2  Min R = -31.6
PolicyLoss: -0.0231
Policy_Beta: 0.1
Policy_Entropy: 0.145
Policy_KL: 0.000701
Policy_SD: 0.571
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 1.55e+07
VF_0_ExplainedVarNew: 0.961
VF_0_ExplainedVarOld: 0.951
VF_0_Loss : 0.00289


ADV1:  0.001018779799200912 0.00916018780775402 0.08166565755228389 -0.06553606341083906
ADV2:  0.0061907506198043616 0.8637769043143767 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.2754   0.6207   3.6082  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0020   0.0009   0.0035   5.4889   2.1784   2.13

ADV1:  -0.0018752614680548159 0.01050098082672836 0.040031647268744974 -0.05985593816154793
ADV2:  0.028869773809764823 0.8981559052254315 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.8923   1.3598   6.6563  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0025   0.0015   0.0050   5.4889   2.1784   2.1397
***** Episode 43995, Mean R = -16.2  Std R = 7.1  Min R = -34.8
PolicyLoss: -0.0205
Policy_Beta: 0.1
Policy_Entropy: 0.145
Policy_KL: 0.000765
Policy_SD: 0.568
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 1.56e+07
VF_0_ExplainedVarNew: 0.959
VF_0_ExplainedVarOld: 0.956
VF_0_Loss : 0.0107


ADV1:  0.0020584877945230857 0.011218164375316628 0.06026038703037767 -0.07623354509498517
ADV2:  0.0008660420664621479 0.892733821398318 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.6384   1.6295   8.7308  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0029   0.0017   0.0061   5.4889   2.1784   2.13

ADV1:  0.000862023813311732 0.006867780555439219 0.049562966922240353 -0.04592383093590341
ADV2:  0.0012885919158202132 0.8678486221509125 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.0854   0.4807   2.3630  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0011   0.0007   0.0023   5.4889   2.1784   2.1397
***** Episode 44274, Mean R = -11.6  Std R = 3.4  Min R = -19.4
PolicyLoss: -0.0151
Policy_Beta: 0.1
Policy_Entropy: 0.147
Policy_KL: 0.00105
Policy_SD: 0.539
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 1.57e+07
VF_0_ExplainedVarNew: 0.972
VF_0_ExplainedVarOld: 0.968
VF_0_Loss : 0.00442


ADV1:  -0.0009153461023660465 0.008361049827329967 0.04682088037331903 -0.05801019236151832
ADV2:  0.033513591182438573 0.8460148213886709 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.2896   1.2225   6.9235  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0010   0.0006   0.0024   5.4889   2.1784   2.1

ADV1:  -0.0025494630145049208 0.009881097135738651 0.06323913656042568 -0.09026285946369167
ADV2:  0.034284870771651745 0.8875206053706152 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.2875   2.2988   8.6196  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0031   0.0019   0.0067   5.4889   2.1784   2.1397
***** Episode 44553, Mean R = -13.9  Std R = 5.5  Min R = -28.6
PolicyLoss: -0.0211
Policy_Beta: 0.1
Policy_Entropy: 0.145
Policy_KL: 0.000871
Policy_SD: 0.545
Policy_lr_mult: 0.198
Steps: 1.18e+04
TotalSteps: 1.58e+07
VF_0_ExplainedVarNew: 0.953
VF_0_ExplainedVarOld: 0.949
VF_0_Loss : 0.015


ADV1:  0.002696618301872155 0.008586430690445465 0.05603149564919413 -0.07414518754292476
ADV2:  -0.013911025778253231 0.8754441142400988 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.2660   0.7784   3.8953  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0031   0.0020   0.0071   5.4889   2.1784   2.139

ADV1:  0.0009522333953130025 0.007162483821148243 0.04202063516857463 -0.07393198843694332
ADV2:  0.003890879250083467 0.8870521999171971 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.7381   0.9147   5.2044  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0010   0.0006   0.0025   5.4889   2.1784   2.1397
***** Episode 44832, Mean R = -11.7  Std R = 3.5  Min R = -18.3
PolicyLoss: -0.0172
Policy_Beta: 0.1
Policy_Entropy: 0.146
Policy_KL: 0.000805
Policy_SD: 0.549
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 1.59e+07
VF_0_ExplainedVarNew: 0.971
VF_0_ExplainedVarOld: 0.966
VF_0_Loss : 0.0364


ADV1:  -0.0010110242237167321 0.007704953732900821 0.061092321843764286 -0.07133577083835307
ADV2:  0.02249467601490542 0.8660734588609907 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.5214   0.7994   3.7827  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0011   0.0007   0.0026   5.4889   2.1784   2.13

ADV1:  0.0013314746441849485 0.009792340256573308 0.052948328499176744 -0.0692924307639104
ADV2:  0.0008638038330647446 0.9222468928939606 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.6986   1.7744   8.1925  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0018   0.0010   0.0038   5.4889   2.1784   2.1397
***** Episode 45111, Mean R = -15.6  Std R = 6.0  Min R = -31.1
PolicyLoss: -0.013
Policy_Beta: 0.1
Policy_Entropy: 0.148
Policy_KL: 0.000857
Policy_SD: 0.555
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 1.6e+07
VF_0_ExplainedVarNew: 0.964
VF_0_ExplainedVarOld: 0.962
VF_0_Loss : 0.00383


ADV1:  0.0015753511174372366 0.007170365104813597 0.03497424043294768 -0.06382422940139831
ADV2:  -0.0003359082373753341 0.8942434873837183 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   3.8343   2.7408  10.1317  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0021   0.0013   0.0042   5.4889   2.1784   2.1

ADV1:  0.0008461912967046233 0.007272827573774485 0.044193417266345514 -0.05729340707069726
ADV2:  0.01607552337137664 0.8318403946551487 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.2003   0.8373   4.4461  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0009   0.0005   0.0022   5.4889   2.1784   2.1397
***** Episode 45390, Mean R = -12.6  Std R = 3.9  Min R = -22.0
PolicyLoss: -0.0277
Policy_Beta: 0.1
Policy_Entropy: 0.149
Policy_KL: 0.000903
Policy_SD: 0.534
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 1.61e+07
VF_0_ExplainedVarNew: 0.975
VF_0_ExplainedVarOld: 0.972
VF_0_Loss : 0.012


ADV1:  -0.0020811616804785674 0.009038496319284906 0.04173061350612006 -0.08583150034049891
ADV2:  0.034654941937663115 0.8883540514376017 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.0531   0.5405   2.5571  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0026   0.0015   0.0054   5.4889   2.1784   2.139

ADV1:  0.002901727127879418 0.006217464072398147 0.049232218511469306 -0.0459883180404552
ADV2:  -0.024789986586946013 0.9118326798658594 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.6208   1.8054   7.5226  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0037   0.0022   0.0076   5.4889   2.1784   2.1397
***** Episode 45669, Mean R = -13.7  Std R = 4.7  Min R = -22.7
PolicyLoss: -0.00685
Policy_Beta: 0.1
Policy_Entropy: 0.15
Policy_KL: 0.0012
Policy_SD: 0.542
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 1.63e+07
VF_0_ExplainedVarNew: 0.987
VF_0_ExplainedVarOld: 0.984
VF_0_Loss : 0.00538


ADV1:  -0.002123873409225637 0.007741835131208021 0.029943695465047437 -0.06251062452379995
ADV2:  0.041159016913264276 0.8603608356611376 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.8680   1.1024   5.6764  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0023   0.0014   0.0055   5.4889   2.1784   2.139

ADV1:  0.0005392710131326737 0.009192640638068792 0.047937726089147426 -0.06650485951424734
ADV2:  0.017071023844485687 0.8613540822411699 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.7347   0.8996   4.9643  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0008   0.0004   0.0017   5.4889   2.1784   2.1397
***** Episode 45948, Mean R = -14.6  Std R = 5.1  Min R = -25.6
PolicyLoss: -0.0253
Policy_Beta: 0.1
Policy_Entropy: 0.151
Policy_KL: 0.00122
Policy_SD: 0.54
Policy_lr_mult: 0.198
Steps: 1.15e+04
TotalSteps: 1.64e+07
VF_0_ExplainedVarNew: 0.968
VF_0_ExplainedVarOld: 0.964
VF_0_Loss : 0.00398


ADV1:  -0.001816754923893284 0.009915390507696185 0.06679102715294005 -0.056505969730469605
ADV2:  0.02663534035642399 0.9048453171204273 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.1226   0.6778   3.7568  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0020   0.0013   0.0047   5.4889   2.1784   2.139

cs_angles |  0.0040  0.0016 |  0.0809  0.0838 | -0.9899 -0.9911 |  0.9974  0.9777
optical_flow |  0.0000  0.0001 |  0.0269  0.0260 | -1.2338 -1.0278 |  1.3416  1.2008
v_err    | -0.0100 |  0.0582 | -0.4531 |  0.1137
landing_rewards |    9.45 |    2.28 |    0.00 |   10.00
landing_margin |   -0.03 |    0.02 |   -0.06 |    0.02
tracking_rewards |  -19.10 |    4.14 |  -33.15 |  -11.00
steps    |     377 |      20 |     334 |     420
***** Episode 46227, Mean R = -13.6  Std R = 4.6  Min R = -24.4
PolicyLoss: -0.000119
Policy_Beta: 0.1
Policy_Entropy: 0.152
Policy_KL: 0.000894
Policy_SD: 0.541
Policy_lr_mult: 0.198
Steps: 1.18e+04
TotalSteps: 1.65e+07
VF_0_ExplainedVarNew: 0.985
VF_0_ExplainedVarOld: 0.981
VF_0_Loss : 0.00615


ADV1:  -0.0027523099832763615 0.007833736141574857 0.056984673202902625 -0.06613946956002595
ADV2:  0.04800321749474754 0.8453269667597346 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.2169   1.1146   5.7238  24.0260  15.5251  10.0673
ValFun  Gradients

theta_cv |    0.25 |    0.25 |    0.00 |    1.45
seeker_angles |    0.01   -0.00 |    0.08    0.09 |   -0.98   -0.99 |    1.00    0.98
cs_angles |  0.0067 -0.0006 |  0.0791  0.0866 | -0.9790 -0.9908 |  0.9996  0.9831
optical_flow |  0.0001 -0.0000 |  0.0263  0.0269 | -1.1006 -1.2214 |  1.0000  1.2317
v_err    | -0.0099 |  0.0586 | -0.4529 |  0.1096
landing_rewards |    9.42 |    2.34 |    0.00 |   10.00
landing_margin |   -0.02 |    0.02 |   -0.06 |    0.03
tracking_rewards |  -19.08 |    5.85 |  -87.74 |  -11.24
steps    |     377 |      21 |     330 |     418
***** Episode 46537, Mean R = -13.8  Std R = 3.6  Min R = -23.1
PolicyLoss: -0.0167
Policy_Beta: 0.1
Policy_Entropy: 0.151
Policy_KL: 0.000935
Policy_SD: 0.534
Policy_lr_mult: 0.198
Steps: 1.18e+04
TotalSteps: 1.66e+07
VF_0_ExplainedVarNew: 0.974
VF_0_ExplainedVarOld: 0.967
VF_0_Loss : 0.0438


ADV1:  -0.00022076644336457935 0.007901322987903527 0.045638785759607996 -0.09761204564931336
ADV2:  0.024755982749630142 0.808200246072

attitude |   -0.01    0.03   -0.04 |    1.18    0.64    1.86 |   -3.14   -1.54   -3.14 |    3.14    1.55    3.14
w        |   -0.00    0.00   -0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.03   -0.01 |    0.64    1.86 |   -1.47   -3.14 |    1.50    3.14
w_f      |   -0.00    0.00    0.00 |    0.02    0.01    0.01 |   -0.05   -0.02   -0.03 |    0.04    0.02    0.02
w_rewards |    0.00 |    0.00 |    0.00 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.24 |    0.24 |    0.00 |    1.48
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -0.98   -0.99 |    0.99    0.99
cs_angles |  0.0049  0.0029 |  0.0755  0.0800 | -0.9761 -0.9884 |  0.9882  0.9881
optical_flow |  0.0000  0.0002 |  0.0259  0.0249 | -1.3829 -1.1303 |  1.2015  1.0089
v_err    | -0.0101 |  0.0585 | -0.4523 |  0.1097
landing_rewards |    9.42 |    2.34 |    0.00 |   10.00
landing_margin |   -0

attitude |    0.01   -0.00   -0.12 |    1.15    0.66    1.80 |   -3.14   -1.56   -3.14 |    3.14    1.57    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.01   -0.10 |    0.66    1.82 |   -1.47   -3.14 |    1.54    3.14
w_f      |   -0.00    0.00    0.00 |    0.02    0.01    0.01 |   -0.05   -0.02   -0.03 |    0.04    0.02    0.02
w_rewards |   -0.00 |    0.00 |   -0.01 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.25 |    0.25 |    0.00 |    1.47
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -0.99   -1.00 |    1.00    0.99
cs_angles |  0.0020  0.0022 |  0.0798  0.0809 | -0.9859 -0.9964 |  0.9968  0.9935
optical_flow |  0.0001  0.0001 |  0.0255  0.0240 | -1.0486 -1.2584 |  1.1544  1.1385
v_err    | -0.0105 |  0.0586 | -0.4526 |  0.1074
landing_rewards |    9.32 |    2.51 |    0.00 |   10.00
landing_margin |   -0

thrust   |    0.00   -0.00   -0.00 |    0.66    0.67    0.68 |   -3.41   -3.31   -3.42 |    3.45    3.36    3.34
norm_thrust |    0.89 |    0.75 |    0.00 |    3.46
fuel     |    1.57 |    0.17 |    1.20 |    2.08
rewards  |  -13.22 |    5.11 |  -31.80 |   -5.20
fuel_rewards |   -4.49 |    0.50 |   -5.95 |   -3.44
glideslope_rewards |    0.00 |    0.00 |    0.00 |    0.00
glideslope_penalty |    0.00 |    0.00 |    0.00 |    0.00
glideslope |    2.92 |   12.82 |    0.01 |  292.54
norm_af  |    1.77 |    0.90 |    0.12 |    3.33
norm_wf  |    0.02 |    0.01 |    0.00 |    0.05
rh_penalty |    0.00 |    0.00 |    0.00 |    0.00
att_rewards |    0.00 |    0.00 |    0.00 |    0.00
att_penalty |    0.00 |    0.00 |    0.00 |    0.00
attitude |   -0.09    0.01   -0.05 |    1.31    0.67    1.89 |   -3.14   -1.53   -3.14 |    3.14    1.54    3.14
w        |   -0.00    0.00   -0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.03   -0.03 |    0.67

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.1872   0.5717   2.7782  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0011   0.0006   0.0025   5.4889   2.1784   2.1397
Update Cnt = 1540    ET =    951.0   Stats:  Mean, Std, Min, Max
r_f      |  -11.86   -4.03  -25.75 |  190.50  174.12  191.83 | -380.21 -366.05 -392.21 |  392.09  389.56  375.66
v_f      |   -0.00    0.00    0.01 |    0.04    0.04    0.05 |   -0.09   -0.09   -0.10 |    0.09    0.09    0.10
r_i      |  -44.87  -18.63  -99.13 |  689.11  669.66  744.72 |-1335.42-1279.53-1286.79 | 1340.54 1297.77 1362.98
v_i      |    0.00    0.00    0.01 |    0.04    0.04    0.05 |   -0.09   -0.09   -0.09 |    0.10    0.09    0.10
norm_rf  |    0.24 |    0.09 |    0.02 |    0.51
norm_vf  |    0.07 |    0.02 |    0.04 |    0.12
gs_f     |    1.26 |    1.94 |    0.01 |   15.95
thrust   |    0.00   -0.00   -0.00 |    0.68    0.69    0.68 |   -3.45   -3.35   -3.45 |    3.44    3.46    3.44
norm_thrust |    

ADV1:  -0.00023888215538795518 0.009403808972993281 0.05318932500411733 -0.05329943333078298
ADV2:  0.01595690102468684 0.9013398348445969 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.4645   1.2352   5.2045  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0003   0.0002   0.0009   5.4889   2.1784   2.1397
***** Episode 48056, Mean R = -13.7  Std R = 5.5  Min R = -29.5
PolicyLoss: -0.0184
Policy_Beta: 0.1
Policy_Entropy: 0.153
Policy_KL: 0.00107
Policy_SD: 0.527
Policy_lr_mult: 0.198
Steps: 1.19e+04
TotalSteps: 1.72e+07
VF_0_ExplainedVarNew: 0.96
VF_0_ExplainedVarOld: 0.956
VF_0_Loss : 0.00431


ADV1:  0.0005801193839712266 0.00665356126115698 0.03905030991491887 -0.04988696167495721
ADV2:  0.008464458670604635 0.8765221780661279 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.7411   0.7174   3.3211  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0007   0.0004   0.0015   5.4889   2.1784   2.1397

ADV1:  -0.0011134150360188415 0.005924516668661715 0.040038607703134665 -0.08085676734240621
ADV2:  0.025398851102436715 0.8363320245887546 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.5352   0.7668   3.9468  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0013   0.0007   0.0029   5.4889   2.1784   2.1397
***** Episode 48335, Mean R = -13.1  Std R = 3.5  Min R = -21.4
PolicyLoss: -0.0136
Policy_Beta: 0.1
Policy_Entropy: 0.15
Policy_KL: 0.000848
Policy_SD: 0.556
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 1.73e+07
VF_0_ExplainedVarNew: 0.986
VF_0_ExplainedVarOld: 0.983
VF_0_Loss : 0.00302


ADV1:  -0.0010330012792058852 0.008109293391012394 0.0622198211103836 -0.06308211502809992
ADV2:  0.03215691375487126 0.8314226138164567 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.2781   1.2521   6.8048  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0011   0.0007   0.0027   5.4889   2.1784   2.13

ADV1:  0.0006515743510084657 0.009404018236694414 0.06793203481514543 -0.134448435605644
ADV2:  0.019263070900347287 0.8193879613286174 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.1744   0.8939   4.5102  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0008   0.0005   0.0018   5.4889   2.1784   2.1397
***** Episode 48614, Mean R = -15.9  Std R = 6.8  Min R = -38.6
PolicyLoss: -0.0297
Policy_Beta: 0.1
Policy_Entropy: 0.153
Policy_KL: 0.00104
Policy_SD: 0.554
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 1.74e+07
VF_0_ExplainedVarNew: 0.976
VF_0_ExplainedVarOld: 0.969
VF_0_Loss : 0.001


ADV1:  0.0005560087765421352 0.009413813618347757 0.050386930984237355 -0.06380259579510683
ADV2:  0.01667824373655379 0.8663822849667732 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.2266   0.6300   3.2939  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0011   0.0006   0.0021   5.4889   2.1784   2.1397
**

ADV1:  -0.0016809855331998253 0.008616494020830775 0.0760177530898466 -0.0668577893850833
ADV2:  0.04139988271937682 0.8374563805740338 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.1416   1.1491   5.6518  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0022   0.0013   0.0044   5.4889   2.1784   2.1397
***** Episode 48893, Mean R = -14.3  Std R = 4.8  Min R = -27.7
PolicyLoss: -0.0308
Policy_Beta: 0.1
Policy_Entropy: 0.152
Policy_KL: 0.000683
Policy_SD: 0.561
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 1.75e+07
VF_0_ExplainedVarNew: 0.97
VF_0_ExplainedVarOld: 0.967
VF_0_Loss : 7.45e-05


ADV1:  9.630815723195428e-05 0.008532716344386425 0.05108981345058111 -0.10283658949211932
ADV2:  0.02145622231158755 0.82219975348581 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.5382   1.4036   7.5736  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0002   0.0001   0.0006   5.4889   2.1784   2.1397
**

ADV1:  0.0010652089158382366 0.009266632551151443 0.0573211936570925 -0.05938529737405718
ADV2:  0.010851914351642023 0.8576287207728662 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.9023   0.3626   1.6375  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0014   0.0009   0.0033   5.4889   2.1784   2.1397
***** Episode 49172, Mean R = -14.2  Std R = 7.3  Min R = -31.9
PolicyLoss: -0.0247
Policy_Beta: 0.1
Policy_Entropy: 0.152
Policy_KL: 0.000785
Policy_SD: 0.555
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 1.76e+07
VF_0_ExplainedVarNew: 0.969
VF_0_ExplainedVarOld: 0.965
VF_0_Loss : 0.000739


ADV1:  -0.002550564152123404 0.009240272998546389 0.044723331638714725 -0.06682504625102208
ADV2:  0.03955411356266275 0.8683694216996233 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.6031   0.8775   4.9367  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0032   0.0019   0.0068   5.4889   2.1784   2.13

***** Episode 49420, Mean R = -14.6  Std R = 5.5  Min R = -31.7
PolicyLoss: -0.0225
Policy_Beta: 0.1
Policy_Entropy: 0.154
Policy_KL: 0.00103
Policy_SD: 0.547
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 1.77e+07
VF_0_ExplainedVarNew: 0.978
VF_0_ExplainedVarOld: 0.975
VF_0_Loss : 0.00152


ADV1:  -0.0018210950906355906 0.00879317267952064 0.051655480006340015 -0.05621948080110234
ADV2:  0.0301939534448292 0.8601066258207177 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.1206   0.8615   4.0118  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0020   0.0013   0.0047   5.4889   2.1784   2.1397
***** Episode 49451, Mean R = -14.3  Std R = 6.6  Min R = -33.0
PolicyLoss: -0.0208
Policy_Beta: 0.1
Policy_Entropy: 0.153
Policy_KL: 0.00118
Policy_SD: 0.54
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 1.77e+07
VF_0_ExplainedVarNew: 0.973
VF_0_ExplainedVarOld: 0.968
VF_0_Loss : 0.00164


ADV1:  0.0028496154836451892 0.007981942829773832 0.11125

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.9498   0.5512   2.3333  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0014   0.0008   0.0033   5.4889   2.1784   2.1397
***** Episode 49699, Mean R = -13.1  Std R = 4.4  Min R = -22.7
PolicyLoss: -0.0262
Policy_Beta: 0.1
Policy_Entropy: 0.157
Policy_KL: 0.000767
Policy_SD: 0.531
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 1.78e+07
VF_0_ExplainedVarNew: 0.977
VF_0_ExplainedVarOld: 0.974
VF_0_Loss : 0.00158


ADV1:  -0.0003022265553297265 0.007521606272586718 0.06763777221386191 -0.06092045299639405
ADV2:  0.008827794760032821 0.8335565540090993 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.9476   0.8249   3.4624  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0005   0.0003   0.0010   5.4889   2.1784   2.1397
***** Episode 49730, Mean R = -14.5  Std R = 5.2  Min R = -33.8
PolicyLoss: -0.00931
Policy_Beta: 0.1
Policy_Entropy: 0.153
Policy_KL: 0.00075


ADV1:  -0.0011632676942056994 0.008967642138149646 0.07592907264989884 -0.09010128634071182
ADV2:  0.012797287203314349 0.8767846106347508 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.1197   0.7906   4.2878  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0015   0.0009   0.0036   5.4889   2.1784   2.1397
***** Episode 49978, Mean R = -13.8  Std R = 5.1  Min R = -24.9
PolicyLoss: -0.00667
Policy_Beta: 0.1
Policy_Entropy: 0.155
Policy_KL: 0.000757
Policy_SD: 0.543
Policy_lr_mult: 0.198
Steps: 1.18e+04
TotalSteps: 1.79e+07
VF_0_ExplainedVarNew: 0.972
VF_0_ExplainedVarOld: 0.963
VF_0_Loss : 9.64e-05


ADV1:  0.00044151445812929026 0.008353478105661784 0.051223353803365984 -0.05852576873659329
ADV2:  0.015220298004255011 0.8743541523027627 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.1537   1.2861   5.9181  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0006   0.0003   0.0012   5.4889   2.1784  

cs_angles |  0.0005  0.0037 |  0.0780  0.0813 | -0.9872 -0.9998 |  0.9904  0.9989
optical_flow |  0.0002  0.0001 |  0.0265  0.0255 | -0.9069 -1.3386 |  1.0000  1.1500
v_err    | -0.0103 |  0.0580 | -0.4527 |  0.1207
landing_rewards |    9.29 |    2.57 |    0.00 |   10.00
landing_margin |   -0.03 |    0.02 |   -0.06 |    0.04
tracking_rewards |  -18.47 |    4.39 |  -40.70 |  -11.16
steps    |     377 |      21 |     335 |     417
***** Episode 50257, Mean R = -15.5  Std R = 6.5  Min R = -28.0
PolicyLoss: -0.0158
Policy_Beta: 0.1
Policy_Entropy: 0.152
Policy_KL: 0.000913
Policy_SD: 0.563
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 1.8e+07
VF_0_ExplainedVarNew: 0.96
VF_0_ExplainedVarOld: 0.953
VF_0_Loss : 0.000102


ADV1:  0.0030468632193002706 0.008573272592735858 0.0647231710345576 -0.06782045439088419
ADV2:  -0.011041802725708975 0.8881484905508811 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.8091   0.7741   3.6162  24.0260  15.5251  10.0673
ValFun  Gradients: u/

w        |   -0.00    0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.03    0.28 |    0.64    1.84 |   -1.37   -3.12 |    1.47    3.11
w_f      |    0.00    0.00    0.00 |    0.02    0.01    0.01 |   -0.05   -0.02   -0.03 |    0.05    0.04    0.03
w_rewards |   -0.00 |    0.00 |   -0.02 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.24 |    0.24 |    0.00 |    1.61
seeker_angles |    0.00    0.00 |    0.08    0.09 |   -0.99   -1.00 |    0.98    0.99
cs_angles |  0.0027  0.0035 |  0.0762  0.0855 | -0.9867 -0.9968 |  0.9779  0.9896
optical_flow | -0.0000  0.0000 |  0.0264  0.0260 | -1.1527 -1.2832 |  1.0931  1.3611
v_err    | -0.0104 |  0.0578 | -0.4520 |  0.1625
landing_rewards |    9.23 |    2.67 |    0.00 |   10.00
landing_margin |   -0.02 |    0.02 |   -0.07 |    0.06
tracking_rewards |  -18.47 |    4.65 |  -43.27 |  -10.74
steps    |     376 |  

attitude |    0.00   -0.05    0.19 |    1.24    0.66    1.86 |   -3.14   -1.57   -3.14 |    3.14    1.57    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.05    0.20 |    0.67    1.84 |   -1.54   -3.14 |    1.40    3.14
w_f      |    0.00    0.00    0.00 |    0.02    0.01    0.01 |   -0.04   -0.02   -0.04 |    0.04    0.03    0.02
w_rewards |    0.00 |    0.00 |    0.00 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.24 |    0.25 |    0.00 |    1.50
seeker_angles |    0.00   -0.00 |    0.08    0.08 |   -0.97   -0.98 |    0.99    1.00
cs_angles |  0.0015 -0.0017 |  0.0770  0.0810 | -0.9717 -0.9753 |  0.9934  0.9996
optical_flow | -0.0001  0.0001 |  0.0273  0.0253 | -1.3649 -1.1599 |  1.2687  0.9224
v_err    | -0.0105 |  0.0581 | -0.4531 |  0.1257
landing_rewards |    9.35 |    2.46 |    0.00 |   10.00
landing_margin |   -0

attitude |    0.08   -0.03    0.07 |    1.14    0.68    1.83 |   -3.14   -1.55   -3.14 |    3.14    1.56    3.14
w        |   -0.00    0.00   -0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.04    0.06 |    0.68    1.80 |   -1.43   -3.10 |    1.47    3.13
w_f      |   -0.00    0.00   -0.00 |    0.02    0.01    0.01 |   -0.05   -0.03   -0.02 |    0.04    0.02    0.02
w_rewards |    0.00 |    0.00 |    0.00 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.24 |    0.24 |    0.00 |    1.49
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -0.99   -0.99 |    0.97    0.94
cs_angles |  0.0011  0.0005 |  0.0777  0.0806 | -0.9865 -0.9878 |  0.9707  0.9444
optical_flow |  0.0001  0.0001 |  0.0270  0.0257 | -1.4032 -1.1742 |  1.0141  1.1508
v_err    | -0.0105 |  0.0578 | -0.4533 |  0.1188
landing_rewards |    9.39 |    2.40 |    0.00 |   10.00
landing_margin |   -0

attitude |   -0.08    0.00   -0.09 |    1.11    0.68    1.79 |   -3.14   -1.54   -3.14 |    3.14    1.53    3.14
w        |   -0.00    0.00   -0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.01   -0.12 |    0.68    1.80 |   -1.46   -3.14 |    1.50    3.14
w_f      |   -0.00    0.00    0.00 |    0.02    0.01    0.01 |   -0.05   -0.02   -0.02 |    0.04    0.02    0.02
w_rewards |   -0.00 |    0.00 |   -0.01 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.25 |    0.25 |    0.00 |    1.50
seeker_angles |    0.00    0.00 |    0.08    0.09 |   -0.99   -1.00 |    0.99    1.00
cs_angles |  0.0040  0.0015 |  0.0779  0.0857 | -0.9936 -0.9952 |  0.9906  0.9981
optical_flow |  0.0001 -0.0001 |  0.0261  0.0263 | -1.0832 -1.4106 |  1.1492  1.2751
v_err    | -0.0106 |  0.0582 | -0.4525 |  0.1141
landing_rewards |    9.39 |    2.40 |    0.00 |   10.00
landing_margin |   -0

w        |   -0.00    0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.04   -0.11 |    0.67    1.88 |   -1.34   -3.12 |    1.54    3.14
w_f      |   -0.00    0.00    0.00 |    0.02    0.01    0.01 |   -0.05   -0.02   -0.02 |    0.04    0.02    0.02
w_rewards |   -0.00 |    0.00 |   -0.03 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.25 |    0.25 |    0.00 |    1.41
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -0.99   -0.99 |    1.00    0.99
cs_angles |  0.0043  0.0026 |  0.0792  0.0840 | -0.9882 -0.9887 |  0.9960  0.9927
optical_flow |  0.0002 -0.0001 |  0.0275  0.0244 | -1.1238 -1.3688 |  1.1374  0.9193
v_err    | -0.0104 |  0.0580 | -0.4531 |  0.1094
landing_rewards |    9.16 |    2.77 |    0.00 |   10.00
landing_margin |   -0.03 |    0.02 |   -0.06 |    0.03
tracking_rewards |  -18.59 |    4.54 |  -45.35 |   -9.57
steps    |     376 |  

w        |   -0.00    0.00   -0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.00    0.07 |    0.66    1.90 |   -1.44   -3.13 |    1.54    3.13
w_f      |   -0.00    0.00   -0.00 |    0.02    0.01    0.01 |   -0.05   -0.04   -0.03 |    0.05    0.02    0.03
w_rewards |    0.00 |    0.00 |    0.00 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.24 |    0.25 |    0.00 |    1.51
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -0.99   -0.97 |    1.00    0.98
cs_angles |  0.0009  0.0037 |  0.0797  0.0808 | -0.9939 -0.9685 |  0.9966  0.9781
optical_flow | -0.0000  0.0001 |  0.0265  0.0256 | -1.0740 -0.9328 |  1.2014  1.1431
v_err    | -0.0100 |  0.0583 | -0.4528 |  0.1068
landing_rewards |    9.68 |    1.77 |    0.00 |   10.00
landing_margin |   -0.03 |    0.01 |   -0.06 |    0.02
tracking_rewards |  -18.44 |    4.48 |  -41.07 |  -10.70
steps    |     378 |  

w        |   -0.00    0.00   -0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.03   -0.09 |    0.69    1.82 |   -1.48   -3.14 |    1.52    3.12
w_f      |   -0.00    0.00    0.00 |    0.02    0.01    0.01 |   -0.04   -0.03   -0.03 |    0.05    0.02    0.03
w_rewards |   -0.00 |    0.00 |   -0.00 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.24 |    0.24 |    0.00 |    1.53
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -0.98   -0.97 |    0.97    0.99
cs_angles |  0.0010  0.0026 |  0.0761  0.0818 | -0.9826 -0.9738 |  0.9704  0.9917
optical_flow |  0.0001  0.0000 |  0.0263  0.0246 | -1.3632 -1.1729 |  1.1156  0.9148
v_err    | -0.0101 |  0.0579 | -0.4516 |  0.1069
landing_rewards |    9.58 |    2.00 |    0.00 |   10.00
landing_margin |   -0.03 |    0.01 |   -0.06 |    0.02
tracking_rewards |  -18.34 |    4.34 |  -41.21 |  -11.14
steps    |     378 |  

w        |   -0.00    0.00   -0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.05   -0.08 |    0.59    1.81 |   -1.41   -3.14 |    1.40    3.13
w_f      |   -0.00    0.00    0.00 |    0.02    0.01    0.01 |   -0.05   -0.02   -0.03 |    0.04    0.02    0.02
w_rewards |   -0.00 |    0.00 |   -0.01 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.24 |    0.25 |    0.00 |    1.48
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -0.99   -0.99 |    1.00    0.98
cs_angles |  0.0030  0.0017 |  0.0786  0.0807 | -0.9949 -0.9865 |  0.9975  0.9827
optical_flow | -0.0000  0.0000 |  0.0263  0.0254 | -1.1184 -1.1323 |  0.9948  1.1265
v_err    | -0.0101 |  0.0581 | -0.4527 |  0.1046
landing_rewards |    9.65 |    1.85 |    0.00 |   10.00
landing_margin |   -0.03 |    0.01 |   -0.06 |    0.02
tracking_rewards |  -18.09 |    4.20 |  -35.59 |  -10.43
steps    |     376 |  

attitude |    0.02   -0.03    0.06 |    1.13    0.66    1.81 |   -3.14   -1.57   -3.14 |    3.14    1.57    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.04    0.03 |    0.67    1.80 |   -1.46   -3.11 |    1.53    3.14
w_f      |   -0.00    0.00    0.00 |    0.02    0.01    0.01 |   -0.05   -0.02   -0.03 |    0.04    0.02    0.03
w_rewards |   -0.00 |    0.00 |   -0.00 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.24 |    0.24 |    0.00 |    1.56
seeker_angles |    0.00    0.00 |    0.07    0.08 |   -1.00   -0.97 |    1.00    0.98
cs_angles |  0.0025  0.0012 |  0.0746  0.0810 | -0.9982 -0.9713 |  0.9964  0.9838
optical_flow |  0.0002  0.0000 |  0.0263  0.0244 | -1.3860 -1.1112 |  1.0656  1.1004
v_err    | -0.0102 |  0.0584 | -0.4526 |  0.1072
landing_rewards |    9.45 |    2.28 |    0.00 |   10.00
landing_margin |   -0

attitude |    0.01    0.02   -0.02 |    1.14    0.64    1.92 |   -3.14   -1.57   -3.14 |    3.14    1.57    3.14
w        |   -0.00    0.00   -0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.01   -0.07 |    0.62    1.91 |   -1.48   -3.14 |    1.40    3.10
w_f      |   -0.00    0.00    0.00 |    0.02    0.01    0.01 |   -0.05   -0.02   -0.02 |    0.04    0.02    0.02
w_rewards |   -0.00 |    0.00 |   -0.02 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.24 |    0.25 |    0.00 |    1.66
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -0.99   -0.99 |    0.98    0.99
cs_angles |  0.0033  0.0008 |  0.0804  0.0818 | -0.9925 -0.9949 |  0.9844  0.9864
optical_flow |  0.0000  0.0001 |  0.0254  0.0243 | -1.1820 -0.9779 |  1.2824  1.2288
v_err    | -0.0100 |  0.0584 | -0.4533 |  0.1188
landing_rewards |    9.19 |    2.72 |    0.00 |   10.00
landing_margin |   -0

attitude |    0.05   -0.01   -0.10 |    1.16    0.66    1.79 |   -3.14   -1.55   -3.14 |    3.14    1.56    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.02   -0.07 |    0.67    1.79 |   -1.48   -3.14 |    1.53    3.14
w_f      |   -0.00    0.00    0.00 |    0.02    0.01    0.01 |   -0.05   -0.02   -0.02 |    0.04    0.03    0.02
w_rewards |    0.00 |    0.00 |    0.00 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.24 |    0.24 |    0.00 |    1.64
seeker_angles |    0.01    0.00 |    0.08    0.08 |   -0.99   -0.97 |    1.00    1.00
cs_angles |  0.0053  0.0033 |  0.0758  0.0800 | -0.9919 -0.9675 |  0.9952  0.9986
optical_flow |  0.0002 -0.0000 |  0.0264  0.0247 | -1.2631 -0.9817 |  1.0896  1.0118
v_err    | -0.0100 |  0.0579 | -0.4520 |  0.1117
landing_rewards |    9.58 |    2.00 |    0.00 |   10.00
landing_margin |   -0

attitude |   -0.02   -0.06   -0.12 |    1.23    0.70    1.91 |   -3.14   -1.57   -3.14 |    3.14    1.57    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.04   -0.11 |    0.70    1.90 |   -1.39   -3.13 |    1.44    3.14
w_f      |   -0.00    0.00    0.00 |    0.02    0.01    0.01 |   -0.05   -0.02   -0.03 |    0.04    0.02    0.03
w_rewards |   -0.00 |    0.00 |   -0.01 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.24 |    0.25 |    0.00 |    1.63
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -0.98   -1.00 |    0.98    0.97
cs_angles |  0.0027  0.0008 |  0.0787  0.0819 | -0.9797 -0.9959 |  0.9821  0.9664
optical_flow |  0.0001  0.0000 |  0.0262  0.0254 | -1.2543 -1.1012 |  1.2537  1.0998
v_err    | -0.0104 |  0.0578 | -0.4511 |  0.1123
landing_rewards |    9.68 |    1.77 |    0.00 |   10.00
landing_margin |   -0

thrust   |   -0.01   -0.01    0.00 |    0.68    0.68    0.67 |   -3.45   -3.46   -3.38 |    3.41    3.36    3.46
norm_thrust |    0.90 |    0.76 |    0.00 |    3.46
fuel     |    1.55 |    0.19 |    1.04 |    2.30
rewards  |  -13.02 |    4.31 |  -29.28 |   -4.84
fuel_rewards |   -4.45 |    0.55 |   -6.61 |   -2.98
glideslope_rewards |    0.00 |    0.00 |    0.00 |    0.00
glideslope_penalty |    0.00 |    0.00 |    0.00 |    0.00
glideslope |    2.99 |   12.45 |    0.01 |  273.75
norm_af  |    1.74 |    0.94 |    0.07 |    3.26
norm_wf  |    0.02 |    0.01 |    0.00 |    0.05
rh_penalty |    0.00 |    0.00 |    0.00 |    0.00
att_rewards |    0.00 |    0.00 |    0.00 |    0.00
att_penalty |    0.00 |    0.00 |    0.00 |    0.00
attitude |   -0.03    0.02    0.15 |    1.17    0.65    1.86 |   -3.14   -1.54   -3.14 |    3.14    1.56    3.14
w        |    0.00    0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.03    0.09 |    0.65

ADV1:  -0.0004084007270655154 0.0087245551476951 0.05237973939913021 -0.08956406925893948
ADV2:  0.025618757800311084 0.8320607999261104 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.0127   0.8869   4.5267  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0016   0.0008   0.0034   5.4889   2.1784   2.1397
Update Cnt = 1760    ET =   1062.4   Stats:  Mean, Std, Min, Max
r_f      |    2.99   -3.85    6.39 |  190.26  176.80  195.46 | -381.66 -381.33 -369.99 |  397.69  390.60  397.63
v_f      |   -0.00   -0.00    0.00 |    0.04    0.04    0.05 |   -0.10   -0.09   -0.08 |    0.09    0.10    0.10
r_i      |    6.07  -28.65    8.92 |  689.96  682.86  748.12 |-1293.10-1339.72-1324.20 | 1322.71 1297.03 1393.32
v_i      |    0.00    0.00   -0.00 |    0.04    0.04    0.05 |   -0.09   -0.10   -0.10 |    0.09    0.09    0.09
norm_rf  |    0.22 |    0.09 |    0.06 |    0.54
norm_vf  |    0.07 |    0.01 |    0.03 |    0.11
gs_f     |    1.21 |    1.71 |   

***** Episode 54845, Mean R = -13.4  Std R = 4.9  Min R = -33.2
PolicyLoss: -0.0146
Policy_Beta: 0.1
Policy_Entropy: 0.153
Policy_KL: 0.00105
Policy_SD: 0.551
Policy_lr_mult: 0.198
Steps: 1.15e+04
TotalSteps: 1.97e+07
VF_0_ExplainedVarNew: 0.978
VF_0_ExplainedVarOld: 0.975
VF_0_Loss : 0.000305


ADV1:  -0.001362791201970603 0.008112642117959234 0.04581951295146841 -0.058430805104567586
ADV2:  0.038136647515337914 0.8442906454658824 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.6480   0.8411   4.7184  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0013   0.0008   0.0035   5.4889   2.1784   2.1397
***** Episode 54876, Mean R = -14.1  Std R = 5.4  Min R = -23.6
PolicyLoss: -0.0303
Policy_Beta: 0.1
Policy_Entropy: 0.158
Policy_KL: 0.00109
Policy_SD: 0.545
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 1.97e+07
VF_0_ExplainedVarNew: 0.977
VF_0_ExplainedVarOld: 0.973
VF_0_Loss : 0.000795


ADV1:  0.0016236127289664516 0.007746006920514591 0.

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   3.1574   1.8742   9.9738  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0015   0.0009   0.0031   5.4889   2.1784   2.1397
***** Episode 55124, Mean R = -13.0  Std R = 5.8  Min R = -32.9
PolicyLoss: -0.00495
Policy_Beta: 0.1
Policy_Entropy: 0.159
Policy_KL: 0.000706
Policy_SD: 0.54
Policy_lr_mult: 0.198
Steps: 1.18e+04
TotalSteps: 1.98e+07
VF_0_ExplainedVarNew: 0.985
VF_0_ExplainedVarOld: 0.98
VF_0_Loss : 0.000397


ADV1:  -0.003694174776689386 0.010900741279188976 0.0552388788167304 -0.07944637865819254
ADV2:  0.040900479386846364 0.8930461228104394 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.5759   0.8358   4.4589  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0043   0.0026   0.0096   5.4889   2.1784   2.1397
***** Episode 55155, Mean R = -14.4  Std R = 7.1  Min R = -32.0
PolicyLoss: -0.0201
Policy_Beta: 0.1
Policy_Entropy: 0.16
Policy_KL: 0.000753
Pol

ADV1:  -7.184897437576271e-05 0.007442817392834276 0.04846667067985372 -0.07842883103630022
ADV2:  0.02200858818734684 0.8069338604627779 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.3979   1.0088   4.5790  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0008   0.0005   0.0019   5.4889   2.1784   2.1397
***** Episode 55403, Mean R = -13.0  Std R = 5.9  Min R = -31.1
PolicyLoss: -0.0254
Policy_Beta: 0.1
Policy_Entropy: 0.158
Policy_KL: 0.000738
Policy_SD: 0.543
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 1.99e+07
VF_0_ExplainedVarNew: 0.978
VF_0_ExplainedVarOld: 0.975
VF_0_Loss : 0.000144


ADV1:  -0.0006620036523537222 0.01018083312575119 0.10104857484499619 -0.08439542896646512
ADV2:  0.024598069946379482 0.8736344446091849 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.6511   1.5975   7.9934  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0007   0.0004   0.0017   5.4889   2.1784   2.1

ADV1:  -0.0034869902980736206 0.010409130334237708 0.05025594006382231 -0.06590703497530481
ADV2:  0.04478175960075253 0.8767627864258363 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.9511   1.4490   6.1043  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0039   0.0023   0.0090   5.4889   2.1784   2.1397
***** Episode 55682, Mean R = -16.0  Std R = 7.5  Min R = -34.9
PolicyLoss: -0.0254
Policy_Beta: 0.1
Policy_Entropy: 0.156
Policy_KL: 0.000984
Policy_SD: 0.565
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 2e+07
VF_0_ExplainedVarNew: 0.963
VF_0_ExplainedVarOld: 0.96
VF_0_Loss : 0.000102


ADV1:  0.001703317701346705 0.007394037362215993 0.06889311362927814 -0.06925456769740684
ADV2:  0.00133261244314452 0.8464206061741449 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.8261   0.9055   3.5645  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0020   0.0011   0.0045   5.4889   2.1784   2.1397
**

ADV1:  -0.0001807032410897458 0.007957914273948615 0.050914848522415235 -0.055463291299093255
ADV2:  0.02590123901600083 0.8366541562365325 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.8004   0.9781   5.4150  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0003   0.0002   0.0008   5.4889   2.1784   2.1397
***** Episode 55961, Mean R = -12.1  Std R = 4.4  Min R = -27.1
PolicyLoss: -0.0285
Policy_Beta: 0.1
Policy_Entropy: 0.158
Policy_KL: 0.000722
Policy_SD: 0.547
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 2.01e+07
VF_0_ExplainedVarNew: 0.97
VF_0_ExplainedVarOld: 0.966
VF_0_Loss : 6.41e-05


ADV1:  0.0012870931487299077 0.008749934881522104 0.051552251326375614 -0.07771853142760354
ADV2:  0.012080067310194164 0.8446354673795531 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.4155   0.5038   2.7719  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0019   0.0010   0.0040   5.4889   2.1784   2

ADV1:  0.0015989298467824517 0.007250573904724729 0.0411024418687953 -0.05849818191341531
ADV2:  0.0015324528605404116 0.8744128487241999 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.9525   1.3116   7.0210  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0021   0.0012   0.0044   5.4889   2.1784   2.1397
***** Episode 56240, Mean R = -13.1  Std R = 5.2  Min R = -27.1
PolicyLoss: -0.0197
Policy_Beta: 0.1
Policy_Entropy: 0.159
Policy_KL: 0.00092
Policy_SD: 0.537
Policy_lr_mult: 0.198
Steps: 1.19e+04
TotalSteps: 2.02e+07
VF_0_ExplainedVarNew: 0.978
VF_0_ExplainedVarOld: 0.975
VF_0_Loss : 0.000675


ADV1:  0.00020296583686933833 0.007844962427567211 0.05148769097116254 -0.05156935359285862
ADV2:  0.019247489132162142 0.8510022592010664 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.3154   0.9291   4.6667  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0010   0.0005   0.0022   5.4889   2.1784   2.1

***** Episode 56488, Mean R = -15.0  Std R = 5.9  Min R = -31.8
PolicyLoss: -0.0166
Policy_Beta: 0.1
Policy_Entropy: 0.158
Policy_KL: 0.00117
Policy_SD: 0.547
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 2.03e+07
VF_0_ExplainedVarNew: 0.977
VF_0_ExplainedVarOld: 0.973
VF_0_Loss : 0.000241


ADV1:  0.0009571572396272482 0.007563947380281576 0.06543551489554994 -0.07495904781666513
ADV2:  0.009736071110430356 0.8603306233477134 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   3.1489   2.2440   9.5340  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0011   0.0006   0.0025   5.4889   2.1784   2.1397
***** Episode 56519, Mean R = -12.9  Std R = 5.0  Min R = -28.3
PolicyLoss: -0.0222
Policy_Beta: 0.1
Policy_Entropy: 0.16
Policy_KL: 0.000754
Policy_SD: 0.542
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 2.03e+07
VF_0_ExplainedVarNew: 0.977
VF_0_ExplainedVarOld: 0.972
VF_0_Loss : 0.000976


ADV1:  -0.00014437103115649152 0.008785855080375734 0

***** Episode 56767, Mean R = -13.6  Std R = 5.2  Min R = -29.3
PolicyLoss: -0.00428
Policy_Beta: 0.1
Policy_Entropy: 0.16
Policy_KL: 0.000748
Policy_SD: 0.555
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 2.04e+07
VF_0_ExplainedVarNew: 0.987
VF_0_ExplainedVarOld: 0.983
VF_0_Loss : 0.000352


ADV1:  -0.0002057825610737665 0.005649216495265638 0.0449273198933926 -0.03173499594288959
ADV2:  -0.007520268928021556 0.8685344510992394 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   3.1893   1.7241   8.9514  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0008   0.0005   0.0021   5.4889   2.1784   2.1397
***** Episode 56798, Mean R = -11.1  Std R = 4.1  Min R = -22.6
PolicyLoss: 0.00767
Policy_Beta: 0.1
Policy_Entropy: 0.159
Policy_KL: 0.00105
Policy_SD: 0.531
Policy_lr_mult: 0.198
Steps: 1.15e+04
TotalSteps: 2.04e+07
VF_0_ExplainedVarNew: 0.985
VF_0_ExplainedVarOld: 0.982
VF_0_Loss : 3.42e-05


ADV1:  -0.0027397156983126163 0.005757264303846425 

seeker_angles |    0.00    0.00 |    0.07    0.08 |   -0.97   -0.99 |    0.99    1.00
cs_angles |  0.0034  0.0006 |  0.0743  0.0817 | -0.9750 -0.9915 |  0.9929  0.9950
optical_flow |  0.0002  0.0001 |  0.0264  0.0249 | -1.1042 -1.1700 |  1.3503  1.0753
v_err    | -0.0096 |  0.0581 | -0.4527 |  0.1154
landing_rewards |    9.68 |    1.77 |    0.00 |   10.00
landing_margin |   -0.03 |    0.01 |   -0.07 |    0.02
tracking_rewards |  -17.79 |    4.15 |  -35.00 |  -10.17
steps    |     376 |      21 |     328 |     415
***** Episode 57077, Mean R = -13.9  Std R = 5.7  Min R = -31.8
PolicyLoss: -0.0206
Policy_Beta: 0.1
Policy_Entropy: 0.159
Policy_KL: 0.000924
Policy_SD: 0.563
Policy_lr_mult: 0.198
Steps: 1.15e+04
TotalSteps: 2.06e+07
VF_0_ExplainedVarNew: 0.982
VF_0_ExplainedVarOld: 0.98
VF_0_Loss : 0.000311


ADV1:  -0.0019287693669840806 0.009171348885190536 0.04492522152851969 -0.06820098543864977
ADV2:  0.037698240537725435 0.8625398477153575 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Ma

attitude |    0.07    0.03    0.04 |    1.15    0.68    1.84 |   -3.14   -1.56   -3.14 |    3.14    1.57    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.02   -0.02 |    0.68    1.84 |   -1.48   -3.13 |    1.49    3.11
w_f      |   -0.00    0.00    0.00 |    0.02    0.01    0.01 |   -0.04   -0.02   -0.02 |    0.04    0.02    0.04
w_rewards |   -0.00 |    0.00 |   -0.05 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.24 |    0.24 |    0.00 |    1.98
seeker_angles |    0.01    0.01 |    0.08    0.08 |   -1.00   -0.99 |    1.00    0.99
cs_angles |  0.0063  0.0055 |  0.0764  0.0792 | -0.9976 -0.9933 |  0.9984  0.9946
optical_flow |  0.0001  0.0000 |  0.0258  0.0238 | -1.2500 -1.2324 |  1.1971  1.2009
v_err    | -0.0097 |  0.0583 | -0.4522 |  0.1143
landing_rewards |    9.48 |    2.21 |    0.00 |   10.00
landing_margin |   -0

attitude |    0.07   -0.05    0.01 |    1.27    0.69    1.88 |   -3.14   -1.56   -3.14 |    3.14    1.57    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.04    0.10 |    0.68    1.89 |   -1.47   -3.12 |    1.52    3.09
w_f      |   -0.00    0.00   -0.00 |    0.02    0.01    0.01 |   -0.05   -0.02   -0.03 |    0.04    0.02    0.02
w_rewards |   -0.00 |    0.00 |   -0.02 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.25 |    0.25 |    0.00 |    1.47
seeker_angles |    0.01    0.00 |    0.08    0.08 |   -1.00   -0.97 |    1.00    1.00
cs_angles |  0.0055  0.0026 |  0.0798  0.0814 | -0.9962 -0.9691 |  0.9995  0.9969
optical_flow | -0.0000 -0.0001 |  0.0271  0.0241 | -1.1922 -1.1396 |  1.2907  1.0826
v_err    | -0.0100 |  0.0587 | -0.4522 |  0.1030
landing_rewards |    9.74 |    1.59 |    0.00 |   10.00
landing_margin |   -0

thrust   |    0.00   -0.00   -0.01 |    0.67    0.67    0.68 |   -3.44   -3.39   -3.44 |    3.41    3.42    3.45
norm_thrust |    0.89 |    0.76 |    0.00 |    3.46
fuel     |    1.53 |    0.19 |    1.07 |    2.10
rewards  |  -12.76 |    5.11 |  -36.50 |   -4.30
fuel_rewards |   -4.38 |    0.54 |   -6.01 |   -3.10
glideslope_rewards |    0.00 |    0.00 |    0.00 |    0.00
glideslope_penalty |    0.00 |    0.00 |    0.00 |    0.00
glideslope |    3.15 |   13.14 |    0.01 |  926.66
norm_af  |    1.71 |    0.96 |    0.10 |    3.31
norm_wf  |    0.02 |    0.01 |    0.00 |    0.06
rh_penalty |    0.00 |    0.00 |    0.00 |    0.00
att_rewards |    0.00 |    0.00 |    0.00 |    0.00
att_penalty |    0.00 |    0.00 |    0.00 |    0.00
attitude |    0.06    0.03   -0.13 |    1.20    0.66    1.84 |   -3.14   -1.57   -3.14 |    3.14    1.56    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.03   -0.13 |    0.66

ADV1:  0.0010957773098910308 0.009790661118831201 0.04134083003229333 -0.06178836762905121
ADV2:  0.014530324580982518 0.8697963108114606 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.7762   0.7522   3.1481  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0014   0.0008   0.0031   5.4889   2.1784   2.1397
Update Cnt = 1880    ET =   1142.7   Stats:  Mean, Std, Min, Max
r_f      |  -16.77   -1.19   -6.31 |  187.20  166.95  200.85 | -383.72 -392.31 -385.44 |  378.30  376.70  394.34
v_f      |    0.00   -0.00    0.00 |    0.04    0.04    0.05 |   -0.09   -0.10   -0.10 |    0.10    0.08    0.10
r_i      |  -65.53   13.93  -41.97 |  702.45  633.97  765.56 |-1288.02-1267.59-1307.43 | 1328.16 1278.13 1362.56
v_i      |    0.01   -0.00    0.00 |    0.04    0.04    0.05 |   -0.09   -0.09   -0.10 |    0.09    0.09    0.09
norm_rf  |    0.22 |    0.09 |    0.04 |    0.51
norm_vf  |    0.08 |    0.01 |    0.04 |    0.12
gs_f     |    1.44 |    2.75 |  

ADV1:  0.0012162263087314186 0.006152797498501879 0.04897054582341315 -0.07216663935588596
ADV2:  -0.0013222369965923855 0.8968018395199462 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.8069   0.7765   3.9638  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0012   0.0007   0.0032   5.4889   2.1784   2.1397
***** Episode 58596, Mean R = -12.2  Std R = 6.8  Min R = -42.0
PolicyLoss: -0.0148
Policy_Beta: 0.1
Policy_Entropy: 0.159
Policy_KL: 0.00078
Policy_SD: 0.538
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 2.11e+07
VF_0_ExplainedVarNew: 0.985
VF_0_ExplainedVarOld: 0.983
VF_0_Loss : 0.00087


ADV1:  0.00201370584430751 0.006510184067544438 0.056153591638673284 -0.05432628921590099
ADV2:  -0.004810342285552436 0.8872621387938704 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   3.2279   2.0360  10.6866  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0029   0.0017   0.0059   5.4889   2.1784   2.1

ADV1:  0.00044352863475398294 0.007460568159205675 0.048470187778031026 -0.06564101930853761
ADV2:  0.017169318410830997 0.836569730848862 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.0178   0.5535   3.1644  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0007   0.0004   0.0015   5.4889   2.1784   2.1397
***** Episode 58875, Mean R = -10.9  Std R = 4.4  Min R = -23.1
PolicyLoss: -0.0259
Policy_Beta: 0.1
Policy_Entropy: 0.162
Policy_KL: 0.000953
Policy_SD: 0.519
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 2.12e+07
VF_0_ExplainedVarNew: 0.97
VF_0_ExplainedVarOld: 0.966
VF_0_Loss : 0.000226


ADV1:  0.000595685513247942 0.007442208419084736 0.04425629159262906 -0.0655009464308296
ADV2:  0.01203766147221281 0.8541718004341597 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.4199   0.8010   4.2550  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0008   0.0005   0.0017   5.4889   2.1784   2.1397

ADV1:  -0.0020952902329566666 0.006996221588446692 0.04745951618087271 -0.0774514924223415
ADV2:  0.04942231313701534 0.819675482845497 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.7796   0.9262   3.5917  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0023   0.0014   0.0054   5.4889   2.1784   2.1397
***** Episode 59154, Mean R = -12.9  Std R = 4.6  Min R = -23.5
PolicyLoss: -0.0308
Policy_Beta: 0.1
Policy_Entropy: 0.163
Policy_KL: 0.000587
Policy_SD: 0.532
Policy_lr_mult: 0.198
Steps: 1.18e+04
TotalSteps: 2.13e+07
VF_0_ExplainedVarNew: 0.98
VF_0_ExplainedVarOld: 0.977
VF_0_Loss : 0.000396


ADV1:  0.0016662016140097575 0.006559102002644554 0.04983141819765324 -0.05581692895641788
ADV2:  0.0010409506167669562 0.8257027454712427 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.0926   0.8757   4.5684  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0017   0.0011   0.0043   5.4889   2.1784   2.139

ADV1:  0.004251631580467108 0.006391589102312281 0.05628129853867725 -0.064128734934359
ADV2:  -0.027389028437254343 0.8890988955706158 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.0798   0.8234   4.3939  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0049   0.0031   0.0109   5.4889   2.1784   2.1397
***** Episode 59433, Mean R = -12.0  Std R = 4.6  Min R = -22.4
PolicyLoss: -0.0138
Policy_Beta: 0.1
Policy_Entropy: 0.165
Policy_KL: 0.00072
Policy_SD: 0.514
Policy_lr_mult: 0.198
Steps: 1.19e+04
TotalSteps: 2.14e+07
VF_0_ExplainedVarNew: 0.986
VF_0_ExplainedVarOld: 0.98
VF_0_Loss : 6.98e-05


ADV1:  -0.00259932887571893 0.006656015553529072 0.037072380422071255 -0.056009081800794454
ADV2:  0.05683975540326759 0.8182817708361856 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.5648   0.6728   4.1479  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0028   0.0018   0.0068   5.4889   2.1784   2.1397


ADV1:  0.002761324709879955 0.007102063165050547 0.052775702023565296 -0.04727711811940319
ADV2:  -0.011181581892261011 0.8670524228598199 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.1918   0.7365   3.6185  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0034   0.0020   0.0074   5.4889   2.1784   2.1397
***** Episode 59712, Mean R = -13.6  Std R = 5.4  Min R = -28.0
PolicyLoss: -0.0151
Policy_Beta: 0.1
Policy_Entropy: 0.162
Policy_KL: 0.000773
Policy_SD: 0.534
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 2.15e+07
VF_0_ExplainedVarNew: 0.983
VF_0_ExplainedVarOld: 0.979
VF_0_Loss : 8.75e-05


ADV1:  -1.0065881895164377e-05 0.007730042207834103 0.03750546469502125 -0.08485976321400635
ADV2:  0.02686146405337769 0.8254694611043155 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.6944   0.6797   3.3799  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0013   0.0007   0.0026   5.4889   2.1784   2

***** Episode 59960, Mean R = -14.1  Std R = 4.7  Min R = -27.9
PolicyLoss: -0.0314
Policy_Beta: 0.1
Policy_Entropy: 0.162
Policy_KL: 0.000921
Policy_SD: 0.542
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 2.16e+07
VF_0_ExplainedVarNew: 0.975
VF_0_ExplainedVarOld: 0.972
VF_0_Loss : 0.000573


ADV1:  0.0036700244896319596 0.00743094073458218 0.05521813046898083 -0.07029531559519615
ADV2:  -0.01354670794643771 0.8471861827541692 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.3437   0.7139   2.8693  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0040   0.0025   0.0095   5.4889   2.1784   2.1397
***** Episode 59991, Mean R = -12.6  Std R = 5.7  Min R = -30.3
PolicyLoss: -0.0244
Policy_Beta: 0.1
Policy_Entropy: 0.162
Policy_KL: 0.000734
Policy_SD: 0.537
Policy_lr_mult: 0.198
Steps: 1.18e+04
TotalSteps: 2.17e+07
VF_0_ExplainedVarNew: 0.979
VF_0_ExplainedVarOld: 0.976
VF_0_Loss : 0.000417


ADV1:  -0.0019170967662438766 0.007804170150465962 0

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.0553   1.5607   7.5327  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0007   0.0004   0.0017   5.4889   2.1784   2.1397
***** Episode 60239, Mean R = -13.4  Std R = 6.5  Min R = -31.0
PolicyLoss: -0.0218
Policy_Beta: 0.1
Policy_Entropy: 0.164
Policy_KL: 0.000783
Policy_SD: 0.53
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 2.17e+07
VF_0_ExplainedVarNew: 0.96
VF_0_ExplainedVarOld: 0.954
VF_0_Loss : 0.000183


ADV1:  0.0008536551235217428 0.006418281865304137 0.03607366456820396 -0.049894627395294766
ADV2:  -0.0038505288271736163 0.9123477049218153 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   3.1301   1.3895   8.2243  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0012   0.0007   0.0024   5.4889   2.1784   2.1397
***** Episode 60270, Mean R = -12.4  Std R = 4.5  Min R = -26.3
PolicyLoss: -0.00953
Policy_Beta: 0.1
Policy_Entropy: 0.163
Policy_KL: 0.001
P

ADV1:  -0.0006579997384557488 0.0054134142321334905 0.0437686478492155 -0.060249213360973275
ADV2:  0.006146293969875334 0.8901237613130889 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   4.6678   2.8266  12.2087  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0007   0.0005   0.0017   5.4889   2.1784   2.1397
***** Episode 60518, Mean R = -12.0  Std R = 4.8  Min R = -25.6
PolicyLoss: -0.000701
Policy_Beta: 0.0667
Policy_Entropy: 0.162
Policy_KL: 0.00208
Policy_SD: 0.531
Policy_lr_mult: 0.198
Steps: 1.19e+04
TotalSteps: 2.19e+07
VF_0_ExplainedVarNew: 0.986
VF_0_ExplainedVarOld: 0.984
VF_0_Loss : 0.000462


ADV1:  -0.001337753329640619 0.007840795166907631 0.0517673540583502 -0.06413992652616392
ADV2:  0.03528404274581456 0.8152281356990784 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   5.3517   2.0125   9.5249  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0016   0.0010   0.0035   5.4889   2.1784  

cs_angles |  0.0005  0.0000 |  0.0772  0.0819 | -0.9462 -0.9937 |  0.9770  0.9806
optical_flow |  0.0001  0.0001 |  0.0253  0.0242 | -1.0431 -1.1061 |  1.4629  1.0576
v_err    | -0.0102 |  0.0577 | -0.4528 |  0.1072
landing_rewards |    9.55 |    2.08 |    0.00 |   10.00
landing_margin |   -0.03 |    0.01 |   -0.07 |    0.03
tracking_rewards |  -18.07 |    4.04 |  -31.15 |  -10.57
steps    |     379 |      21 |     332 |     419
***** Episode 60797, Mean R = -14.8  Std R = 5.7  Min R = -27.2
PolicyLoss: -0.0232
Policy_Beta: 0.1
Policy_Entropy: 0.163
Policy_KL: 0.000787
Policy_SD: 0.557
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 2.2e+07
VF_0_ExplainedVarNew: 0.967
VF_0_ExplainedVarOld: 0.96
VF_0_Loss : 0.000109


ADV1:  0.0010022820506060753 0.007057150181240395 0.056616236116549895 -0.07450763348446482
ADV2:  0.009279944111559022 0.8477751591480914 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.9737   1.9256   8.4398  24.0260  15.5251  10.0673
ValFun  Gradients: u

attitude |    0.08    0.04    0.05 |    1.22    0.62    1.95 |   -3.14   -1.56   -3.14 |    3.14    1.57    3.14
w        |    0.00    0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.04    0.08 |    0.63    1.95 |   -1.51   -3.14 |    1.46    3.12
w_f      |    0.00    0.00    0.00 |    0.02    0.01    0.01 |   -0.04   -0.02   -0.02 |    0.04    0.03    0.02
w_rewards |   -0.00 |    0.00 |   -0.02 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.24 |    0.25 |    0.00 |    1.58
seeker_angles |    0.00    0.00 |    0.07    0.08 |   -1.00   -1.00 |    1.00    0.99
cs_angles |  0.0006  0.0016 |  0.0750  0.0820 | -0.9971 -0.9988 |  0.9992  0.9937
optical_flow | -0.0001 -0.0002 |  0.0261  0.0248 | -1.2367 -1.2111 |  1.1197  0.9112
v_err    | -0.0098 |  0.0576 | -0.4523 |  0.1075
landing_rewards |    9.26 |    2.62 |    0.00 |   10.00
landing_margin |   -0

attitude |    0.06   -0.02    0.02 |    1.27    0.63    1.89 |   -3.14   -1.50   -3.14 |    3.14    1.57    3.14
w        |   -0.00    0.00   -0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.03    0.04 |    0.64    1.90 |   -1.50   -3.14 |    1.42    3.14
w_f      |   -0.00    0.00   -0.00 |    0.02    0.01    0.01 |   -0.04   -0.02   -0.02 |    0.04    0.02    0.02
w_rewards |   -0.00 |    0.00 |   -0.01 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.24 |    0.24 |    0.00 |    1.53
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -0.96   -0.99 |    1.00    1.00
cs_angles |  0.0012  0.0003 |  0.0784  0.0778 | -0.9626 -0.9870 |  0.9997  0.9956
optical_flow |  0.0002  0.0000 |  0.0264  0.0262 | -1.0305 -1.2339 |  1.4412  1.2606
v_err    | -0.0098 |  0.0576 | -0.4533 |  0.1013
landing_rewards |    9.65 |    1.85 |    0.00 |   10.00
landing_margin |   -0

attitude |   -0.13   -0.05    0.02 |    1.27    0.68    1.97 |   -3.14   -1.57   -3.14 |    3.14    1.57    3.14
w        |    0.00    0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.05    0.05 |    0.67    1.98 |   -1.54   -3.13 |    1.46    3.13
w_f      |   -0.00    0.00    0.00 |    0.02    0.01    0.01 |   -0.05   -0.02   -0.02 |    0.04    0.02    0.03
w_rewards |   -0.00 |    0.00 |   -0.01 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.24 |    0.25 |    0.00 |    1.50
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -0.97   -0.97 |    0.98    0.99
cs_angles |  0.0026  0.0017 |  0.0796  0.0772 | -0.9749 -0.9661 |  0.9753  0.9885
optical_flow |  0.0001  0.0001 |  0.0265  0.0256 | -1.2109 -1.1437 |  1.0463  1.0238
v_err    | -0.0097 |  0.0579 | -0.4543 |  0.1105
landing_rewards |    9.45 |    2.28 |    0.00 |   10.00
landing_margin |   -0

thrust   |   -0.00    0.00    0.00 |    0.67    0.69    0.68 |   -3.29   -3.46   -3.42 |    3.46    3.42    3.41
norm_thrust |    0.89 |    0.76 |    0.00 |    3.46
fuel     |    1.52 |    0.17 |    1.10 |    2.07
rewards  |  -12.33 |    4.64 |  -27.63 |   -4.32
fuel_rewards |   -4.37 |    0.50 |   -5.93 |   -3.14
glideslope_rewards |    0.00 |    0.00 |    0.00 |    0.00
glideslope_penalty |    0.00 |    0.00 |    0.00 |    0.00
glideslope |    3.01 |   13.04 |    0.01 |  472.62
norm_af  |    1.73 |    0.89 |    0.04 |    3.28
norm_wf  |    0.02 |    0.01 |    0.00 |    0.05
rh_penalty |    0.00 |    0.00 |    0.00 |    0.00
att_rewards |    0.00 |    0.00 |    0.00 |    0.00
att_penalty |    0.00 |    0.00 |    0.00 |    0.00
attitude |   -0.03   -0.02    0.20 |    1.08    0.60    1.84 |   -3.14   -1.57   -3.14 |    3.14    1.45    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.02    0.15 |    0.60

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.9446   1.3317   6.0721  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0031   0.0019   0.0074   5.4889   2.1784   2.1397
Update Cnt = 2010    ET =   1055.6   Stats:  Mean, Std, Min, Max
r_f      |    0.44  -22.32   33.92 |  182.66  177.40  197.23 | -394.05 -389.81 -384.99 |  396.19  368.21  381.10
v_f      |   -0.00    0.01   -0.01 |    0.04    0.04    0.05 |   -0.09   -0.10   -0.10 |    0.10    0.09    0.11
r_i      |   11.76 -100.94  151.80 |  679.02  684.87  731.14 |-1357.64-1273.71-1325.43 | 1328.19 1271.35 1340.74
v_i      |    0.00    0.01   -0.01 |    0.04    0.04    0.05 |   -0.09   -0.09   -0.09 |    0.10    0.09    0.08
norm_rf  |    0.21 |    0.08 |    0.02 |    0.46
norm_vf  |    0.07 |    0.01 |    0.05 |    0.11
gs_f     |    1.18 |    1.91 |    0.01 |   23.38
thrust   |   -0.00   -0.00    0.00 |    0.67    0.68    0.68 |   -3.36   -3.46   -3.45 |    3.46    3.46    3.46
norm_thrust |    

ADV1:  0.0005359694679531429 0.005881021562528303 0.04923404912625462 -0.05006844130544469
ADV2:  -0.00043210331397057126 0.8833939052771457 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.3693   0.4289   2.2094  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0007   0.0004   0.0016   5.4889   2.1784   2.1397
***** Episode 62626, Mean R = -11.6  Std R = 5.4  Min R = -34.5
PolicyLoss: -0.00824
Policy_Beta: 0.1
Policy_Entropy: 0.165
Policy_KL: 0.000955
Policy_SD: 0.519
Policy_lr_mult: 0.198
Steps: 1.19e+04
TotalSteps: 2.26e+07
VF_0_ExplainedVarNew: 0.987
VF_0_ExplainedVarOld: 0.982
VF_0_Loss : 0.000501


ADV1:  0.0005087687962033091 0.007481976869958941 0.04431280621104133 -0.07071150564619859
ADV2:  0.01686351539714125 0.8357564338153327 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   3.5117   2.4458   9.6188  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0007   0.0005   0.0017   5.4889   2.1784   

***** Episode 62874, Mean R = -13.8  Std R = 4.5  Min R = -28.4
PolicyLoss: -0.0245
Policy_Beta: 0.1
Policy_Entropy: 0.164
Policy_KL: 0.000898
Policy_SD: 0.538
Policy_lr_mult: 0.198
Steps: 1.19e+04
TotalSteps: 2.27e+07
VF_0_ExplainedVarNew: 0.977
VF_0_ExplainedVarOld: 0.974
VF_0_Loss : 0.00015


ADV1:  0.0014607135260090564 0.007388014090289669 0.050892377175168535 -0.09132746900921523
ADV2:  0.0012353762926076367 0.8549124490786991 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   3.0931   2.0288  10.0673  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0020   0.0012   0.0042   5.4889   2.1784   2.1397
***** Episode 62905, Mean R = -11.3  Std R = 4.7  Min R = -23.1
PolicyLoss: -0.0217
Policy_Beta: 0.1
Policy_Entropy: 0.165
Policy_KL: 0.000953
Policy_SD: 0.533
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 2.28e+07
VF_0_ExplainedVarNew: 0.976
VF_0_ExplainedVarOld: 0.971
VF_0_Loss : 9.98e-05


ADV1:  -0.002198473183512077 0.006961659688806255 

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.7130   1.0222   4.4589  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0010   0.0006   0.0021   5.4889   2.1784   2.1397
***** Episode 63153, Mean R = -11.7  Std R = 4.1  Min R = -21.9
PolicyLoss: -0.0308
Policy_Beta: 0.1
Policy_Entropy: 0.165
Policy_KL: 0.000745
Policy_SD: 0.536
Policy_lr_mult: 0.198
Steps: 1.15e+04
TotalSteps: 2.28e+07
VF_0_ExplainedVarNew: 0.966
VF_0_ExplainedVarOld: 0.962
VF_0_Loss : 0.000854


ADV1:  -0.00016995433376491885 0.007469500620297383 0.037190998586646096 -0.08100019383947066
ADV2:  0.030133730854040395 0.8150681359434749 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.6081   1.8277   9.1381  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0007   0.0004   0.0015   5.4889   2.1784   2.1397
***** Episode 63184, Mean R = -13.9  Std R = 6.4  Min R = -33.0
PolicyLoss: -0.0335
Policy_Beta: 0.1
Policy_Entropy: 0.165
Policy_KL: 0.0008

ADV1:  -0.000970818161184674 0.00961592080355124 0.05032997360674418 -0.05669817607037639
ADV2:  0.0225562380371038 0.8976193055739198 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.3561   1.4049   5.9029  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0017   0.0009   0.0030   5.4889   2.1784   2.1397
***** Episode 63432, Mean R = -13.6  Std R = 5.0  Min R = -30.7
PolicyLoss: -0.0204
Policy_Beta: 0.1
Policy_Entropy: 0.167
Policy_KL: 0.00104
Policy_SD: 0.529
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 2.29e+07
VF_0_ExplainedVarNew: 0.964
VF_0_ExplainedVarOld: 0.958
VF_0_Loss : 0.000251


ADV1:  0.001864643162829119 0.007545375663028884 0.06319265576463035 -0.11154836597099393
ADV2:  0.004188177691321827 0.8163395371337078 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.2213   1.0624   5.4615  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0020   0.0012   0.0048   5.4889   2.1784   2.1397
*

ADV1:  -0.0016524261552564284 0.005969344267591643 0.0633907032078751 -0.06479622553525138
ADV2:  0.027118254636038057 0.8757050781890476 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.9210   1.2093   6.0238  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0022   0.0012   0.0044   5.4889   2.1784   2.1397
***** Episode 63711, Mean R = -13.0  Std R = 3.8  Min R = -25.2
PolicyLoss: -0.0106
Policy_Beta: 0.1
Policy_Entropy: 0.165
Policy_KL: 0.000941
Policy_SD: 0.534
Policy_lr_mult: 0.198
Steps: 1.19e+04
TotalSteps: 2.31e+07
VF_0_ExplainedVarNew: 0.987
VF_0_ExplainedVarOld: 0.983
VF_0_Loss : 6.01e-05


ADV1:  -0.0003978664347738143 0.007184826580291469 0.048405198148704254 -0.06879727804912439
ADV2:  0.024025434889306665 0.8103467976857975 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.3016   0.4025   2.2618  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0006   0.0003   0.0012   5.4889   2.1784   2

ADV1:  0.0006169629203978132 0.0059303974224568946 0.04716978119355575 -0.06158537280870485
ADV2:  -0.001103029207030664 0.8871525552306081 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.0178   1.2077   4.8347  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0006   0.0004   0.0017   5.4889   2.1784   2.1397
***** Episode 63990, Mean R = -12.3  Std R = 3.5  Min R = -22.2
PolicyLoss: -0.0102
Policy_Beta: 0.1
Policy_Entropy: 0.165
Policy_KL: 0.00117
Policy_SD: 0.539
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 2.32e+07
VF_0_ExplainedVarNew: 0.987
VF_0_ExplainedVarOld: 0.983
VF_0_Loss : 0.000342


ADV1:  -0.0010574026802976668 0.007185376728355806 0.03635867848110613 -0.08461626545125672
ADV2:  0.03477043764398706 0.8463377015342136 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.1208   1.1463   5.5494  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0013   0.0008   0.0028   5.4889   2.1784   2.

ADV1:  0.003502107099931967 0.009429197026452188 0.05006604098964823 -0.07044854345418838
ADV2:  -0.004896796518509025 0.8725902510106032 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.4125   1.0004   5.3940  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0039   0.0025   0.0091   5.4889   2.1784   2.1397
***** Episode 64269, Mean R = -12.1  Std R = 5.7  Min R = -28.4
PolicyLoss: -0.0255
Policy_Beta: 0.1
Policy_Entropy: 0.163
Policy_KL: 0.000907
Policy_SD: 0.535
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 2.33e+07
VF_0_ExplainedVarNew: 0.96
VF_0_ExplainedVarOld: 0.955
VF_0_Loss : 8.67e-05


ADV1:  -0.0015125747999504874 0.00650329665694524 0.03328250790007923 -0.11973350126805676
ADV2:  0.03659634021516667 0.7965163866107128 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.6585   0.2700   1.4139  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0017   0.0011   0.0038   5.4889   2.1784   2.139

ADV1:  0.002190463632735642 0.007963264236410392 0.07643577042903987 -0.07235385748375056
ADV2:  -0.01601432998935349 0.7995385152057727 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.3375   0.7737   4.1488  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0034   0.0019   0.0065   5.4889   2.1784   2.1397
***** Episode 64548, Mean R = -13.2  Std R = 5.4  Min R = -28.6
PolicyLoss: -0.00696
Policy_Beta: 0.1
Policy_Entropy: 0.164
Policy_KL: 0.000866
Policy_SD: 0.54
Policy_lr_mult: 0.198
Steps: 1.2e+04
TotalSteps: 2.34e+07
VF_0_ExplainedVarNew: 0.983
VF_0_ExplainedVarOld: 0.974
VF_0_Loss : 0.00122


ADV1:  -0.0015945159373396418 0.007135144762740113 0.08721920521584564 -0.061954718777754936
ADV2:  0.03362477056361225 0.8361569808103 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.7976   0.9766   4.9729  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0026   0.0015   0.0053   5.4889   2.1784   2.1397
*

seeker_angles |    0.00    0.00 |    0.08    0.08 |   -0.96   -0.96 |    1.00    1.00
cs_angles |  0.0021  0.0000 |  0.0767  0.0827 | -0.9614 -0.9588 |  0.9951  0.9961
optical_flow | -0.0000  0.0002 |  0.0258  0.0238 | -1.1351 -1.2121 |  1.2039  1.0590
v_err    | -0.0097 |  0.0580 | -0.4527 |  0.1058
landing_rewards |    9.61 |    1.93 |    0.00 |   10.00
landing_margin |   -0.03 |    0.01 |   -0.06 |    0.02
tracking_rewards |  -17.77 |    4.39 |  -33.79 |  -10.89
steps    |     378 |      19 |     335 |     420
***** Episode 64827, Mean R = -10.9  Std R = 4.3  Min R = -23.6
PolicyLoss: -0.0201
Policy_Beta: 0.1
Policy_Entropy: 0.162
Policy_KL: 0.00114
Policy_SD: 0.527
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 2.35e+07
VF_0_ExplainedVarNew: 0.983
VF_0_ExplainedVarOld: 0.975
VF_0_Loss : 3.25e-05


ADV1:  -0.0018314055544847382 0.008212353268882231 0.03443905177498946 -0.08360422231593506
ADV2:  0.05026804924604923 0.8017294981115504 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max

attitude |   -0.03   -0.01    0.02 |    1.17    0.67    1.75 |   -3.14   -1.52   -3.14 |    3.14    1.56    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.01    0.05 |    0.67    1.75 |   -1.52   -3.13 |    1.43    3.14
w_f      |   -0.00    0.00    0.00 |    0.02    0.01    0.01 |   -0.04   -0.02   -0.02 |    0.04    0.02    0.03
w_rewards |   -0.00 |    0.00 |   -0.03 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.24 |    0.26 |    0.00 |    1.55
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -0.99   -0.96 |    0.99    0.97
cs_angles |  0.0024  0.0026 |  0.0754  0.0830 | -0.9861 -0.9638 |  0.9911  0.9702
optical_flow |  0.0000 -0.0000 |  0.0250  0.0222 | -1.0398 -1.1705 |  1.2914  1.1405
v_err    | -0.0101 |  0.0579 | -0.4522 |  0.1104
landing_rewards |    9.48 |    2.21 |    0.00 |   10.00
landing_margin |   -0

attitude |    0.10   -0.02   -0.10 |    1.25    0.68    1.95 |   -3.14   -1.56   -3.14 |    3.14    1.56    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.02   -0.10 |    0.68    1.97 |   -1.43   -3.14 |    1.52    3.14
w_f      |   -0.00    0.00   -0.00 |    0.02    0.01    0.01 |   -0.05   -0.02   -0.02 |    0.04    0.02    0.02
w_rewards |   -0.00 |    0.00 |   -0.03 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.24 |    0.25 |    0.00 |    1.49
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -0.99   -0.99 |    1.00    0.98
cs_angles |  0.0000  0.0024 |  0.0762  0.0779 | -0.9930 -0.9921 |  0.9982  0.9844
optical_flow |  0.0001 -0.0001 |  0.0244  0.0227 | -1.0352 -1.2856 |  1.2176  1.3001
v_err    | -0.0099 |  0.0575 | -0.4514 |  0.1072
landing_rewards |    9.65 |    1.85 |    0.00 |   10.00
landing_margin |   -0

attitude |    0.01    0.02   -0.13 |    1.27    0.66    1.91 |   -3.14   -1.51   -3.14 |    3.14    1.54    3.14
w        |   -0.00    0.00   -0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.02   -0.21 |    0.67    1.91 |   -1.42   -3.14 |    1.51    3.11
w_f      |   -0.00    0.00    0.00 |    0.02    0.01    0.01 |   -0.04   -0.02   -0.04 |    0.04    0.02    0.02
w_rewards |    0.00 |    0.00 |    0.00 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.24 |    0.26 |    0.00 |    1.62
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -1.00   -0.98 |    0.98    1.00
cs_angles |  0.0036  0.0014 |  0.0776  0.0805 | -0.9989 -0.9776 |  0.9807  0.9959
optical_flow |  0.0001  0.0001 |  0.0255  0.0247 | -1.0858 -1.0607 |  1.2186  1.1075
v_err    | -0.0100 |  0.0576 | -0.4530 |  0.1047
landing_rewards |    9.58 |    2.00 |    0.00 |   10.00
landing_margin |   -0

rewards  |  -12.03 |    5.53 |  -53.38 |   -4.11
fuel_rewards |   -4.39 |    0.57 |   -6.30 |   -2.99
glideslope_rewards |    0.00 |    0.00 |    0.00 |    0.00
glideslope_penalty |    0.00 |    0.00 |    0.00 |    0.00
glideslope |    3.03 |   12.83 |    0.01 |  998.12
norm_af  |    1.74 |    0.95 |    0.03 |    3.32
norm_wf  |    0.02 |    0.01 |    0.00 |    0.05
rh_penalty |    0.00 |    0.00 |    0.00 |    0.00
att_rewards |    0.00 |    0.00 |    0.00 |    0.00
att_penalty |    0.00 |    0.00 |    0.00 |    0.00
attitude |   -0.05    0.00    0.20 |    1.20    0.61    1.87 |   -3.14   -1.51   -3.14 |    3.14    1.56    3.14
w        |   -0.00    0.00   -0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.02    0.16 |    0.62    1.87 |   -1.28   -3.14 |    1.46    3.14
w_f      |   -0.00    0.00    0.00 |    0.02    0.01    0.01 |   -0.04   -0.02   -0.02 |    0.04    0.02    0.02
w_rewards |   -0.00 |    0.00 |   -0.03 |    0.00
w_pena

Update Cnt = 2140    ET =   1085.1   Stats:  Mean, Std, Min, Max
r_f      |    0.31    3.08   -7.81 |  190.60  181.41  192.84 | -379.62 -383.90 -369.60 |  387.67  368.48  379.78
v_f      |   -0.00    0.00   -0.00 |    0.04    0.04    0.04 |   -0.09   -0.08   -0.09 |    0.12    0.08    0.10
r_i      |   -4.39   18.16   -7.40 |  701.80  682.91  731.40 |-1307.41-1353.67-1311.06 | 1355.18 1252.20 1214.09
v_i      |    0.00   -0.00    0.00 |    0.04    0.04    0.05 |   -0.09   -0.09   -0.08 |    0.09    0.09    0.10
norm_rf  |    0.21 |    0.09 |    0.03 |    0.56
norm_vf  |    0.07 |    0.01 |    0.05 |    0.12
gs_f     |    1.16 |    1.68 |    0.01 |   14.95
thrust   |    0.00    0.00   -0.00 |    0.68    0.68    0.67 |   -3.45   -3.46   -3.38 |    3.39    3.35    3.46
norm_thrust |    0.89 |    0.76 |    0.00 |    3.46
fuel     |    1.54 |    0.18 |    1.01 |    2.06
rewards  |  -12.27 |    4.69 |  -28.00 |   -3.29
fuel_rewards |   -4.42 |    0.53 |   -5.90 |   -2.90
glideslope_rewards |

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.6981   1.8466   7.2447  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0004   0.0002   0.0008   5.4889   2.1784   2.1397
***** Episode 66656, Mean R = -12.7  Std R = 4.5  Min R = -24.4
PolicyLoss: -0.0259
Policy_Beta: 0.1
Policy_Entropy: 0.166
Policy_KL: 0.000746
Policy_SD: 0.54
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 2.42e+07
VF_0_ExplainedVarNew: 0.984
VF_0_ExplainedVarOld: 0.982
VF_0_Loss : 4.27e-05


ADV1:  0.0012165660178306058 0.007292130108696572 0.05759514747771771 -0.07091248322453256
ADV2:  0.014178482902141269 0.792511731091374 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.6869   0.8983   5.0708  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0014   0.0008   0.0031   5.4889   2.1784   2.1397
Update Cnt = 2150    ET =   1104.2   Stats:  Mean, Std, Min, Max
r_f      |    8.23   -2.84    3.50 |  176.87  169.74  203.98 | -364.61 -351.70 -

ADV1:  0.0014873594832730981 0.0054891348572469285 0.043116637797085244 -0.03462530604735614
ADV2:  -0.018499422394288364 0.928186640039164 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.7140   1.7576   8.2414  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0020   0.0012   0.0043   5.4889   2.1784   2.1397
***** Episode 66935, Mean R = -12.8  Std R = 4.8  Min R = -25.3
PolicyLoss: -0.00202
Policy_Beta: 0.1
Policy_Entropy: 0.166
Policy_KL: 0.000979
Policy_SD: 0.54
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 2.43e+07
VF_0_ExplainedVarNew: 0.989
VF_0_ExplainedVarOld: 0.987
VF_0_Loss : 6.55e-05


ADV1:  -0.002843014921088994 0.010215635298832735 0.030567354711018346 -0.07445864304922853
ADV2:  0.04210901519366464 0.8744964693095225 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.7916   1.0639   5.6198  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0030   0.0019   0.0074   5.4889   2.1784   2

***** Episode 67183, Mean R = -10.9  Std R = 4.3  Min R = -22.4
PolicyLoss: 0.00533
Policy_Beta: 0.1
Policy_Entropy: 0.166
Policy_KL: 0.000901
Policy_SD: 0.539
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 2.44e+07
VF_0_ExplainedVarNew: 0.987
VF_0_ExplainedVarOld: 0.983
VF_0_Loss : 3.22e-05


ADV1:  -0.000496524413178047 0.005434197063494022 0.03551446141688386 -0.08640946337510325
ADV2:  0.013992813587599908 0.8700601556545888 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.5792   0.8491   3.9388  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0006   0.0003   0.0013   5.4889   2.1784   2.1397
***** Episode 67214, Mean R = -11.6  Std R = 4.4  Min R = -27.0
PolicyLoss: -0.0113
Policy_Beta: 0.1
Policy_Entropy: 0.169
Policy_KL: 0.000895
Policy_SD: 0.529
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 2.44e+07
VF_0_ExplainedVarNew: 0.987
VF_0_ExplainedVarOld: 0.985
VF_0_Loss : 0.000112


ADV1:  -0.0009704398461724688 0.008619069323921131 

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.2033   1.3160   4.6750  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0012   0.0008   0.0030   5.4889   2.1784   2.1397
***** Episode 67462, Mean R = -12.8  Std R = 5.2  Min R = -28.3
PolicyLoss: -0.0303
Policy_Beta: 0.1
Policy_Entropy: 0.167
Policy_KL: 0.000889
Policy_SD: 0.542
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 2.45e+07
VF_0_ExplainedVarNew: 0.962
VF_0_ExplainedVarOld: 0.956
VF_0_Loss : 9.87e-05


ADV1:  0.0005976000751331149 0.006467556492084798 0.04112085880819272 -0.057821604621258404
ADV2:  0.01234617928348401 0.8477176484550362 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   5.6451   3.1285  12.7479  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0009   0.0005   0.0018   5.4889   2.1784   2.1397
***** Episode 67493, Mean R = -12.1  Std R = 3.2  Min R = -18.9
PolicyLoss: -0.0245
Policy_Beta: 0.1
Policy_Entropy: 0.165
Policy_KL: 0.000975


ADV1:  -0.0023340458267666763 0.007454874984232071 0.047565800843370476 -0.06150323773728374
ADV2:  0.042067683700630534 0.8432634342615328 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.1739   0.4352   2.1430  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0025   0.0015   0.0061   5.4889   2.1784   2.1397
***** Episode 67741, Mean R = -12.6  Std R = 4.8  Min R = -28.0
PolicyLoss: -0.0245
Policy_Beta: 0.1
Policy_Entropy: 0.167
Policy_KL: 0.000832
Policy_SD: 0.542
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 2.46e+07
VF_0_ExplainedVarNew: 0.979
VF_0_ExplainedVarOld: 0.976
VF_0_Loss : 0.000215


ADV1:  -0.0011193522503104437 0.005615606795125381 0.0591654579715567 -0.08572766978417029
ADV2:  0.017653074423683208 0.8437394229205546 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.4293   0.7473   3.7923  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0017   0.0009   0.0036   5.4889   2.1784   2

***** Episode 67989, Mean R = -12.6  Std R = 4.9  Min R = -24.0
PolicyLoss: -0.0303
Policy_Beta: 0.1
Policy_Entropy: 0.165
Policy_KL: 0.000872
Policy_SD: 0.535
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 2.47e+07
VF_0_ExplainedVarNew: 0.969
VF_0_ExplainedVarOld: 0.967
VF_0_Loss : 0.000912


ADV1:  -0.00038841477888382095 0.00685384528103872 0.15149692801032505 -0.08979470925751848
ADV2:  0.0032389553159846707 0.8074656143270411 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.3431   0.9205   4.4774  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0005   0.0003   0.0011   5.4889   2.1784   2.1397
***** Episode 68020, Mean R = -12.7  Std R = 4.4  Min R = -22.7
PolicyLoss: -0.0015
Policy_Beta: 0.1
Policy_Entropy: 0.167
Policy_KL: 0.000708
Policy_SD: 0.548
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 2.47e+07
VF_0_ExplainedVarNew: 0.987
VF_0_ExplainedVarOld: 0.98
VF_0_Loss : 0.00063


ADV1:  0.0018367150977008824 0.005695392397493282 0

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.3241   1.0620   5.1731  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0019   0.0012   0.0045   5.4889   2.1784   2.1397
***** Episode 68268, Mean R = -12.6  Std R = 4.4  Min R = -27.7
PolicyLoss: -0.0133
Policy_Beta: 0.1
Policy_Entropy: 0.167
Policy_KL: 0.0011
Policy_SD: 0.542
Policy_lr_mult: 0.198
Steps: 1.18e+04
TotalSteps: 2.48e+07
VF_0_ExplainedVarNew: 0.987
VF_0_ExplainedVarOld: 0.984
VF_0_Loss : 0.00045


ADV1:  -0.0010790366298258293 0.008709422058743603 0.055236364705059104 -0.061354410082361754
ADV2:  0.025349331672848936 0.8750065436166645 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   4.1083   2.9388  11.5136  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0011   0.0006   0.0028   5.4889   2.1784   2.1397
***** Episode 68299, Mean R = -12.8  Std R = 4.7  Min R = -24.0
PolicyLoss: -0.0222
Policy_Beta: 0.1
Policy_Entropy: 0.166
Policy_KL: 0.00118
P

optical_flow |  0.0002  0.0001 |  0.0253  0.0236 | -1.0593 -1.2440 |  1.1814  1.0810
v_err    | -0.0096 |  0.0582 | -0.4541 |  0.1078
landing_rewards |    9.58 |    2.00 |    0.00 |   10.00
landing_margin |   -0.03 |    0.01 |   -0.06 |    0.03
tracking_rewards |  -17.89 |    4.54 |  -43.38 |  -10.47
steps    |     377 |      20 |     328 |     417
***** Episode 68547, Mean R = -12.4  Std R = 5.1  Min R = -23.7
PolicyLoss: -0.00806
Policy_Beta: 0.1
Policy_Entropy: 0.166
Policy_KL: 0.001
Policy_SD: 0.539
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 2.49e+07
VF_0_ExplainedVarNew: 0.991
VF_0_ExplainedVarOld: 0.987
VF_0_Loss : 0.00115


ADV1:  0.00016132208899443 0.005336054423613222 0.04546564550049065 -0.032994869692049504
ADV2:  -0.010003879182760004 0.8867593558616171 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   7.0482   4.6515  16.1081  24.0260  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0004   0.0002   0.0009   5.4889   2.1784   2.1397
*

attitude |    0.14   -0.06    0.03 |    1.13    0.64    1.81 |   -3.14   -1.48   -3.14 |    3.14    1.54    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.05    0.07 |    0.64    1.81 |   -1.41   -3.13 |    1.33    3.14
w_f      |   -0.00    0.00    0.00 |    0.02    0.01    0.01 |   -0.04   -0.02   -0.02 |    0.04    0.04    0.03
w_rewards |   -0.00 |    0.00 |   -0.01 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.25 |    0.25 |    0.00 |    1.44
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -1.00   -0.96 |    1.00    0.97
cs_angles |  0.0018  0.0042 |  0.0771  0.0842 | -0.9983 -0.9558 |  0.9954  0.9694
optical_flow |  0.0001  0.0002 |  0.0261  0.0251 | -1.1236 -1.2075 |  1.2268  1.2908
v_err    | -0.0099 |  0.0581 | -0.4528 |  0.1036
landing_rewards |    9.65 |    1.85 |    0.00 |   10.00
landing_margin |   -0

w        |    0.00    0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.06   -0.04 |    0.63    1.91 |   -1.45   -3.13 |    1.49    3.14
w_f      |   -0.00    0.00    0.00 |    0.02    0.01    0.01 |   -0.04   -0.02   -0.02 |    0.04    0.02    0.02
w_rewards |   -0.00 |    0.00 |   -0.04 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.25 |    0.26 |    0.00 |    1.63
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -0.99   -1.00 |    1.00    0.99
cs_angles |  0.0026  0.0041 |  0.0817  0.0798 | -0.9928 -0.9954 |  0.9995  0.9903
optical_flow |  0.0001 -0.0000 |  0.0256  0.0248 | -1.1296 -1.2103 |  1.0219  1.1254
v_err    | -0.0099 |  0.0584 | -0.4530 |  0.1042
landing_rewards |    9.58 |    2.00 |    0.00 |   10.00
landing_margin |   -0.02 |    0.01 |   -0.06 |    0.06
tracking_rewards |  -18.26 |    4.81 |  -42.92 |  -10.07
steps    |     378 |  

attitude |    0.01   -0.05    0.00 |    1.13    0.65    1.84 |   -3.14   -1.57   -3.14 |    3.14    1.57    3.14
w        |   -0.00    0.00   -0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.05    0.06 |    0.66    1.81 |   -1.51   -3.13 |    1.48    3.14
w_f      |   -0.00    0.00   -0.00 |    0.02    0.01    0.01 |   -0.04   -0.02   -0.02 |    0.04    0.02    0.02
w_rewards |   -0.00 |    0.00 |   -0.01 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.24 |    0.25 |    0.00 |    1.45
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -1.00   -0.96 |    1.00    0.99
cs_angles |  0.0014  0.0029 |  0.0757  0.0797 | -0.9998 -0.9558 |  0.9981  0.9933
optical_flow |  0.0002 -0.0000 |  0.0253  0.0245 | -0.9518 -1.2907 |  1.2197  1.1519
v_err    | -0.0100 |  0.0585 | -0.4625 |  0.1065
landing_rewards |    9.77 |    1.49 |    0.00 |   10.00
landing_margin |   -0

attitude |   -0.08   -0.02    0.09 |    1.19    0.63    1.89 |   -3.14   -1.56   -3.14 |    3.14    1.56    3.14
w        |    0.00    0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.02    0.10 |    0.63    1.90 |   -1.45   -3.14 |    1.56    3.12
w_f      |   -0.00    0.00    0.00 |    0.02    0.01    0.01 |   -0.04   -0.03   -0.02 |    0.04    0.03    0.03
w_rewards |   -0.00 |    0.00 |   -0.02 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.24 |    0.25 |    0.00 |    1.54
seeker_angles |    0.00    0.00 |    0.07    0.08 |   -1.00   -0.99 |    0.99    0.98
cs_angles |  0.0029  0.0016 |  0.0734  0.0813 | -0.9967 -0.9883 |  0.9855  0.9845
optical_flow | -0.0000  0.0001 |  0.0249  0.0246 | -1.1374 -1.0043 |  1.3303  1.2749
v_err    | -0.0104 |  0.0586 | -0.4522 |  0.1139
landing_rewards |    9.23 |    2.67 |    0.00 |   10.00
landing_margin |   -0

attitude |    0.01    0.04   -0.05 |    1.27    0.66    1.92 |   -3.14   -1.51   -3.14 |    3.14    1.55    3.14
w        |    0.00    0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.05   -0.09 |    0.66    1.91 |   -1.42   -3.13 |    1.49    3.13
w_f      |   -0.00    0.00   -0.00 |    0.02    0.01    0.01 |   -0.04   -0.03   -0.02 |    0.04    0.03    0.02
w_rewards |   -0.00 |    0.00 |   -0.01 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.24 |    0.25 |    0.00 |    1.41
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -0.99   -1.00 |    0.99    0.97
cs_angles |  0.0027  0.0022 |  0.0772  0.0784 | -0.9878 -0.9965 |  0.9927  0.9665
optical_flow |  0.0000 -0.0000 |  0.0267  0.0231 | -1.0675 -0.9794 |  1.1488  0.8704
v_err    | -0.0103 |  0.0584 | -0.4539 |  0.1001
landing_rewards |    9.77 |    1.49 |    0.00 |   10.00
landing_margin |   -0

attitude |    0.01   -0.00   -0.01 |    1.19    0.70    1.83 |   -3.14   -1.57   -3.14 |    3.14    1.57    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.00    0.07 |    0.70    1.82 |   -1.46   -3.13 |    1.53    3.14
w_f      |   -0.00    0.00    0.00 |    0.02    0.01    0.01 |   -0.04   -0.02   -0.02 |    0.04    0.03    0.02
w_rewards |    0.00 |    0.00 |    0.00 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.24 |    0.25 |    0.00 |    1.43
seeker_angles |    0.00    0.01 |    0.08    0.08 |   -0.99   -1.00 |    1.00    0.99
cs_angles |  0.0020  0.0056 |  0.0782  0.0805 | -0.9936 -0.9965 |  0.9993  0.9859
optical_flow | -0.0000  0.0000 |  0.0257  0.0232 | -1.3521 -1.0146 |  1.1808  1.1251
v_err    | -0.0104 |  0.0580 | -0.4527 |  0.1024
landing_rewards |    9.42 |    2.34 |    0.00 |   10.00
landing_margin |   -0

w        |    0.00    0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.04    0.00 |    0.65    1.88 |   -1.39   -3.12 |    1.54    3.11
w_f      |    0.00    0.00    0.00 |    0.02    0.01    0.01 |   -0.04   -0.02   -0.02 |    0.04    0.03    0.02
w_rewards |   -0.00 |    0.00 |   -0.02 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.23 |    0.24 |    0.00 |    1.64
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -1.00   -1.00 |    0.96    0.99
cs_angles |  0.0024  0.0026 |  0.0758  0.0768 | -0.9977 -0.9995 |  0.9569  0.9935
optical_flow | -0.0000  0.0000 |  0.0258  0.0237 | -1.2990 -1.0969 |  1.2090  1.3673
v_err    | -0.0104 |  0.0579 | -0.4531 |  0.1162
landing_rewards |    9.61 |    1.93 |    0.00 |   10.00
landing_margin |   -0.03 |    0.01 |   -0.06 |    0.02
tracking_rewards |  -17.06 |    4.14 |  -32.91 |  -10.48
steps    |     379 |  

attitude |   -0.01    0.02   -0.00 |    1.24    0.67    1.88 |   -3.14   -1.56   -3.14 |    3.14    1.53    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.02   -0.03 |    0.67    1.89 |   -1.40   -3.13 |    1.45    3.14
w_f      |    0.00    0.00   -0.00 |    0.02    0.01    0.01 |   -0.04   -0.02   -0.02 |    0.04    0.02    0.02
w_rewards |   -0.00 |    0.00 |   -0.01 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.24 |    0.25 |    0.00 |    1.66
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -0.97   -0.99 |    1.00    1.00
cs_angles |  0.0007  0.0018 |  0.0755  0.0791 | -0.9729 -0.9891 |  0.9994  0.9974
optical_flow |  0.0001 -0.0001 |  0.0248  0.0222 | -1.0529 -1.2307 |  1.1515  0.8559
v_err    | -0.0104 |  0.0582 | -0.4520 |  0.1056
landing_rewards |    9.48 |    2.21 |    0.00 |   10.00
landing_margin |   -0

attitude |   -0.01   -0.00   -0.06 |    1.18    0.65    1.86 |   -3.14   -1.57   -3.14 |    3.14    1.56    3.14
w        |   -0.00    0.00   -0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.00   -0.10 |    0.64    1.86 |   -1.57   -3.14 |    1.55    3.14
w_f      |   -0.00    0.00    0.00 |    0.02    0.01    0.01 |   -0.04   -0.02   -0.02 |    0.04    0.02    0.03
w_rewards |   -0.00 |    0.00 |   -0.03 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.24 |    0.25 |    0.00 |    1.65
seeker_angles |    0.00    0.00 |    0.07    0.08 |   -1.00   -1.00 |    0.99    0.99
cs_angles |  0.0034  0.0028 |  0.0749  0.0803 | -0.9954 -0.9964 |  0.9900  0.9936
optical_flow | -0.0000  0.0002 |  0.0245  0.0237 | -1.2773 -1.0400 |  1.4707  1.2125
v_err    | -0.0100 |  0.0576 | -0.4519 |  0.1027
landing_rewards |    9.65 |    1.85 |    0.00 |   10.00
landing_margin |   -0

attitude |    0.00   -0.02   -0.16 |    1.18    0.65    1.87 |   -3.14   -1.56   -3.14 |    3.14    1.57    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.01   -0.13 |    0.65    1.88 |   -1.47   -3.12 |    1.40    3.13
w_f      |    0.00    0.00   -0.00 |    0.02    0.01    0.01 |   -0.04   -0.02   -0.02 |    0.04    0.02    0.02
w_rewards |    0.00 |    0.00 |    0.00 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.23 |    0.25 |    0.00 |    1.43
seeker_angles |    0.00    0.00 |    0.07    0.08 |   -0.99   -0.99 |    1.00    0.99
cs_angles |  0.0011  0.0045 |  0.0732  0.0795 | -0.9897 -0.9870 |  0.9995  0.9891
optical_flow |  0.0000 -0.0000 |  0.0253  0.0227 | -1.1666 -1.0404 |  1.1252  1.0553
v_err    | -0.0102 |  0.0583 | -0.4530 |  0.1022
landing_rewards |    9.58 |    2.00 |    0.00 |   10.00
landing_margin |   -0

w        |   -0.00    0.00   -0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.03    0.01 |    0.63    1.87 |   -1.35   -3.13 |    1.33    3.14
w_f      |   -0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.04   -0.02   -0.02 |    0.03    0.02    0.02
w_rewards |    0.00 |    0.00 |    0.00 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.24 |    0.25 |    0.00 |    1.41
seeker_angles |   -0.00    0.00 |    0.08    0.08 |   -1.00   -1.00 |    0.98    0.97
cs_angles | -0.0005  0.0036 |  0.0755  0.0804 | -0.9997 -0.9964 |  0.9751  0.9705
optical_flow |  0.0001  0.0001 |  0.0246  0.0243 | -1.2694 -1.2741 |  1.0327  1.1571
v_err    | -0.0098 |  0.0579 | -0.4517 |  0.1059
landing_rewards |    9.77 |    1.49 |    0.00 |   10.00
landing_margin |   -0.03 |    0.01 |   -0.06 |    0.04
tracking_rewards |  -17.32 |    3.97 |  -33.05 |   -8.86
steps    |     378 |  

attitude |    0.14   -0.00    0.10 |    1.20    0.67    1.86 |   -3.14   -1.57   -3.14 |    3.14    1.56    3.14
w        |    0.00    0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.00    0.12 |    0.67    1.84 |   -1.47   -3.11 |    1.47    3.14
w_f      |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.02 |    0.03    0.02    0.02
w_rewards |   -0.00 |    0.00 |   -0.03 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.24 |    0.25 |    0.00 |    1.45
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -0.98   -1.00 |    1.00    1.00
cs_angles |  0.0029  0.0038 |  0.0756  0.0816 | -0.9835 -0.9967 |  0.9976  0.9957
optical_flow | -0.0001  0.0001 |  0.0248  0.0238 | -0.9556 -1.1579 |  1.0272  1.1051
v_err    | -0.0099 |  0.0586 | -0.4512 |  0.1044
landing_rewards |    9.68 |    1.77 |    0.00 |   10.00
landing_margin |   -0

attitude |    0.05   -0.04   -0.04 |    1.17    0.68    1.85 |   -3.14   -1.57   -3.14 |    3.14    1.56    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.04   -0.05 |    0.68    1.85 |   -1.56   -3.14 |    1.48    3.14
w_f      |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.02 |    0.03    0.02    0.02
w_rewards |   -0.00 |    0.00 |   -0.00 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.23 |    0.24 |    0.00 |    1.42
seeker_angles |    0.00    0.00 |    0.08    0.07 |   -1.00   -0.99 |    0.96    0.99
cs_angles |  0.0045  0.0029 |  0.0752  0.0744 | -0.9950 -0.9903 |  0.9623  0.9872
optical_flow | -0.0000 -0.0000 |  0.0246  0.0238 | -1.1411 -1.0974 |  1.0076  1.0932
v_err    | -0.0100 |  0.0580 | -0.4514 |  0.0993
landing_rewards |    9.39 |    2.40 |    0.00 |   10.00
landing_margin |   -0

w        |    0.00    0.00   -0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.05    0.07 |    0.69    1.90 |   -1.44   -3.14 |    1.50    3.12
w_f      |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.04   -0.02   -0.02 |    0.03    0.02    0.03
w_rewards |   -0.00 |    0.00 |   -0.01 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.24 |    0.25 |    0.00 |    1.58
seeker_angles |   -0.00    0.00 |    0.08    0.08 |   -0.98   -1.00 |    0.97    1.00
cs_angles | -0.0001  0.0026 |  0.0770  0.0808 | -0.9835 -0.9992 |  0.9676  0.9992
optical_flow |  0.0001 -0.0001 |  0.0255  0.0245 | -1.2417 -1.1533 |  1.0857  1.1860
v_err    | -0.0101 |  0.0580 | -0.4524 |  0.1089
landing_rewards |    9.58 |    2.00 |    0.00 |   10.00
landing_margin |   -0.02 |    0.01 |   -0.06 |    0.02
tracking_rewards |  -17.48 |    4.12 |  -34.18 |  -10.09
steps    |     377 |  

attitude |    0.09   -0.02    0.10 |    1.17    0.61    1.88 |   -3.14   -1.54   -3.14 |    3.14    1.53    3.14
w        |    0.00    0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.03    0.11 |    0.62    1.88 |   -1.48   -3.12 |    1.42    3.14
w_f      |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.04   -0.02   -0.02 |    0.04    0.02    0.02
w_rewards |   -0.00 |    0.00 |   -0.01 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.23 |    0.25 |    0.00 |    1.47
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -0.96   -0.98 |    0.99    0.99
cs_angles |  0.0034  0.0008 |  0.0752  0.0789 | -0.9629 -0.9836 |  0.9930  0.9887
optical_flow |  0.0002  0.0001 |  0.0240  0.0235 | -1.0555 -0.9549 |  1.3576  1.0458
v_err    | -0.0100 |  0.0583 | -0.4506 |  0.1040
landing_rewards |    9.42 |    2.34 |    0.00 |   10.00
landing_margin |   -0

w        |   -0.00    0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.06    0.05    0.05
a_f      |   -0.00    0.01 |    0.67    1.81 |   -1.48   -3.12 |    1.53    3.11
w_f      |   -0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.02 |    0.03    0.02    0.02
w_rewards |   -0.00 |    0.00 |   -0.06 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.23 |    0.25 |    0.00 |    1.63
seeker_angles |    0.00    0.00 |    0.07    0.08 |   -1.00   -0.91 |    0.98    0.97
cs_angles |  0.0033  0.0038 |  0.0727  0.0806 | -0.9963 -0.9095 |  0.9783  0.9721
optical_flow |  0.0001  0.0000 |  0.0256  0.0232 | -1.0848 -1.0561 |  1.0754  1.1288
v_err    | -0.0102 |  0.0579 | -0.4523 |  0.1264
landing_rewards |    9.58 |    2.00 |    0.00 |   10.00
landing_margin |   -0.03 |    0.01 |   -0.06 |    0.03
tracking_rewards |  -17.11 |    4.08 |  -38.45 |  -10.29
steps    |     379 |  

attitude |    0.04    0.01   -0.07 |    1.15    0.65    1.89 |   -3.14   -1.57   -3.14 |    3.14    1.49    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.01   -0.17 |    0.66    1.89 |   -1.44   -3.14 |    1.44    3.12
w_f      |   -0.00    0.00   -0.00 |    0.02    0.01    0.01 |   -0.04   -0.02   -0.02 |    0.03    0.02    0.02
w_rewards |   -0.00 |    0.00 |   -0.03 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.24 |    0.25 |    0.00 |    1.47
seeker_angles |    0.00    0.01 |    0.08    0.08 |   -0.99   -0.99 |    0.99    1.00
cs_angles |  0.0042  0.0055 |  0.0784  0.0810 | -0.9917 -0.9932 |  0.9909  0.9971
optical_flow | -0.0000  0.0001 |  0.0253  0.0239 | -1.0895 -1.5202 |  1.1441  1.1055
v_err    | -0.0104 |  0.0582 | -0.4529 |  0.1027
landing_rewards |    9.48 |    2.21 |    0.00 |   10.00
landing_margin |   -0

thrust   |    0.00    0.00    0.00 |    0.68    0.69    0.69 |   -3.43   -3.38   -3.44 |    3.45    3.46    3.39
norm_thrust |    0.91 |    0.77 |    0.00 |    3.46
fuel     |    1.56 |    0.19 |    1.13 |    2.07
rewards  |  -12.34 |    5.48 |  -36.15 |   -3.63
fuel_rewards |   -4.47 |    0.55 |   -5.95 |   -3.23
glideslope_rewards |    0.00 |    0.00 |    0.00 |    0.00
glideslope_penalty |    0.00 |    0.00 |    0.00 |    0.00
glideslope |    3.04 |   13.31 |    0.01 |  907.97
norm_af  |    1.80 |    0.90 |    0.07 |    3.28
norm_wf  |    0.02 |    0.01 |    0.00 |    0.03
rh_penalty |    0.00 |    0.00 |    0.00 |    0.00
att_rewards |    0.00 |    0.00 |    0.00 |    0.00
att_penalty |    0.00 |    0.00 |    0.00 |    0.00
attitude |   -0.03    0.00    0.09 |    1.18    0.64    1.91 |   -3.14   -1.57   -3.14 |    3.14    1.57    3.14
w        |    0.00    0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.01    0.03 |    0.63

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.7111   0.7078   3.1992  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0015   0.0010   0.0036   5.4889   2.1784   2.1397
Update Cnt = 2400    ET =    987.3   Stats:  Mean, Std, Min, Max
r_f      |   24.49   -3.50    1.37 |  177.99  176.15  202.20 | -393.81 -372.48 -381.66 |  388.42  382.74  390.70
v_f      |   -0.01   -0.00   -0.00 |    0.04    0.04    0.05 |   -0.11   -0.09   -0.10 |    0.09    0.11    0.10
r_i      |   90.58   11.99   19.12 |  665.01  676.07  757.50 |-1330.19-1245.17-1285.58 | 1281.00 1218.12 1325.49
v_i      |   -0.00   -0.00   -0.00 |    0.04    0.04    0.05 |   -0.09   -0.09   -0.10 |    0.09    0.09    0.09
norm_rf  |    0.19 |    0.08 |    0.06 |    0.46
norm_vf  |    0.08 |    0.01 |    0.04 |    0.12
gs_f     |    1.21 |    1.76 |    0.01 |   15.11
thrust   |   -0.00   -0.00   -0.00 |    0.68    0.68    0.68 |   -3.41   -3.45   -3.44 |    3.42    3.37    3.41
norm_thrust |    

Dynamics: Max Disturbance (m/s^2):  [0.00138293 0.00181235 0.00221757] 0.0031803638227355514
ADV1:  -2.1000063794321756e-05 0.008393698390976567 0.049953041993087255 -0.07233780681057292
ADV2:  0.027611469578667242 0.8372827137583349 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.6274   0.6062   2.9877  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0009   0.0005   0.0022   5.4889   2.1784   2.1397
***** Episode 74716, Mean R = -11.8  Std R = 5.6  Min R = -30.2
PolicyLoss: -0.0325
Policy_Beta: 0.1
Policy_Entropy: 0.172
Policy_KL: 0.00235
Policy_SD: 0.521
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 2.72e+07
VF_0_ExplainedVarNew: 0.971
VF_0_ExplainedVarOld: 0.966
VF_0_Loss : 0.00142


ADV1:  0.0012037838736474833 0.007032233968884843 0.04046878720119157 -0.07147634089254051
ADV2:  0.010068795304489562 0.840985297879395 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.2068   1.2728   7.0907  24.5266  15.5251  10.0673
ValFun

Dynamics: Max Disturbance (m/s^2):  [0.00138293 0.00181235 0.00221757] 0.0031803638227355514
ADV1:  -0.00029249906573292474 0.0071065903696244485 0.05416047446632416 -0.04657275266003066
ADV2:  0.02298077386953245 0.8271792813171225 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.7491   0.8666   4.1335  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0005   0.0003   0.0012   5.4889   2.1784   2.1397
***** Episode 74995, Mean R = -11.4  Std R = 4.5  Min R = -26.9
PolicyLoss: -0.0245
Policy_Beta: 0.1
Policy_Entropy: 0.169
Policy_KL: 0.000821
Policy_SD: 0.534
Policy_lr_mult: 0.198
Steps: 1.19e+04
TotalSteps: 2.73e+07
VF_0_ExplainedVarNew: 0.977
VF_0_ExplainedVarOld: 0.974
VF_0_Loss : 5.19e-05


ADV1:  0.00011123467891252692 0.006386929180434083 0.07161767929134011 -0.05923723252784957
ADV2:  0.02403780272414781 0.8119544370953543 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.2808   1.4544   7.0828  24.5266  15.5251  10.0673
ValF

***** Episode 75243, Mean R = -12.7  Std R = 5.0  Min R = -24.4
PolicyLoss: -0.0316
Policy_Beta: 0.1
Policy_Entropy: 0.17
Policy_KL: 0.000853
Policy_SD: 0.546
Policy_lr_mult: 0.198
Steps: 1.15e+04
TotalSteps: 2.74e+07
VF_0_ExplainedVarNew: 0.961
VF_0_ExplainedVarOld: 0.959
VF_0_Loss : 0.00167


ADV1:  -0.0018855256646000617 0.00695717528259908 0.04139710147448389 -0.06301692457899732
ADV2:  0.033502929935443314 0.8928707616099623 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.4765   1.2505   5.5125  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0024   0.0014   0.0053   5.4889   2.1784   2.1397
***** Episode 75274, Mean R = -13.5  Std R = 7.3  Min R = -44.1
PolicyLoss: -0.0185
Policy_Beta: 0.1
Policy_Entropy: 0.169
Policy_KL: 0.00104
Policy_SD: 0.549
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 2.74e+07
VF_0_ExplainedVarNew: 0.983
VF_0_ExplainedVarOld: 0.98
VF_0_Loss : 0.00126


ADV1:  0.0024736246270715815 0.007535026371412457 0.0458

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.8423   1.7388   7.2873  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0023   0.0015   0.0056   5.4889   2.1784   2.1397
***** Episode 75522, Mean R = -13.8  Std R = 4.7  Min R = -24.5
PolicyLoss: -0.0318
Policy_Beta: 0.1
Policy_Entropy: 0.17
Policy_KL: 0.00092
Policy_SD: 0.552
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 2.75e+07
VF_0_ExplainedVarNew: 0.983
VF_0_ExplainedVarOld: 0.98
VF_0_Loss : 0.0018


ADV1:  0.0007325417491994812 0.008100325210587511 0.061775263029201666 -0.06622392264629776
ADV2:  0.021035626959146077 0.8061542191135573 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.4224   0.6888   2.9738  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0010   0.0005   0.0019   5.4889   2.1784   2.1397
***** Episode 75553, Mean R = -12.8  Std R = 5.2  Min R = -29.5
PolicyLoss: -0.0319
Policy_Beta: 0.1
Policy_Entropy: 0.17
Policy_KL: 0.000875
Polic

ADV1:  0.0015358533051640848 0.006767944181039177 0.04871487554446219 -0.05070333123207088
ADV2:  0.0011409831993186585 0.8588363682156857 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.5319   1.0907   5.3336  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0019   0.0012   0.0041   5.4889   2.1784   2.1397
***** Episode 75801, Mean R = -12.5  Std R = 4.3  Min R = -28.3
PolicyLoss: -0.0236
Policy_Beta: 0.1
Policy_Entropy: 0.168
Policy_KL: 0.000795
Policy_SD: 0.556
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 2.76e+07
VF_0_ExplainedVarNew: 0.981
VF_0_ExplainedVarOld: 0.979
VF_0_Loss : 0.0015


ADV1:  0.00016866071915526393 0.005694792208775264 0.07350648097072104 -0.046031766427564846
ADV2:  0.003922939515792369 0.8962441695255636 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.6136   0.6626   3.3802  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0003   0.0002   0.0006   5.4889   2.1784   2.

ADV1:  -8.960391242735084e-05 0.008961831004713039 0.029014884127202628 -0.061300601889177186
ADV2:  0.03053648188053065 0.8362010880244594 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.6172   1.6242   5.5425  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0001   0.0001   0.0004   5.4889   2.1784   2.1397
***** Episode 76080, Mean R = -12.2  Std R = 4.9  Min R = -25.9
PolicyLoss: -0.0347
Policy_Beta: 0.1
Policy_Entropy: 0.168
Policy_KL: 0.00106
Policy_SD: 0.545
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 2.77e+07
VF_0_ExplainedVarNew: 0.963
VF_0_ExplainedVarOld: 0.959
VF_0_Loss : 0.0015


ADV1:  0.00044109156432375115 0.005200892552162162 0.0385684076832864 -0.044672609184677414
ADV2:  -0.004104368431190891 0.9254117871162293 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.1413   1.4825   6.5164  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0005   0.0003   0.0011   5.4889   2.1784   2.

ADV1:  0.001637900337833019 0.005494352858434515 0.03811732073624933 -0.054715136149237065
ADV2:  -0.0116381261543719 0.8870361639430933 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.5252   1.9503   7.0532  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0018   0.0012   0.0042   5.4889   2.1784   2.1397
***** Episode 76359, Mean R = -11.1  Std R = 3.4  Min R = -18.2
PolicyLoss: -0.0118
Policy_Beta: 0.1
Policy_Entropy: 0.172
Policy_KL: 0.000854
Policy_SD: 0.528
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 2.78e+07
VF_0_ExplainedVarNew: 0.986
VF_0_ExplainedVarOld: 0.984
VF_0_Loss : 5.88e-05


ADV1:  -0.0023570354487759226 0.008920907844189831 0.03666920949974489 -0.06333408985154634
ADV2:  0.04805217011447051 0.8334504418966685 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.6312   1.4354   7.2644  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0025   0.0016   0.0061   5.4889   2.1784   2.13

ADV1:  0.0001529143378126257 0.004913186001207395 0.04092289637555552 -0.05868130267419025
ADV2:  0.0012119687670060235 0.8692356506424797 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.6060   0.6969   3.2926  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0004   0.0003   0.0010   5.4889   2.1784   2.1397
***** Episode 76638, Mean R = -10.2  Std R = 3.6  Min R = -21.1
PolicyLoss: -0.00715
Policy_Beta: 0.1
Policy_Entropy: 0.172
Policy_KL: 0.000929
Policy_SD: 0.529
Policy_lr_mult: 0.198
Steps: 1.18e+04
TotalSteps: 2.79e+07
VF_0_ExplainedVarNew: 0.987
VF_0_ExplainedVarOld: 0.985
VF_0_Loss : 0.00582


ADV1:  0.0010902392287510112 0.005125759047828589 0.06963404600294082 -0.03663830359942988
ADV2:  -0.019667819241591316 0.896247349228904 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.5933   0.8238   3.1106  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0014   0.0008   0.0031   5.4889   2.1784   2.

seeker_angles |    0.01    0.00 |    0.07    0.08 |   -0.96   -0.98 |    1.00    0.98
cs_angles |  0.0050  0.0038 |  0.0725  0.0780 | -0.9630 -0.9752 |  0.9967  0.9810
optical_flow |  0.0000 -0.0000 |  0.0241  0.0235 | -1.0917 -1.0422 |  1.0759  1.0871
v_err    | -0.0105 |  0.0585 | -0.4534 |  0.0963
landing_rewards |    9.84 |    1.26 |    0.00 |   10.00
landing_margin |   -0.03 |    0.01 |   -0.06 |    0.01
tracking_rewards |  -16.69 |    3.84 |  -33.37 |   -8.83
steps    |     377 |      19 |     335 |     411
***** Episode 76917, Mean R = -11.1  Std R = 4.0  Min R = -19.9
PolicyLoss: 0.00242
Policy_Beta: 0.1
Policy_Entropy: 0.169
Policy_KL: 0.000626
Policy_SD: 0.539
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 2.8e+07
VF_0_ExplainedVarNew: 0.988
VF_0_ExplainedVarOld: 0.986
VF_0_Loss : 0.00111


ADV1:  0.00031634236684110323 0.005190743051153215 0.042737739563814214 -0.03720982105334408
ADV2:  0.0006742287670991109 0.8953611116694491 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/M

attitude |    0.07   -0.03    0.01 |    1.19    0.64    1.88 |   -3.14   -1.54   -3.14 |    3.14    1.54    3.14
w        |   -0.00    0.00   -0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.04    0.06 |    0.64    1.90 |   -1.52   -3.10 |    1.51    3.13
w_f      |   -0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.03   -0.03   -0.02 |    0.03    0.03    0.02
w_rewards |   -0.00 |    0.00 |   -0.01 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.24 |    0.26 |    0.00 |    1.58
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -0.98   -1.00 |    1.00    0.99
cs_angles |  0.0029  0.0030 |  0.0768  0.0810 | -0.9791 -0.9987 |  0.9984  0.9880
optical_flow |  0.0001  0.0000 |  0.0243  0.0241 | -1.0785 -1.2228 |  1.0411  1.0841
v_err    | -0.0102 |  0.0583 | -0.4521 |  0.0989
landing_rewards |    9.58 |    2.00 |    0.00 |   10.00
landing_margin |   -0

attitude |   -0.02   -0.03   -0.07 |    1.17    0.65    1.85 |   -3.14   -1.49   -3.14 |    3.14    1.51    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.02   -0.05 |    0.65    1.85 |   -1.43   -3.14 |    1.46    3.14
w_f      |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.02 |    0.03    0.02    0.02
w_rewards |    0.00 |    0.00 |    0.00 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.24 |    0.26 |    0.00 |    1.59
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -0.99   -1.00 |    0.98    0.94
cs_angles |  0.0015  0.0044 |  0.0782  0.0795 | -0.9918 -0.9993 |  0.9820  0.9416
optical_flow |  0.0000  0.0000 |  0.0244  0.0237 | -1.1079 -1.2929 |  1.1031  0.9937
v_err    | -0.0106 |  0.0589 | -0.4524 |  0.1100
landing_rewards |    9.71 |    1.68 |    0.00 |   10.00
landing_margin |   -0

attitude |   -0.05    0.01    0.18 |    1.16    0.66    1.83 |   -3.14   -1.56   -3.14 |    3.14    1.57    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.02    0.07 |    0.66    1.84 |   -1.39   -3.14 |    1.44    3.12
w_f      |    0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.02 |    0.04    0.03    0.02
w_rewards |    0.00 |    0.00 |    0.00 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.23 |    0.25 |    0.00 |    1.74
seeker_angles |    0.00    0.01 |    0.08    0.08 |   -0.99   -0.99 |    0.99    1.00
cs_angles |  0.0029  0.0051 |  0.0751  0.0786 | -0.9946 -0.9927 |  0.9922  0.9999
optical_flow | -0.0001 -0.0001 |  0.0243  0.0232 | -1.0037 -1.0048 |  1.0558  1.1928
v_err    | -0.0105 |  0.0583 | -0.4522 |  0.1150
landing_rewards |    9.48 |    2.21 |    0.00 |   10.00
landing_margin |   -0

attitude |    0.05   -0.02   -0.08 |    1.14    0.66    1.83 |   -3.14   -1.53   -3.14 |    3.14    1.55    3.14
w        |   -0.00    0.00   -0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.01   -0.18 |    0.66    1.83 |   -1.38   -3.14 |    1.45    3.13
w_f      |   -0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.02 |    0.04    0.03    0.03
w_rewards |    0.00 |    0.00 |    0.00 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.23 |    0.25 |    0.00 |    1.46
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -0.98   -0.97 |    0.99    1.00
cs_angles |  0.0025  0.0047 |  0.0759  0.0802 | -0.9792 -0.9722 |  0.9874  0.9963
optical_flow |  0.0001 -0.0000 |  0.0250  0.0238 | -1.1819 -1.1654 |  1.1106  1.0422
v_err    | -0.0102 |  0.0581 | -0.4532 |  0.1031
landing_rewards |    9.68 |    1.77 |    0.00 |   10.00
landing_margin |   -0

attitude |   -0.01    0.01   -0.28 |    1.05    0.64    1.77 |   -3.14   -1.52   -3.14 |    3.12    1.57    3.14
w        |   -0.00    0.00   -0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.01   -0.20 |    0.65    1.79 |   -1.37   -3.11 |    1.52    3.09
w_f      |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.04   -0.02   -0.03 |    0.04    0.02    0.03
w_rewards |   -0.00 |    0.00 |   -0.01 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.23 |    0.25 |    0.00 |    1.35
seeker_angles |    0.01    0.00 |    0.08    0.08 |   -1.00   -0.92 |    0.97    0.99
cs_angles |  0.0054  0.0033 |  0.0757  0.0800 | -0.9966 -0.9156 |  0.9728  0.9944
optical_flow | -0.0001 -0.0000 |  0.0236  0.0216 | -1.1648 -1.2279 |  0.8625  0.9500
v_err    | -0.0102 |  0.0584 | -0.4531 |  0.1015
landing_rewards |    9.68 |    1.77 |    0.00 |   10.00
landing_margin |   -0

attitude |    0.04   -0.03   -0.02 |    1.15    0.63    1.82 |   -3.14   -1.56   -3.14 |    3.14    1.56    3.14
w        |   -0.00   -0.00   -0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.03   -0.01 |    0.64    1.81 |   -1.52   -3.11 |    1.44    3.12
w_f      |   -0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.04   -0.02   -0.02 |    0.04    0.03    0.03
w_rewards |    0.00 |    0.00 |    0.00 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.24 |    0.25 |    0.00 |    1.53
seeker_angles |    0.01    0.01 |    0.08    0.08 |   -0.95   -0.99 |    0.97    0.98
cs_angles |  0.0066  0.0058 |  0.0783  0.0804 | -0.9465 -0.9925 |  0.9716  0.9837
optical_flow |  0.0000  0.0001 |  0.0237  0.0244 | -1.1135 -1.1014 |  1.0997  0.9228
v_err    | -0.0102 |  0.0582 | -0.4518 |  0.1044
landing_rewards |    9.52 |    2.15 |    0.00 |   10.00
landing_margin |   -0

attitude |    0.03    0.03    0.16 |    1.15    0.66    1.85 |   -3.14   -1.56   -3.14 |    3.14    1.57    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.03    0.10 |    0.66    1.85 |   -1.39   -3.11 |    1.54    3.13
w_f      |   -0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.05   -0.01   -0.02 |    0.04    0.02    0.03
w_rewards |   -0.00 |    0.00 |   -0.02 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.23 |    0.25 |    0.00 |    1.45
seeker_angles |    0.01    0.00 |    0.08    0.08 |   -1.00   -0.94 |    0.96    0.99
cs_angles |  0.0067  0.0035 |  0.0754  0.0777 | -0.9999 -0.9414 |  0.9587  0.9928
optical_flow |  0.0000  0.0000 |  0.0239  0.0228 | -1.3361 -0.9180 |  0.8356  1.1161
v_err    | -0.0103 |  0.0577 | -0.4536 |  0.1085
landing_rewards |    9.71 |    1.68 |    0.00 |   10.00
landing_margin |   -0

attitude |   -0.15   -0.02    0.10 |    1.12    0.67    1.79 |   -3.14   -1.54   -3.14 |    3.14    1.56    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.02    0.11 |    0.67    1.80 |   -1.46   -3.10 |    1.52    3.12
w_f      |    0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.02 |    0.04    0.02    0.02
w_rewards |    0.00 |    0.00 |    0.00 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.23 |    0.25 |    0.00 |    1.54
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -0.96   -0.99 |    0.97    1.00
cs_angles |  0.0035  0.0017 |  0.0767  0.0753 | -0.9590 -0.9893 |  0.9730  0.9960
optical_flow |  0.0000  0.0001 |  0.0239  0.0234 | -1.0234 -1.0442 |  1.1572  1.1315
v_err    | -0.0106 |  0.0583 | -0.4523 |  0.1060
landing_rewards |    9.65 |    1.85 |    0.00 |   10.00
landing_margin |   -0

thrust   |    0.00    0.00   -0.00 |    0.67    0.69    0.68 |   -3.46   -3.46   -3.42 |    3.42    3.43    3.44
norm_thrust |    0.90 |    0.76 |    0.00 |    3.46
fuel     |    1.53 |    0.20 |    1.06 |    2.35
rewards  |  -12.10 |    5.33 |  -44.69 |   -4.10
fuel_rewards |   -4.38 |    0.58 |   -6.73 |   -3.04
glideslope_rewards |    0.00 |    0.00 |    0.00 |    0.00
glideslope_penalty |    0.00 |    0.00 |    0.00 |    0.00
glideslope |    2.96 |   13.05 |    0.01 |  694.29
norm_af  |    1.75 |    0.89 |    0.02 |    3.25
norm_wf  |    0.01 |    0.01 |    0.00 |    0.04
rh_penalty |    0.00 |    0.00 |    0.00 |    0.00
att_rewards |    0.00 |    0.00 |    0.00 |    0.00
att_penalty |    0.00 |    0.00 |    0.00 |    0.00
attitude |   -0.00    0.06    0.01 |    1.18    0.66    1.84 |   -3.14   -1.54   -3.14 |    3.14    1.57    3.14
w        |   -0.00    0.00   -0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.07    0.02 |    0.66

ADV1:  -0.0009618875874461912 0.006628496797027058 0.053542063965520026 -0.057129333962131046
ADV2:  0.029777387122090267 0.797029966748898 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   3.9044   1.3374   7.6360  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0009   0.0006   0.0025   5.4889   2.1784   2.1397
Update Cnt = 2580    ET =   1111.1   Stats:  Mean, Std, Min, Max
r_f      |    1.85    9.70  -16.84 |  183.17  170.56  202.33 | -389.16 -376.19 -392.98 |  391.14  395.76  373.17
v_f      |   -0.00   -0.00    0.00 |    0.04    0.04    0.05 |   -0.11   -0.09   -0.09 |    0.09    0.08    0.10
r_i      |   12.48   22.81  -61.67 |  686.21  623.93  787.94 |-1330.75-1373.34-1321.23 | 1285.62 1375.23 1327.07
v_i      |   -0.00   -0.00    0.00 |    0.04    0.04    0.05 |   -0.10   -0.09   -0.09 |    0.09    0.09    0.10
norm_rf  |    0.19 |    0.08 |    0.03 |    0.47
norm_vf  |    0.07 |    0.01 |    0.04 |    0.13
gs_f     |    1.36 |    2.01 |

Dynamics: Max Disturbance (m/s^2):  [0.00138293 0.00181235 0.00221757] 0.0031803638227355514
ADV1:  0.00039912235021855724 0.006859183896513463 0.05239221939128036 -0.06114964093787417
ADV2:  0.015231353296234717 0.8151057579224498 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.7005   1.0229   6.0680  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0010   0.0005   0.0020   5.4889   2.1784   2.1397
***** Episode 80296, Mean R = -11.5  Std R = 4.1  Min R = -24.5
PolicyLoss: -0.0231
Policy_Beta: 0.1
Policy_Entropy: 0.175
Policy_KL: 0.000747
Policy_SD: 0.528
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 2.93e+07
VF_0_ExplainedVarNew: 0.98
VF_0_ExplainedVarOld: 0.978
VF_0_Loss : 0.000223


ADV1:  -0.00040736426050575267 0.006958649945476478 0.04129103898295633 -0.07602353527972716
ADV2:  0.024697418042998596 0.857402197665931 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.1063   0.9793   4.7669  24.5266  15.5251  10.0673
ValFu

***** Episode 80544, Mean R = -10.4  Std R = 4.0  Min R = -20.6
PolicyLoss: -0.0252
Policy_Beta: 0.1
Policy_Entropy: 0.177
Policy_KL: 0.000746
Policy_SD: 0.517
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 2.94e+07
VF_0_ExplainedVarNew: 0.982
VF_0_ExplainedVarOld: 0.979
VF_0_Loss : 0.000633


ADV1:  -0.0012580154049533748 0.005124132041657572 0.0240677564233599 -0.04864702440539698
ADV2:  0.023721688955497987 0.9286087853910423 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   3.2845   1.6968   9.1801  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0014   0.0009   0.0032   5.4889   2.1784   2.1397
***** Episode 80575, Mean R = -10.7  Std R = 4.0  Min R = -23.3
PolicyLoss: -0.0098
Policy_Beta: 0.1
Policy_Entropy: 0.176
Policy_KL: 0.000915
Policy_SD: 0.521
Policy_lr_mult: 0.198
Steps: 1.18e+04
TotalSteps: 2.94e+07
VF_0_ExplainedVarNew: 0.989
VF_0_ExplainedVarOld: 0.986
VF_0_Loss : 0.00044


ADV1:  7.690712217061107e-06 0.007951219295281236 0.

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.8725   1.7476   6.7523  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0009   0.0005   0.0020   5.4889   2.1784   2.1397
***** Episode 80823, Mean R = -12.8  Std R = 5.2  Min R = -27.2
PolicyLoss: -0.0241
Policy_Beta: 0.1
Policy_Entropy: 0.174
Policy_KL: 0.00086
Policy_SD: 0.531
Policy_lr_mult: 0.198
Steps: 1.19e+04
TotalSteps: 2.95e+07
VF_0_ExplainedVarNew: 0.966
VF_0_ExplainedVarOld: 0.962
VF_0_Loss : 0.00103


ADV1:  0.0023334654486849263 0.00799396179650261 0.05969916879368398 -0.09328041228644146
ADV2:  -0.0009403833719597959 0.8652282674373979 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   3.1219   1.9865  10.7571  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0024   0.0016   0.0061   5.4889   2.1784   2.1397
***** Episode 80854, Mean R = -13.2  Std R = 5.9  Min R = -29.2
PolicyLoss: -0.0223
Policy_Beta: 0.1
Policy_Entropy: 0.175
Policy_KL: 0.00103
Po

ADV1:  -0.0012710759924908813 0.0058135910116204155 0.033901317769203104 -0.06286512367008495
ADV2:  0.03094996166402599 0.8320865360925295 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.8956   1.2836   7.0443  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0015   0.0008   0.0032   5.4889   2.1784   2.1397
***** Episode 81102, Mean R = -10.1  Std R = 4.6  Min R = -28.3
PolicyLoss: -0.0215
Policy_Beta: 0.1
Policy_Entropy: 0.173
Policy_KL: 0.00108
Policy_SD: 0.524
Policy_lr_mult: 0.198
Steps: 1.19e+04
TotalSteps: 2.96e+07
VF_0_ExplainedVarNew: 0.988
VF_0_ExplainedVarOld: 0.981
VF_0_Loss : 0.00116


ADV1:  0.0011032699645868351 0.006692236593756625 0.04915603105539079 -0.0541682564309233
ADV2:  0.00973495625724162 0.8435837909058695 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.7976   1.0166   5.3498  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0014   0.0008   0.0029   5.4889   2.1784   2.139

***** Episode 81350, Mean R = -12.5  Std R = 3.6  Min R = -20.9
PolicyLoss: -0.0109
Policy_Beta: 0.1
Policy_Entropy: 0.175
Policy_KL: 0.000833
Policy_SD: 0.525
Policy_lr_mult: 0.198
Steps: 1.2e+04
TotalSteps: 2.97e+07
VF_0_ExplainedVarNew: 0.989
VF_0_ExplainedVarOld: 0.984
VF_0_Loss : 7.54e-05


ADV1:  0.0017650285976011303 0.005580004014205959 0.04924389233096049 -0.04684687181592573
ADV2:  -0.003653735411875188 0.8649792604737365 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.9218   1.2052   6.6924  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0030   0.0017   0.0062   5.4889   2.1784   2.1397
***** Episode 81381, Mean R = -10.5  Std R = 5.4  Min R = -31.8
PolicyLoss: -0.0182
Policy_Beta: 0.1
Policy_Entropy: 0.175
Policy_KL: 0.000953
Policy_SD: 0.513
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 2.97e+07
VF_0_ExplainedVarNew: 0.989
VF_0_ExplainedVarOld: 0.984
VF_0_Loss : 0.000164


ADV1:  -0.0025539363604779636 0.007099927292866394 

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.1516   1.0985   5.3639  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0021   0.0013   0.0048   5.4889   2.1784   2.1397
***** Episode 81629, Mean R = -11.4  Std R = 3.8  Min R = -19.6
PolicyLoss: -0.00473
Policy_Beta: 0.1
Policy_Entropy: 0.174
Policy_KL: 0.000759
Policy_SD: 0.54
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 2.98e+07
VF_0_ExplainedVarNew: 0.989
VF_0_ExplainedVarOld: 0.985
VF_0_Loss : 0.00012


ADV1:  -0.001720042626212476 0.00821059883007364 0.03608688234511459 -0.07251118407850998
ADV2:  0.0442142132249822 0.8302246075126901 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   3.4992   2.2182  11.1528  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0018   0.0012   0.0045   5.4889   2.1784   2.1397
***** Episode 81660, Mean R = -11.5  Std R = 6.1  Min R = -26.2
PolicyLoss: -0.0349
Policy_Beta: 0.1
Policy_Entropy: 0.172
Policy_KL: 0.000819
Poli

ADV1:  0.0028025704231546436 0.005798769834707605 0.0634167144912613 -0.07898302829976334
ADV2:  -0.027596090563560972 0.865047154342023 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   3.3695   2.1013  10.9770  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0029   0.0019   0.0072   5.4889   2.1784   2.1397
***** Episode 81908, Mean R = -11.1  Std R = 4.0  Min R = -19.7
PolicyLoss: -0.008
Policy_Beta: 0.1
Policy_Entropy: 0.175
Policy_KL: 0.000947
Policy_SD: 0.528
Policy_lr_mult: 0.198
Steps: 1.15e+04
TotalSteps: 2.99e+07
VF_0_ExplainedVarNew: 0.989
VF_0_ExplainedVarOld: 0.985
VF_0_Loss : 3.34e-05


ADV1:  -0.0027878093380431686 0.009366272332341137 0.06845044658437116 -0.07378790868863762
ADV2:  0.03908762064234518 0.8687513748622694 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   3.0253   1.7500   8.8678  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0028   0.0018   0.0073   5.4889   2.1784   2.139

cs_angles |  0.0025  0.0042 |  0.0742  0.0773 | -0.9772 -0.9796 |  0.9962  0.9661
optical_flow | -0.0000 -0.0001 |  0.0251  0.0223 | -1.1081 -1.1721 |  1.1316  0.9095
v_err    | -0.0103 |  0.0580 | -0.4520 |  0.1036
landing_rewards |    9.55 |    2.08 |    0.00 |   10.00
landing_margin |   -0.03 |    0.01 |   -0.06 |    0.01
tracking_rewards |  -16.57 |    3.57 |  -34.59 |   -9.89
steps    |     377 |      21 |     334 |     421
***** Episode 82187, Mean R = -12.2  Std R = 4.2  Min R = -25.1
PolicyLoss: -0.000952
Policy_Beta: 0.1
Policy_Entropy: 0.175
Policy_KL: 0.000952
Policy_SD: 0.528
Policy_lr_mult: 0.198
Steps: 1.18e+04
TotalSteps: 3e+07
VF_0_ExplainedVarNew: 0.991
VF_0_ExplainedVarOld: 0.987
VF_0_Loss : 2.47e-05


ADV1:  0.0009326786706380064 0.0069198617910617806 0.03868844378285419 -0.06165293463127965
ADV2:  0.01593999023480402 0.8219556961154653 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.9198   0.3842   1.6154  24.5266  15.5251  10.0673
ValFun  Gradients: u

attitude |   -0.06   -0.02    0.16 |    1.19    0.66    1.85 |   -3.14   -1.57   -3.14 |    3.14    1.56    3.14
w        |    0.00    0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.02    0.21 |    0.65    1.84 |   -1.41   -3.12 |    1.47    3.13
w_f      |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.04   -0.03   -0.02 |    0.03    0.03    0.02
w_rewards |   -0.00 |    0.00 |   -0.03 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.23 |    0.25 |    0.00 |    1.60
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -0.96   -1.00 |    0.95    0.99
cs_angles |  0.0009  0.0031 |  0.0751  0.0789 | -0.9647 -0.9995 |  0.9494  0.9850
optical_flow |  0.0001  0.0001 |  0.0239  0.0237 | -1.0976 -1.1844 |  1.0039  1.4406
v_err    | -0.0103 |  0.0587 | -0.4521 |  0.1076
landing_rewards |    9.71 |    1.68 |    0.00 |   10.00
landing_margin |   -0

attitude |   -0.03   -0.03   -0.01 |    1.09    0.65    1.77 |   -3.14   -1.57   -3.14 |    3.14    1.57    3.14
w        |    0.00    0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.03   -0.02 |    0.65    1.77 |   -1.52   -3.13 |    1.45    3.11
w_f      |   -0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.03   -0.03   -0.02 |    0.03    0.03    0.02
w_rewards |    0.00 |    0.00 |    0.00 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.23 |    0.24 |    0.00 |    1.39
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -1.00   -0.99 |    0.93    0.99
cs_angles |  0.0019  0.0049 |  0.0761  0.0777 | -0.9968 -0.9902 |  0.9286  0.9944
optical_flow |  0.0000 -0.0002 |  0.0230  0.0224 | -1.1602 -1.0776 |  1.0734  0.9726
v_err    | -0.0100 |  0.0584 | -0.4535 |  0.1102
landing_rewards |    9.61 |    1.93 |    0.00 |   10.00
landing_margin |   -0

thrust   |    0.00    0.00    0.00 |    0.66    0.68    0.68 |   -3.34   -3.44   -3.41 |    3.46    3.37    3.46
norm_thrust |    0.88 |    0.77 |    0.00 |    3.46
fuel     |    1.49 |    0.19 |    1.07 |    2.19
rewards  |  -11.65 |    4.64 |  -31.13 |   -3.68
fuel_rewards |   -4.27 |    0.53 |   -6.26 |   -3.06
glideslope_rewards |    0.00 |    0.00 |    0.00 |    0.00
glideslope_penalty |    0.00 |    0.00 |    0.00 |    0.00
glideslope |    2.80 |   12.49 |    0.01 |  330.80
norm_af  |    1.76 |    0.90 |    0.09 |    3.42
norm_wf  |    0.01 |    0.01 |    0.00 |    0.04
rh_penalty |    0.00 |    0.00 |    0.00 |    0.00
att_rewards |    0.00 |    0.00 |    0.00 |    0.00
att_penalty |    0.00 |    0.00 |    0.00 |    0.00
attitude |    0.01   -0.02   -0.11 |    1.18    0.65    1.86 |   -3.14   -1.48   -3.14 |    3.14    1.56    3.14
w        |    0.00    0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.02   -0.11 |    0.65

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.9125   1.0530   5.6736  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0014   0.0008   0.0034   5.4889   2.1784   2.1397
Update Cnt = 2690    ET =   1172.1   Stats:  Mean, Std, Min, Max
r_f      |    4.18   -6.15   -5.32 |  188.77  165.57  205.40 | -387.16 -391.78 -390.82 |  393.64  345.43  388.51
v_f      |    0.00    0.00    0.00 |    0.04    0.04    0.05 |   -0.11   -0.11   -0.08 |    0.09    0.09    0.11
r_i      |   -3.59  -25.00  -27.47 |  710.01  630.93  775.71 |-1328.52-1286.01-1367.38 | 1362.29 1193.19 1314.35
v_i      |   -0.00    0.00    0.00 |    0.04    0.04    0.05 |   -0.10   -0.09   -0.10 |    0.09    0.08    0.10
norm_rf  |    0.19 |    0.08 |    0.03 |    0.45
norm_vf  |    0.08 |    0.01 |    0.04 |    0.12
gs_f     |    1.52 |    3.16 |    0.00 |   39.65
thrust   |   -0.00    0.00    0.00 |    0.67    0.68    0.67 |   -3.46   -3.21   -3.44 |    3.45    3.44    3.42
norm_thrust |    

ADV1:  0.001986929483876325 0.009591498800551353 0.11440483865301643 -0.0561241106966894
ADV2:  -0.008786819466634304 0.8189821825233093 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.3605   0.7246   3.7940  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0028   0.0016   0.0053   5.4889   2.1784   2.1397
***** Episode 83706, Mean R = -12.5  Std R = 8.9  Min R = -54.5
PolicyLoss: -0.00702
Policy_Beta: 0.1
Policy_Entropy: 0.175
Policy_KL: 0.000963
Policy_SD: 0.527
Policy_lr_mult: 0.198
Steps: 1.18e+04
TotalSteps: 3.06e+07
VF_0_ExplainedVarNew: 0.972
VF_0_ExplainedVarOld: 0.962
VF_0_Loss : 0.00141


Dynamics: Max Disturbance (m/s^2):  [0.00138293 0.00181235 0.00221757] 0.0031803638227355514
ADV1:  -0.0012339410950400536 0.007671584609689144 0.046823596149578706 -0.05853637149869445
ADV2:  0.03888934584207472 0.8325296422238115 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.9377   0.8258   4.6757  24.5266  15.5251  10.0673
ValFun

***** Episode 83954, Mean R = -11.7  Std R = 5.3  Min R = -30.3
PolicyLoss: -0.00421
Policy_Beta: 0.0667
Policy_Entropy: 0.174
Policy_KL: 0.00304
Policy_SD: 0.54
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 3.07e+07
VF_0_ExplainedVarNew: 0.986
VF_0_ExplainedVarOld: 0.985
VF_0_Loss : 0.00141


Dynamics: Max Disturbance (m/s^2):  [0.00138293 0.00181235 0.00221757] 0.0031803638227355514
ADV1:  0.0014413896037560763 0.006831650870309326 0.060986666095689146 -0.0461855776133609
ADV2:  0.0024409641601909307 0.8457853438540861 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   9.3578   7.3137  19.6856  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0021   0.0012   0.0043   5.4889   2.1784   2.1397
***** Episode 83985, Mean R = -11.6  Std R = 5.1  Min R = -25.2
PolicyLoss: -0.02
Policy_Beta: 0.0667
Policy_Entropy: 0.176
Policy_KL: 0.00172
Policy_SD: 0.53
Policy_lr_mult: 0.198
Steps: 1.18e+04
TotalSteps: 3.07e+07
VF_0_ExplainedVarNew: 0.981
VF_0_Exp

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.1144   1.0983   6.1153  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0007   0.0004   0.0016   5.4889   2.1784   2.1397
***** Episode 84233, Mean R = -10.7  Std R = 3.8  Min R = -21.0
PolicyLoss: -0.034
Policy_Beta: 0.1
Policy_Entropy: 0.176
Policy_KL: 0.000868
Policy_SD: 0.527
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 3.08e+07
VF_0_ExplainedVarNew: 0.979
VF_0_ExplainedVarOld: 0.976
VF_0_Loss : 4.15e-05


Dynamics: Max Disturbance (m/s^2):  [0.00138293 0.00181235 0.00221757] 0.0031803638227355514
ADV1:  -0.0008733594133176807 0.00626506636610266 0.08781474359171088 -0.05772130867198655
ADV2:  0.02101381586621333 0.8530554819567854 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.2483   0.8276   3.5996  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0011   0.0006   0.0023   5.4889   2.1784   2.1397
***** Episode 84264, Mean R = -12.2  Std R = 4.9  Mi

Dynamics: Max Disturbance (m/s^2):  [0.00138293 0.00181235 0.00221757] 0.0031803638227355514
ADV1:  -9.145147261935395e-05 0.006924278189942177 0.042731242017342685 -0.05642389405961462
ADV2:  0.027285478702460765 0.8082714947437514 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.6400   1.1101   5.3995  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0002   0.0001   0.0006   5.4889   2.1784   2.1397
***** Episode 84512, Mean R = -10.3  Std R = 4.6  Min R = -23.6
PolicyLoss: -0.0311
Policy_Beta: 0.1
Policy_Entropy: 0.176
Policy_KL: 0.000644
Policy_SD: 0.531
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 3.09e+07
VF_0_ExplainedVarNew: 0.979
VF_0_ExplainedVarOld: 0.973
VF_0_Loss : 0.000164


ADV1:  -0.00063834055346067 0.006859550550169921 0.03955203716459932 -0.06263527573702549
ADV2:  0.036406077147075194 0.8026266517487 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.1202   1.2584   6.9453  24.5266  15.5251  10.0673
ValFun  

Dynamics: Max Disturbance (m/s^2):  [0.00138293 0.00181235 0.00221757] 0.0031803638227355514
ADV1:  0.000929453995830357 0.007498252907897881 0.041616515280597455 -0.0899978816566731
ADV2:  0.017057196091377114 0.799672330744781 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.4118   1.7656   8.7997  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0011   0.0007   0.0025   5.4889   2.1784   2.1397
***** Episode 84791, Mean R = -12.4  Std R = 5.7  Min R = -34.1
PolicyLoss: -0.0282
Policy_Beta: 0.1
Policy_Entropy: 0.173
Policy_KL: 0.000642
Policy_SD: 0.535
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 3.1e+07
VF_0_ExplainedVarNew: 0.985
VF_0_ExplainedVarOld: 0.978
VF_0_Loss : 4.04e-05


ADV1:  -0.0005773878325776904 0.007000478697453011 0.048323414368062395 -0.052916029781797796
ADV2:  0.024671130778461885 0.8370987788927864 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.3193   1.7353   8.4954  24.5266  15.5251  10.0673
ValFun

***** Episode 85039, Mean R = -13.3  Std R = 6.7  Min R = -29.0
PolicyLoss: -0.0238
Policy_Beta: 0.1
Policy_Entropy: 0.176
Policy_KL: 0.00117
Policy_SD: 0.526
Policy_lr_mult: 0.198
Steps: 1.19e+04
TotalSteps: 3.11e+07
VF_0_ExplainedVarNew: 0.947
VF_0_ExplainedVarOld: 0.94
VF_0_Loss : 0.000191


ADV1:  0.005031948466034107 0.009216341755548342 0.10378051479101558 -0.09025078510744083
ADV2:  -0.019926239441805632 0.8163808172831699 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.6300   0.9100   4.8674  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0056   0.0036   0.0130   5.4889   2.1784   2.1397
***** Episode 85070, Mean R = -12.0  Std R = 6.3  Min R = -30.8
PolicyLoss: -0.0208
Policy_Beta: 0.1
Policy_Entropy: 0.177
Policy_KL: 0.00127
Policy_SD: 0.521
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 3.11e+07
VF_0_ExplainedVarNew: 0.979
VF_0_ExplainedVarOld: 0.965
VF_0_Loss : 0.00082


ADV1:  -0.0029922970283598007 0.006771110382870383 0.06

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.4909   0.5390   2.9281  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0030   0.0017   0.0060   5.4889   2.1784   2.1397
***** Episode 85318, Mean R = -11.3  Std R = 4.3  Min R = -24.0
PolicyLoss: -0.0227
Policy_Beta: 0.1
Policy_Entropy: 0.179
Policy_KL: 0.000985
Policy_SD: 0.525
Policy_lr_mult: 0.198
Steps: 1.15e+04
TotalSteps: 3.12e+07
VF_0_ExplainedVarNew: 0.981
VF_0_ExplainedVarOld: 0.978
VF_0_Loss : 0.00266


ADV1:  -0.0014056099773746419 0.006714567195738679 0.0556573680186091 -0.04663608435325555
ADV2:  0.029649943372495578 0.8630938794527357 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   3.3144   2.3423  10.0288  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0014   0.0009   0.0036   5.4889   2.1784   2.1397
***** Episode 85349, Mean R = -12.7  Std R = 8.0  Min R = -44.3
PolicyLoss: -0.0215
Policy_Beta: 0.1
Policy_Entropy: 0.178
Policy_KL: 0.000793
P

optical_flow |  0.0001  0.0001 |  0.0254  0.0228 | -1.4177 -1.3431 |  1.0929  1.0700
v_err    | -0.0101 |  0.0585 | -0.4533 |  0.1025
landing_rewards |    9.68 |    1.77 |    0.00 |   10.00
landing_margin |   -0.03 |    0.01 |   -0.07 |    0.02
tracking_rewards |  -17.27 |    4.65 |  -47.87 |   -9.73
steps    |     377 |      20 |     330 |     418
***** Episode 85597, Mean R = -9.9  Std R = 4.0  Min R = -20.1
PolicyLoss: -0.0012
Policy_Beta: 0.15
Policy_Entropy: 0.178
Policy_KL: 0.0015
Policy_SD: 0.517
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 3.13e+07
VF_0_ExplainedVarNew: 0.986
VF_0_ExplainedVarOld: 0.98
VF_0_Loss : 0.000183


ADV1:  -0.0010397813505670333 0.005316570042029763 0.047954278685723495 -0.04090605131702535
ADV2:  0.01879294365043789 0.9121459522945532 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.8182   1.1049   5.7594  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0018   0.0011   0.0042   5.4889   2.1784   2.1397


w        |    0.00    0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.07   -0.04 |    0.62    1.94 |   -1.35   -3.14 |    1.41    3.14
w_f      |    0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.02 |    0.03    0.02    0.02
w_rewards |   -0.00 |    0.00 |   -0.02 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.23 |    0.25 |    0.00 |    1.71
seeker_angles |    0.00    0.00 |    0.07    0.08 |   -0.98   -0.97 |    0.99    0.99
cs_angles |  0.0035  0.0024 |  0.0749  0.0801 | -0.9765 -0.9738 |  0.9911  0.9940
optical_flow | -0.0000  0.0001 |  0.0249  0.0232 | -1.0646 -1.1065 |  1.0128  1.1134
v_err    | -0.0099 |  0.0580 | -0.4524 |  0.1009
landing_rewards |    9.71 |    1.68 |    0.00 |   10.00
landing_margin |   -0.02 |    0.01 |   -0.06 |    0.02
tracking_rewards |  -16.89 |    3.81 |  -32.05 |  -10.16
steps    |     377 |  

norm_thrust |    0.88 |    0.76 |    0.00 |    3.46
fuel     |    1.49 |    0.17 |    1.02 |    1.96
rewards  |  -11.29 |    4.57 |  -36.79 |   -3.42
fuel_rewards |   -4.27 |    0.48 |   -5.62 |   -2.93
glideslope_rewards |    0.00 |    0.00 |    0.00 |    0.00
glideslope_penalty |    0.00 |    0.00 |    0.00 |    0.00
glideslope |    3.01 |   13.12 |    0.01 |  557.25
norm_af  |    1.72 |    0.89 |    0.06 |    3.33
norm_wf  |    0.01 |    0.01 |    0.00 |    0.03
rh_penalty |    0.00 |    0.00 |    0.00 |    0.00
att_rewards |    0.00 |    0.00 |    0.00 |    0.00
att_penalty |    0.00 |    0.00 |    0.00 |    0.00
attitude |   -0.05   -0.10   -0.09 |    1.14    0.66    1.81 |   -3.14   -1.57   -3.14 |    3.14    1.54    3.14
w        |    0.00    0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.10   -0.05 |    0.67    1.81 |   -1.55   -3.12 |    1.54    3.14
w_f      |    0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.

ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0016   0.0009   0.0035   5.4889   2.1784   2.1397
Update Cnt = 2790    ET =   1230.6   Stats:  Mean, Std, Min, Max
r_f      |   -3.53   -5.11  -18.13 |  184.56  174.55  196.79 | -371.95 -365.07 -391.12 |  384.24  386.19  379.56
v_f      |   -0.00    0.00    0.01 |    0.04    0.04    0.05 |   -0.09   -0.09   -0.10 |    0.10    0.10    0.09
r_i      |  -23.46   -5.52  -84.26 |  679.89  658.74  758.93 |-1348.86-1229.45-1350.66 | 1369.15 1311.60 1277.23
v_i      |    0.00    0.00    0.00 |    0.04    0.04    0.05 |   -0.10   -0.09   -0.09 |    0.09    0.09    0.09
norm_rf  |    0.18 |    0.08 |    0.02 |    0.46
norm_vf  |    0.07 |    0.01 |    0.05 |    0.12
gs_f     |    1.14 |    1.37 |    0.01 |   14.64
thrust   |    0.00   -0.00   -0.00 |    0.67    0.68    0.68 |   -3.46   -3.43   -3.46 |    3.41    3.41    3.46
norm_thrust |    0.88 |    0.77 |    0.00 |    3.46
fuel     |    1.49 |    0.18 |    1.03 |    2.06
rewards  |  -11.81 

ADV1:  0.0012897526039192392 0.008238099097952048 0.039113284472702625 -0.0625551257226454
ADV2:  0.01437534714090114 0.8378625591997972 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.8339   1.1237   5.7757  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0021   0.0011   0.0039   5.4889   2.1784   2.1397
***** Episode 86806, Mean R = -10.8  Std R = 4.7  Min R = -25.2
PolicyLoss: -0.0307
Policy_Beta: 0.1
Policy_Entropy: 0.177
Policy_KL: 0.000742
Policy_SD: 0.515
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 3.18e+07
VF_0_ExplainedVarNew: 0.967
VF_0_ExplainedVarOld: 0.963
VF_0_Loss : 0.000155


ADV1:  -0.001238404907440419 0.007309432195943314 0.03960920713338184 -0.06170225170214261
ADV2:  0.04282260073270082 0.8054878224565581 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.9855   1.2950   5.6709  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0019   0.0011   0.0040   5.4889   2.1784   2.139

ADV1:  -0.002167190842489467 0.008729934077849633 0.028546298770568468 -0.07186152715658595
ADV2:  0.04579663543282724 0.8466040696496852 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.8300   0.9333   5.0104  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0023   0.0014   0.0056   5.4889   2.1784   2.1397
***** Episode 87085, Mean R = -11.0  Std R = 4.2  Min R = -20.8
PolicyLoss: -0.0336
Policy_Beta: 0.1
Policy_Entropy: 0.179
Policy_KL: 0.000796
Policy_SD: 0.51
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 3.19e+07
VF_0_ExplainedVarNew: 0.966
VF_0_ExplainedVarOld: 0.961
VF_0_Loss : 6.85e-05


ADV1:  -0.0001737873237667577 0.005606931377798285 0.047018789052857723 -0.046419461242741746
ADV2:  0.005843480135768038 0.8988790607273086 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.5913   1.5411   5.5057  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0008   0.0005   0.0017   5.4889   2.1784   2

ADV1:  0.0018841746226866305 0.005254997127467997 0.026404850676470405 -0.05749623816092475
ADV2:  -0.01784402643016746 0.9158751630676463 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.7485   0.7314   4.1039  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0023   0.0014   0.0049   5.4889   2.1784   2.1397
***** Episode 87364, Mean R = -9.5  Std R = 3.1  Min R = -16.6
PolicyLoss: -0.0118
Policy_Beta: 0.1
Policy_Entropy: 0.177
Policy_KL: 0.000923
Policy_SD: 0.514
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 3.2e+07
VF_0_ExplainedVarNew: 0.988
VF_0_ExplainedVarOld: 0.984
VF_0_Loss : 0.000454


ADV1:  -0.0005625492176464762 0.006167379417529236 0.043221153222812836 -0.10266335753112221
ADV2:  0.025275377297515868 0.8291512174122402 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.8019   0.7140   3.2095  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0008   0.0004   0.0018   5.4889   2.1784   2.

ADV1:  -0.0008357335959026821 0.009585695324255728 0.03958045480330141 -0.06725865988596424
ADV2:  0.027311630509412113 0.8802514927843771 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   3.7832   2.0418   8.2646  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0009   0.0005   0.0022   5.4889   2.1784   2.1397
***** Episode 87643, Mean R = -11.5  Std R = 4.4  Min R = -24.4
PolicyLoss: -0.0252
Policy_Beta: 0.1
Policy_Entropy: 0.178
Policy_KL: 0.00101
Policy_SD: 0.513
Policy_lr_mult: 0.198
Steps: 1.18e+04
TotalSteps: 3.21e+07
VF_0_ExplainedVarNew: 0.952
VF_0_ExplainedVarOld: 0.947
VF_0_Loss : 0.00149


ADV1:  0.003210351921659073 0.0054893614818944635 0.031498925335994965 -0.04481263161083221
ADV2:  -0.03226964252786141 0.9126340954796158 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.3992   0.8434   3.9887  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0037   0.0022   0.0083   5.4889   2.1784   2.1

***** Episode 87891, Mean R = -11.6  Std R = 5.0  Min R = -24.7
PolicyLoss: -0.000768
Policy_Beta: 0.1
Policy_Entropy: 0.18
Policy_KL: 0.000943
Policy_SD: 0.527
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 3.22e+07
VF_0_ExplainedVarNew: 0.991
VF_0_ExplainedVarOld: 0.988
VF_0_Loss : 0.000964


ADV1:  -0.003158348127375604 0.007501184885274455 0.02764489718054547 -0.05184276251995594
ADV2:  0.05276212593617195 0.8681702869404132 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.2645   0.8799   4.0460  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0037   0.0022   0.0083   5.4889   2.1784   2.1397
***** Episode 87922, Mean R = -11.2  Std R = 4.6  Min R = -22.7
PolicyLoss: -0.0276
Policy_Beta: 0.1
Policy_Entropy: 0.179
Policy_KL: 0.000823
Policy_SD: 0.521
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 3.22e+07
VF_0_ExplainedVarNew: 0.974
VF_0_ExplainedVarOld: 0.971
VF_0_Loss : 0.00109


ADV1:  0.0009016108819996004 0.006788074869419824 0.

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.6263   0.5981   3.3378  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0014   0.0008   0.0030   5.4889   2.1784   2.1397
***** Episode 88170, Mean R = -11.2  Std R = 4.1  Min R = -23.5
PolicyLoss: -0.0345
Policy_Beta: 0.1
Policy_Entropy: 0.177
Policy_KL: 0.000853
Policy_SD: 0.532
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 3.23e+07
VF_0_ExplainedVarNew: 0.982
VF_0_ExplainedVarOld: 0.98
VF_0_Loss : 0.00012


ADV1:  -0.0014536088832399112 0.007836373034615042 0.03955552160739903 -0.06917630648328049
ADV2:  0.03121805574296947 0.8774058458691787 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.4909   1.6032   6.6480  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0018   0.0011   0.0041   5.4889   2.1784   2.1397
***** Episode 88201, Mean R = -11.4  Std R = 5.1  Min R = -26.6
PolicyLoss: -0.0237
Policy_Beta: 0.1
Policy_Entropy: 0.177
Policy_KL: 0.00114
Pol

ADV1:  -0.0014623012517917587 0.005816434864921713 0.062474551703249004 -0.08402408790933685
ADV2:  0.02944347933822428 0.8641183678112698 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   6.3970   3.2595  12.5034  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0016   0.0010   0.0038   5.4889   2.1784   2.1397
***** Episode 88449, Mean R = -10.8  Std R = 3.7  Min R = -19.2
PolicyLoss: -0.0156
Policy_Beta: 0.1
Policy_Entropy: 0.18
Policy_KL: 0.00112
Policy_SD: 0.511
Policy_lr_mult: 0.198
Steps: 1.2e+04
TotalSteps: 3.24e+07
VF_0_ExplainedVarNew: 0.985
VF_0_ExplainedVarOld: 0.982
VF_0_Loss : 0.000121


ADV1:  0.0011835406278810899 0.00544628671323809 0.060005066759367565 -0.06348182002535285
ADV2:  -0.025571384877608235 0.8533830158041661 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.0557   0.9623   3.9885  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0015   0.0009   0.0032   5.4889   2.1784   2.13

ADV1:  0.0021611237072382485 0.007953226138493063 0.03774202680971506 -0.12038959409835887
ADV2:  0.01662121868254125 0.7827737856354521 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.1178   1.3407   6.8404  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0023   0.0015   0.0056   5.4889   2.1784   2.1397
***** Episode 88728, Mean R = -12.4  Std R = 5.9  Min R = -37.7
PolicyLoss: -0.0375
Policy_Beta: 0.1
Policy_Entropy: 0.177
Policy_KL: 0.000787
Policy_SD: 0.523
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 3.25e+07
VF_0_ExplainedVarNew: 0.982
VF_0_ExplainedVarOld: 0.976
VF_0_Loss : 6.84e-05


Dynamics: Max Disturbance (m/s^2):  [0.00138293 0.00181235 0.00221757] 0.0031803638227355514
ADV1:  -0.002001053711255426 0.006334251661145944 0.06754031708856292 -0.0640541934457981
ADV2:  0.01727347312798488 0.8587961607173545 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.2630   0.4643   2.6150  24.5266  15.5251  10.0673
ValFun  G

theta_cv |    0.23 |    0.25 |    0.00 |    1.66
seeker_angles |    0.01    0.00 |    0.08    0.08 |   -0.98   -0.96 |    0.98    0.99
cs_angles |  0.0060  0.0031 |  0.0781  0.0776 | -0.9778 -0.9612 |  0.9766  0.9856
optical_flow | -0.0000 -0.0000 |  0.0246  0.0233 | -1.0152 -1.1592 |  1.1422  1.2403
v_err    | -0.0102 |  0.0580 | -0.4524 |  0.1166
landing_rewards |    9.58 |    2.00 |    0.00 |   10.00
landing_margin |   -0.03 |    0.01 |   -0.06 |    0.02
tracking_rewards |  -16.87 |    4.09 |  -42.86 |   -9.61
steps    |     377 |      20 |     333 |     416
***** Episode 89007, Mean R = -11.0  Std R = 4.1  Min R = -17.9
PolicyLoss: -0.029
Policy_Beta: 0.1
Policy_Entropy: 0.178
Policy_KL: 0.00106
Policy_SD: 0.522
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 3.26e+07
VF_0_ExplainedVarNew: 0.98
VF_0_ExplainedVarOld: 0.976
VF_0_Loss : 0.000336


Dynamics: Max Disturbance (m/s^2):  [0.00138293 0.00181235 0.00221757] 0.0031803638227355514
ADV1:  -0.0006945701907017835 0.004972632732

w        |    0.00    0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.01    0.08 |    0.65    1.93 |   -1.49   -3.13 |    1.48    3.12
w_f      |    0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.02   -0.02   -0.02 |    0.03    0.04    0.02
w_rewards |    0.00 |    0.00 |    0.00 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.23 |    0.25 |    0.00 |    1.48
seeker_angles |    0.01    0.00 |    0.07    0.08 |   -0.97   -0.99 |    0.99    1.00
cs_angles |  0.0053  0.0032 |  0.0720  0.0803 | -0.9703 -0.9887 |  0.9936  0.9964
optical_flow | -0.0000 -0.0000 |  0.0243  0.0238 | -1.1594 -1.0003 |  1.3050  1.0636
v_err    | -0.0104 |  0.0583 | -0.4525 |  0.0961
landing_rewards |    9.74 |    1.59 |    0.00 |   10.00
landing_margin |   -0.03 |    0.01 |   -0.07 |    0.03
tracking_rewards |  -16.66 |    3.87 |  -31.39 |   -8.83
steps    |     377 |  

w        |    0.00    0.00   -0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.01   -0.12 |    0.67    1.85 |   -1.47   -3.11 |    1.55    3.13
w_f      |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.02   -0.02   -0.03 |    0.02    0.02    0.02
w_rewards |    0.00 |    0.00 |    0.00 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.23 |    0.25 |    0.00 |    1.55
seeker_angles |    0.00    0.00 |    0.07    0.08 |   -0.99   -0.99 |    0.99    1.00
cs_angles |  0.0037  0.0017 |  0.0747  0.0763 | -0.9852 -0.9887 |  0.9931  0.9991
optical_flow |  0.0001  0.0000 |  0.0243  0.0216 | -1.1768 -1.0622 |  1.2990  0.7992
v_err    | -0.0104 |  0.0581 | -0.4524 |  0.1010
landing_rewards |    9.77 |    1.49 |    0.00 |   10.00
landing_margin |   -0.03 |    0.01 |   -0.06 |    0.01
tracking_rewards |  -16.53 |    3.62 |  -29.28 |   -9.97
steps    |     378 |  

attitude |    0.01   -0.06   -0.08 |    1.17    0.64    1.85 |   -3.14   -1.56   -3.14 |    3.14    1.54    3.14
w        |    0.00    0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.05   -0.12 |    0.65    1.84 |   -1.56   -3.13 |    1.52    3.11
w_f      |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.02   -0.02   -0.02 |    0.02    0.03    0.02
w_rewards |   -0.00 |    0.00 |   -0.01 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.23 |    0.25 |    0.00 |    1.47
seeker_angles |    0.00   -0.00 |    0.08    0.08 |   -0.99   -1.00 |    1.00    1.00
cs_angles |  0.0028 -0.0003 |  0.0755  0.0800 | -0.9950 -0.9993 |  0.9993  0.9982
optical_flow | -0.0000 -0.0001 |  0.0243  0.0230 | -1.1345 -1.0985 |  0.9932  1.0154
v_err    | -0.0103 |  0.0580 | -0.4527 |  0.1059
landing_rewards |    9.65 |    1.85 |    0.00 |   10.00
landing_margin |   -0

w        |    0.00   -0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.00    0.06 |    0.68    1.87 |   -1.46   -3.14 |    1.52    3.13
w_f      |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.02   -0.02   -0.02 |    0.02    0.02    0.02
w_rewards |    0.00 |    0.00 |    0.00 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.23 |    0.26 |    0.00 |    1.52
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -0.99   -0.99 |    0.99    1.00
cs_angles |  0.0012  0.0032 |  0.0757  0.0803 | -0.9869 -0.9927 |  0.9912  0.9982
optical_flow |  0.0001 -0.0001 |  0.0248  0.0235 | -1.1298 -1.2622 |  1.0567  1.2179
v_err    | -0.0102 |  0.0579 | -0.4527 |  0.1059
landing_rewards |    9.52 |    2.15 |    0.00 |   10.00
landing_margin |   -0.02 |    0.01 |   -0.06 |    0.01
tracking_rewards |  -16.93 |    3.75 |  -28.70 |  -10.15
steps    |     378 |  

attitude |    0.08    0.02   -0.10 |    1.09    0.60    1.83 |   -3.14   -1.45   -3.14 |    3.14    1.49    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.03   -0.08 |    0.61    1.83 |   -1.45   -3.11 |    1.41    3.13
w_f      |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.02   -0.02   -0.02 |    0.02    0.02    0.02
w_rewards |   -0.00 |    0.00 |   -0.02 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.23 |    0.25 |    0.00 |    1.47
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -1.00   -0.96 |    1.00    0.98
cs_angles |  0.0021  0.0007 |  0.0760  0.0776 | -0.9987 -0.9625 |  0.9990  0.9837
optical_flow | -0.0000  0.0000 |  0.0242  0.0231 | -1.1378 -1.3842 |  1.1234  1.2400
v_err    | -0.0100 |  0.0579 | -0.4528 |  0.1026
landing_rewards |    9.61 |    1.93 |    0.00 |   10.00
landing_margin |   -0

attitude |   -0.10   -0.01    0.09 |    1.12    0.66    1.79 |   -3.14   -1.57   -3.14 |    3.14    1.54    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.00    0.03 |    0.66    1.80 |   -1.48   -3.13 |    1.45    3.13
w_f      |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.02   -0.02   -0.02 |    0.03    0.02    0.02
w_rewards |   -0.00 |    0.00 |   -0.01 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.23 |    0.26 |    0.00 |    1.47
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -0.99   -1.00 |    1.00    1.00
cs_angles |  0.0019  0.0014 |  0.0764  0.0810 | -0.9865 -0.9975 |  0.9986  0.9995
optical_flow |  0.0001 -0.0000 |  0.0244  0.0231 | -1.2033 -1.1477 |  1.0541  1.2673
v_err    | -0.0098 |  0.0581 | -0.4523 |  0.1037
landing_rewards |    9.71 |    1.68 |    0.00 |   10.00
landing_margin |   -0

attitude |   -0.01   -0.02    0.02 |    1.24    0.66    1.91 |   -3.14   -1.56   -3.14 |    3.14    1.57    3.14
w        |    0.00   -0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.02    0.00 |    0.67    1.90 |   -1.51   -3.14 |    1.50    3.12
w_f      |    0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.02 |    0.02    0.02    0.02
w_rewards |    0.00 |    0.00 |    0.00 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.24 |    0.26 |    0.00 |    1.67
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -1.00   -0.98 |    1.00    1.00
cs_angles |  0.0020  0.0005 |  0.0787  0.0806 | -0.9957 -0.9795 |  0.9988  0.9999
optical_flow |  0.0001  0.0001 |  0.0240  0.0222 | -1.0367 -1.0790 |  1.1900  1.1548
v_err    | -0.0100 |  0.0581 | -0.4536 |  0.1080
landing_rewards |    9.55 |    2.08 |    0.00 |   10.00
landing_margin |   -0

attitude |    0.10    0.05    0.17 |    1.11    0.67    1.77 |   -3.14   -1.56   -3.14 |    3.14    1.55    3.14
w        |    0.00    0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.06    0.13 |    0.67    1.78 |   -1.48   -3.14 |    1.40    3.13
w_f      |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.02   -0.02   -0.02 |    0.02    0.02    0.02
w_rewards |   -0.00 |    0.00 |   -0.00 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.23 |    0.25 |    0.00 |    1.56
seeker_angles |    0.00   -0.00 |    0.08    0.08 |   -0.98   -0.99 |    1.00    1.00
cs_angles |  0.0011 -0.0002 |  0.0759  0.0796 | -0.9823 -0.9878 |  1.0000  0.9958
optical_flow |  0.0001  0.0001 |  0.0251  0.0241 | -1.0746 -1.1055 |  1.1837  1.1131
v_err    | -0.0103 |  0.0584 | -0.4529 |  0.1155
landing_rewards |    9.58 |    2.00 |    0.00 |   10.00
landing_margin |   -0

norm_thrust |    0.88 |    0.76 |    0.00 |    3.46
fuel     |    1.47 |    0.18 |    1.00 |    2.16
rewards  |  -11.19 |    5.07 |  -36.54 |   -3.21
fuel_rewards |   -4.22 |    0.53 |   -6.18 |   -2.86
glideslope_rewards |    0.00 |    0.00 |    0.00 |    0.00
glideslope_penalty |    0.00 |    0.00 |    0.00 |    0.00
glideslope |    2.82 |   12.65 |    0.01 |  405.69
norm_af  |    1.73 |    0.90 |    0.07 |    3.30
norm_wf  |    0.01 |    0.01 |    0.00 |    0.03
rh_penalty |    0.00 |    0.00 |    0.00 |    0.00
att_rewards |    0.00 |    0.00 |    0.00 |    0.00
att_penalty |    0.00 |    0.00 |    0.00 |    0.00
attitude |    0.06    0.02    0.10 |    1.13    0.64    1.83 |   -3.14   -1.56   -3.14 |    3.14    1.55    3.14
w        |    0.00    0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.03    0.03 |    0.63    1.84 |   -1.49   -3.13 |    1.34    3.14
w_f      |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.

ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0012   0.0007   0.0025   5.4889   2.1784   2.1397
Update Cnt = 2970    ET =   1060.1   Stats:  Mean, Std, Min, Max
r_f      |    8.32   -1.19   14.97 |  183.43  171.08  201.04 | -384.27 -355.97 -379.84 |  398.29  380.78  390.18
v_f      |   -0.00   -0.00   -0.00 |    0.04    0.04    0.05 |   -0.09   -0.09   -0.09 |    0.10    0.09    0.10
r_i      |   72.50    9.31   29.65 |  674.11  647.28  778.37 |-1325.94-1251.56-1305.48 | 1334.13 1243.86 1357.11
v_i      |   -0.00   -0.00   -0.00 |    0.04    0.04    0.05 |   -0.09   -0.10   -0.10 |    0.09    0.09    0.09
norm_rf  |    0.18 |    0.07 |    0.04 |    0.52
norm_vf  |    0.08 |    0.01 |    0.04 |    0.12
gs_f     |    1.63 |    5.06 |    0.01 |   79.58
thrust   |    0.00   -0.01    0.00 |    0.68    0.68    0.69 |   -3.42   -3.40   -3.45 |    3.40    3.31    3.45
norm_thrust |    0.90 |    0.77 |    0.00 |    3.46
fuel     |    1.51 |    0.19 |    1.01 |    2.23
rewards  |  -11.56 

ADV1:  0.0001049817210646039 0.007964188538312003 0.04009215447401382 -0.06161568492157503
ADV2:  0.025452713094888973 0.8463408900185585 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.7947   1.8513   8.2010  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0003   0.0001   0.0006   5.4889   2.1784   2.1397
***** Episode 92386, Mean R = -10.6  Std R = 3.9  Min R = -18.8
PolicyLoss: -0.0311
Policy_Beta: 0.1
Policy_Entropy: 0.178
Policy_KL: 0.000974
Policy_SD: 0.53
Policy_lr_mult: 0.198
Steps: 1.18e+04
TotalSteps: 3.39e+07
VF_0_ExplainedVarNew: 0.967
VF_0_ExplainedVarOld: 0.963
VF_0_Loss : 0.000237


ADV1:  0.0010110912104857644 0.00604535988558545 0.03971596341372241 -0.06911924732705987
ADV2:  -0.004287034179596044 0.8911668472160802 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.0055   1.1824   5.1933  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0012   0.0007   0.0027   5.4889   2.1784   2.13

***** Episode 92634, Mean R = -11.3  Std R = 4.6  Min R = -21.8
PolicyLoss: -0.0124
Policy_Beta: 0.1
Policy_Entropy: 0.179
Policy_KL: 0.000875
Policy_SD: 0.537
Policy_lr_mult: 0.198
Steps: 1.18e+04
TotalSteps: 3.4e+07
VF_0_ExplainedVarNew: 0.983
VF_0_ExplainedVarOld: 0.979
VF_0_Loss : 0.00148


ADV1:  0.0007948286326162749 0.005167053110658103 0.03486175156417998 -0.06352115460626628
ADV2:  -0.004289185621789982 0.8900365255556815 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   4.2394   2.8043  10.9005  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0010   0.0006   0.0021   5.4889   2.1784   2.1397
***** Episode 92665, Mean R = -11.1  Std R = 4.9  Min R = -23.9
PolicyLoss: -0.0107
Policy_Beta: 0.1
Policy_Entropy: 0.179
Policy_KL: 0.00122
Policy_SD: 0.538
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 3.4e+07
VF_0_ExplainedVarNew: 0.991
VF_0_ExplainedVarOld: 0.988
VF_0_Loss : 0.000702


ADV1:  -0.0023260573771334415 0.008679654618197273 0.0

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.3239   1.1664   5.7279  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0020   0.0012   0.0042   5.4889   2.1784   2.1397
***** Episode 92913, Mean R = -12.3  Std R = 5.7  Min R = -30.3
PolicyLoss: -0.0372
Policy_Beta: 0.1
Policy_Entropy: 0.178
Policy_KL: 0.00104
Policy_SD: 0.546
Policy_lr_mult: 0.198
Steps: 1.2e+04
TotalSteps: 3.41e+07
VF_0_ExplainedVarNew: 0.977
VF_0_ExplainedVarOld: 0.973
VF_0_Loss : 0.0013


ADV1:  0.001179588544363944 0.007247519629926961 0.04386484735003282 -0.05289378878181796
ADV2:  0.012162235344912361 0.8494730098818233 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.3956   1.4144   7.3473  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0016   0.0010   0.0034   5.4889   2.1784   2.1397
***** Episode 92944, Mean R = -12.5  Std R = 6.4  Min R = -36.6
PolicyLoss: -0.0258
Policy_Beta: 0.1
Policy_Entropy: 0.176
Policy_KL: 0.000968
Polic

ADV1:  -0.00016184750026065228 0.006523950436416184 0.03352255569988355 -0.057124720928791894
ADV2:  0.0241603087101137 0.8445166139910928 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.4093   1.0063   4.2532  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0002   0.0001   0.0005   5.4889   2.1784   2.1397
***** Episode 93192, Mean R = -10.9  Std R = 4.6  Min R = -24.2
PolicyLoss: -0.027
Policy_Beta: 0.1
Policy_Entropy: 0.177
Policy_KL: 0.00118
Policy_SD: 0.54
Policy_lr_mult: 0.198
Steps: 1.18e+04
TotalSteps: 3.42e+07
VF_0_ExplainedVarNew: 0.979
VF_0_ExplainedVarOld: 0.976
VF_0_Loss : 0.000104


ADV1:  0.0012678199325785872 0.006385121882420469 0.0430401183878506 -0.06776409732769167
ADV2:  0.004686956834668853 0.8661245743997843 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.7255   0.8162   3.4448  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0014   0.0008   0.0034   5.4889   2.1784   2.1397

ADV1:  0.0003185134584729123 0.005500376782814448 0.0625286133123904 -0.06080084220144538
ADV2:  -0.0006377910109958214 0.8699809545663281 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   3.2010   1.9861   8.8556  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0003   0.0002   0.0008   5.4889   2.1784   2.1397
***** Episode 93471, Mean R = -11.1  Std R = 3.3  Min R = -17.4
PolicyLoss: -0.0069
Policy_Beta: 0.1
Policy_Entropy: 0.175
Policy_KL: 0.00092
Policy_SD: 0.538
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 3.43e+07
VF_0_ExplainedVarNew: 0.99
VF_0_ExplainedVarOld: 0.986
VF_0_Loss : 2.31e-05


ADV1:  -4.575152390177009e-05 0.005127289062769854 0.041299636372798154 -0.0370651250793032
ADV2:  -0.00345035046813569 0.8942997407555237 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.3754   1.2767   4.8184  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0002   0.0001   0.0004   5.4889   2.1784   2.1

ADV1:  -0.002500057488781548 0.004959401400133797 0.048931736628975264 -0.045780450517233784
ADV2:  0.04013514888574011 0.8982013072462521 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.0271   0.9753   4.3493  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0027   0.0017   0.0066   5.4889   2.1784   2.1397
***** Episode 93750, Mean R = -11.5  Std R = 3.6  Min R = -18.1
PolicyLoss: -0.000212
Policy_Beta: 0.1
Policy_Entropy: 0.176
Policy_KL: 0.00102
Policy_SD: 0.548
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 3.44e+07
VF_0_ExplainedVarNew: 0.991
VF_0_ExplainedVarOld: 0.989
VF_0_Loss : 6.56e-05


ADV1:  -0.001995652126536715 0.0080715569460605 0.028607106259210036 -0.0656124062587849
ADV2:  0.04271335177863592 0.8459079843410816 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.2698   1.1121   6.3512  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0027   0.0015   0.0056   5.4889   2.1784   2.13

***** Episode 93998, Mean R = -10.8  Std R = 4.4  Min R = -22.1
PolicyLoss: -0.0056
Policy_Beta: 0.1
Policy_Entropy: 0.178
Policy_KL: 0.000967
Policy_SD: 0.529
Policy_lr_mult: 0.198
Steps: 1.18e+04
TotalSteps: 3.45e+07
VF_0_ExplainedVarNew: 0.988
VF_0_ExplainedVarOld: 0.986
VF_0_Loss : 0.000313


ADV1:  -0.0004463561882035415 0.00770639852677083 0.07643131588868152 -0.052904252034190136
ADV2:  0.0328119436793314 0.8091022124014924 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.4265   0.9397   5.0515  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0005   0.0003   0.0012   5.4889   2.1784   2.1397
***** Episode 94029, Mean R = -11.3  Std R = 5.0  Min R = -29.8
PolicyLoss: -0.0326
Policy_Beta: 0.1
Policy_Entropy: 0.179
Policy_KL: 0.000748
Policy_SD: 0.539
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 3.45e+07
VF_0_ExplainedVarNew: 0.974
VF_0_ExplainedVarOld: 0.97
VF_0_Loss : 0.00013


Dynamics: Max Disturbance (m/s^2):  [0.00138293 0.0018

***** Episode 94277, Mean R = -10.4  Std R = 4.4  Min R = -23.5
PolicyLoss: -0.0295
Policy_Beta: 0.1
Policy_Entropy: 0.178
Policy_KL: 0.000907
Policy_SD: 0.54
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 3.46e+07
VF_0_ExplainedVarNew: 0.978
VF_0_ExplainedVarOld: 0.973
VF_0_Loss : 0.000162


ADV1:  0.0008284129862799277 0.007675258272721823 0.045876181485030754 -0.05288447264831873
ADV2:  0.015849808278843677 0.8475775080696911 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   3.6948   1.5772   9.3607  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0010   0.0006   0.0022   5.4889   2.1784   2.1397
***** Episode 94308, Mean R = -12.8  Std R = 6.3  Min R = -36.7
PolicyLoss: -0.0279
Policy_Beta: 0.1
Policy_Entropy: 0.177
Policy_KL: 0.00104
Policy_SD: 0.552
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 3.46e+07
VF_0_ExplainedVarNew: 0.982
VF_0_ExplainedVarOld: 0.978
VF_0_Loss : 0.000196


Dynamics: Max Disturbance (m/s^2):  [0.00138293 0.00

seeker_angles |    0.00   -0.00 |    0.08    0.08 |   -0.98   -0.97 |    0.97    1.00
cs_angles |  0.0009 -0.0003 |  0.0778  0.0782 | -0.9787 -0.9746 |  0.9728  0.9996
optical_flow | -0.0001 -0.0000 |  0.0241  0.0227 | -1.0597 -1.0406 |  1.2197  1.1774
v_err    | -0.0100 |  0.0581 | -0.4528 |  0.0957
landing_rewards |    9.81 |    1.38 |    0.00 |   10.00
landing_margin |   -0.02 |    0.01 |   -0.05 |    0.01
tracking_rewards |  -16.70 |    4.38 |  -40.27 |   -9.33
steps    |     376 |      19 |     335 |     416
***** Episode 94587, Mean R = -12.4  Std R = 5.3  Min R = -26.4
PolicyLoss: -0.0278
Policy_Beta: 0.1
Policy_Entropy: 0.178
Policy_KL: 0.000846
Policy_SD: 0.543
Policy_lr_mult: 0.198
Steps: 1.15e+04
TotalSteps: 3.47e+07
VF_0_ExplainedVarNew: 0.963
VF_0_ExplainedVarOld: 0.957
VF_0_Loss : 0.000331


ADV1:  0.0016517739930009935 0.007982593950319068 0.06715327796990705 -0.08379827868012169
ADV2:  0.0075255669747665505 0.8137469159916995 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/M

attitude |    0.01   -0.05    0.11 |    1.21    0.65    1.89 |   -3.14   -1.51   -3.14 |    3.14    1.53    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.04    0.11 |    0.66    1.88 |   -1.51   -3.14 |    1.53    3.13
w_f      |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.02 |    0.03    0.02    0.02
w_rewards |    0.00 |    0.00 |    0.00 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.23 |    0.25 |    0.00 |    1.42
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -0.97   -0.99 |    0.99    1.00
cs_angles |  0.0024  0.0026 |  0.0751  0.0782 | -0.9687 -0.9912 |  0.9868  0.9958
optical_flow | -0.0000 -0.0000 |  0.0234  0.0242 | -1.2052 -1.2220 |  0.9716  1.2749
v_err    | -0.0099 |  0.0579 | -0.4511 |  0.1029
landing_rewards |    9.74 |    1.59 |    0.00 |   10.00
landing_margin |   -0

thrust   |    0.00    0.01    0.00 |    0.68    0.69    0.68 |   -3.42   -3.36   -3.43 |    3.44    3.34    3.34
norm_thrust |    0.90 |    0.77 |    0.00 |    3.46
fuel     |    1.53 |    0.19 |    1.09 |    2.09
rewards  |  -11.33 |    4.93 |  -32.46 |   -2.99
fuel_rewards |   -4.38 |    0.56 |   -6.00 |   -3.16
glideslope_rewards |    0.00 |    0.00 |    0.00 |    0.00
glideslope_penalty |    0.00 |    0.00 |    0.00 |    0.00
glideslope |    2.66 |   12.45 |    0.01 |  753.56
norm_af  |    1.70 |    0.91 |    0.05 |    3.33
norm_wf  |    0.01 |    0.00 |    0.00 |    0.03
rh_penalty |    0.00 |    0.00 |    0.00 |    0.00
att_rewards |    0.00 |    0.00 |    0.00 |    0.00
att_penalty |    0.00 |    0.00 |    0.00 |    0.00
attitude |    0.02   -0.08    0.11 |    1.17    0.68    1.79 |   -3.14   -1.52   -3.14 |    3.14    1.57    3.14
w        |    0.00    0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.09    0.05 |    0.68

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   3.0018   1.5088   7.1915  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0007   0.0004   0.0016   5.4889   2.1784   2.1397
Update Cnt = 3080    ET =   1001.5   Stats:  Mean, Std, Min, Max
r_f      |  -18.18    5.36   10.38 |  186.66  174.44  196.64 | -397.68 -382.65 -367.46 |  387.62  385.15  383.82
v_f      |    0.00   -0.00   -0.00 |    0.04    0.04    0.05 |   -0.08   -0.09   -0.09 |    0.09    0.14    0.11
r_i      |  -56.85   30.43   32.07 |  665.25  678.57  765.78 |-1311.74-1307.28-1329.76 | 1286.50 1304.12 1281.79
v_i      |    0.00   -0.00   -0.00 |    0.04    0.04    0.05 |   -0.09   -0.09   -0.10 |    0.10    0.09    0.10
norm_rf  |    0.18 |    0.08 |    0.03 |    0.44
norm_vf  |    0.08 |    0.01 |    0.04 |    0.14
gs_f     |    1.21 |    1.47 |    0.01 |   10.58
thrust   |   -0.00   -0.00   -0.00 |    0.68    0.68    0.69 |   -3.44   -3.44   -3.38 |    3.40    3.36    3.44
norm_thrust |    

ADV1:  0.0005931151669634423 0.005017921176956801 0.039134096900421994 -0.046884963073944796
ADV2:  0.0005407743869271967 0.8729400782850937 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.4782   0.9808   5.4516  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0017   0.0009   0.0031   5.4889   2.1784   2.1397
***** Episode 95796, Mean R = -10.9  Std R = 3.8  Min R = -22.1
PolicyLoss: -0.015
Policy_Beta: 0.1
Policy_Entropy: 0.18
Policy_KL: 0.000772
Policy_SD: 0.543
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 3.52e+07
VF_0_ExplainedVarNew: 0.99
VF_0_ExplainedVarOld: 0.988
VF_0_Loss : 0.00143


ADV1:  -0.0007402941498582082 0.00693229491677728 0.04092047196539081 -0.07482234417663097
ADV2:  0.030158243347109814 0.8357693889157964 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.8484   0.7524   3.2395  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0008   0.0005   0.0019   5.4889   2.1784   2.13

***** Episode 96044, Mean R = -11.6  Std R = 4.9  Min R = -24.2
PolicyLoss: -0.0251
Policy_Beta: 0.1
Policy_Entropy: 0.179
Policy_KL: 0.000729
Policy_SD: 0.539
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 3.53e+07
VF_0_ExplainedVarNew: 0.978
VF_0_ExplainedVarOld: 0.972
VF_0_Loss : 0.000101


ADV1:  -0.001945959440635077 0.007320550963028118 0.05895816194662579 -0.06943610021319435
ADV2:  0.03618812341220848 0.8607561968758195 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.3924   0.8071   4.4824  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0021   0.0014   0.0050   5.4889   2.1784   2.1397
***** Episode 96075, Mean R = -12.1  Std R = 5.9  Min R = -34.1
PolicyLoss: -0.0217
Policy_Beta: 0.1
Policy_Entropy: 0.178
Policy_KL: 0.000918
Policy_SD: 0.541
Policy_lr_mult: 0.198
Steps: 1.18e+04
TotalSteps: 3.53e+07
VF_0_ExplainedVarNew: 0.985
VF_0_ExplainedVarOld: 0.977
VF_0_Loss : 5.29e-05


ADV1:  0.0021655499173316457 0.00691974591946796 0.0

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.2630   0.7957   3.7349  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0012   0.0007   0.0032   5.4889   2.1784   2.1397
***** Episode 96323, Mean R = -12.6  Std R = 5.7  Min R = -24.0
PolicyLoss: -0.0285
Policy_Beta: 0.1
Policy_Entropy: 0.178
Policy_KL: 0.000704
Policy_SD: 0.538
Policy_lr_mult: 0.198
Steps: 1.18e+04
TotalSteps: 3.54e+07
VF_0_ExplainedVarNew: 0.98
VF_0_ExplainedVarOld: 0.976
VF_0_Loss : 6.68e-05


ADV1:  -0.0008604516576175527 0.006919732023191408 0.04442127070928026 -0.054731573492576326
ADV2:  0.023251231293801817 0.8755810028566637 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.5981   1.0034   5.3030  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0014   0.0008   0.0030   5.4889   2.1784   2.1397
***** Episode 96354, Mean R = -12.3  Std R = 6.6  Min R = -29.7
PolicyLoss: -0.02
Policy_Beta: 0.1
Policy_Entropy: 0.178
Policy_KL: 0.00102
Po

ADV1:  0.0012668462287084717 0.004890325145905439 0.04526032108812744 -0.03195673343343661
ADV2:  -0.012775895097017357 0.9249427279805876 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   3.6898   2.1388  10.2442  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0016   0.0010   0.0035   5.4889   2.1784   2.1397
***** Episode 96602, Mean R = -10.3  Std R = 3.3  Min R = -18.5
PolicyLoss: -0.00546
Policy_Beta: 0.1
Policy_Entropy: 0.177
Policy_KL: 0.000829
Policy_SD: 0.535
Policy_lr_mult: 0.198
Steps: 1.18e+04
TotalSteps: 3.55e+07
VF_0_ExplainedVarNew: 0.99
VF_0_ExplainedVarOld: 0.988
VF_0_Loss : 3.2e-05


ADV1:  -0.003049297583815632 0.006149227721567838 0.027579341530878154 -0.06343724202850554
ADV2:  0.061422260800671764 0.8436976846230471 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   3.4009   2.0217  10.8425  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0037   0.0021   0.0081   5.4889   2.1784   2.

ADV1:  0.0016072966697374478 0.006255940168879368 0.03123855346653709 -0.06999123810163771
ADV2:  -0.004495449153948618 0.8823174970840615 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.7130   0.6991   3.3378  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0023   0.0013   0.0044   5.4889   2.1784   2.1397
***** Episode 96881, Mean R = -10.5  Std R = 4.7  Min R = -26.2
PolicyLoss: -0.018
Policy_Beta: 0.1
Policy_Entropy: 0.178
Policy_KL: 0.000921
Policy_SD: 0.533
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 3.56e+07
VF_0_ExplainedVarNew: 0.984
VF_0_ExplainedVarOld: 0.98
VF_0_Loss : 0.00053


ADV1:  -0.0007009557248225922 0.005348183195878091 0.04574183436659679 -0.057392150377279294
ADV2:  0.019067856922549243 0.8788665946174375 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.0220   1.2751   6.6872  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0012   0.0007   0.0025   5.4889   2.1784   2.1

ADV1:  0.0014567149571025836 0.004850033120062308 0.03956272226614438 -0.07422799424549897
ADV2:  -0.016474469263497823 0.8641870227969678 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.0554   0.9383   4.9979  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0016   0.0010   0.0038   5.4889   2.1784   2.1397
***** Episode 97160, Mean R = -11.7  Std R = 4.7  Min R = -27.2
PolicyLoss: -0.0108
Policy_Beta: 0.1
Policy_Entropy: 0.18
Policy_KL: 0.000799
Policy_SD: 0.54
Policy_lr_mult: 0.198
Steps: 1.18e+04
TotalSteps: 3.57e+07
VF_0_ExplainedVarNew: 0.993
VF_0_ExplainedVarOld: 0.99
VF_0_Loss : 1.77e-05


ADV1:  -0.004092536540347869 0.011422960669949116 0.02795334117801429 -0.08101288922902006
ADV2:  0.04473493402655538 0.9099988749735318 2.7319482977444123 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.5153   1.2447   6.6094  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0047   0.0029   0.0108   5.4889   

***** Episode 97408, Mean R = -11.0  Std R = 4.0  Min R = -19.8
PolicyLoss: -0.00514
Policy_Beta: 0.1
Policy_Entropy: 0.181
Policy_KL: 0.00115
Policy_SD: 0.524
Policy_lr_mult: 0.198
Steps: 1.19e+04
TotalSteps: 3.58e+07
VF_0_ExplainedVarNew: 0.991
VF_0_ExplainedVarOld: 0.989
VF_0_Loss : 2.48e-05


ADV1:  -0.0019806142757193305 0.006779119605432199 0.046207839954820085 -0.06151448001594166
ADV2:  0.048227562075324276 0.8089490344986774 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.3523   0.5345   2.6168  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0024   0.0014   0.0052   5.4889   2.1784   2.1397
***** Episode 97439, Mean R = -11.5  Std R = 5.0  Min R = -24.0
PolicyLoss: -0.0301
Policy_Beta: 0.1
Policy_Entropy: 0.18
Policy_KL: 0.000971
Policy_SD: 0.53
Policy_lr_mult: 0.198
Steps: 1.18e+04
TotalSteps: 3.58e+07
VF_0_ExplainedVarNew: 0.98
VF_0_ExplainedVarOld: 0.978
VF_0_Loss : 4.48e-05


ADV1:  -0.00010803484740535 0.008989552906886642 0.0

***** Episode 97687, Mean R = -10.0  Std R = 3.2  Min R = -19.5
PolicyLoss: -0.0219
Policy_Beta: 0.1
Policy_Entropy: 0.178
Policy_KL: 0.000851
Policy_SD: 0.518
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 3.59e+07
VF_0_ExplainedVarNew: 0.978
VF_0_ExplainedVarOld: 0.972
VF_0_Loss : 4.42e-05


ADV1:  -0.0016659619081742772 0.008197497338128319 0.02844858229160313 -0.06987744615158975
ADV2:  0.04339843983058777 0.8406795499104741 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.8926   1.3200   6.5697  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0027   0.0016   0.0059   5.4889   2.1784   2.1397
***** Episode 97718, Mean R = -13.0  Std R = 6.2  Min R = -29.8
PolicyLoss: -0.032
Policy_Beta: 0.1
Policy_Entropy: 0.181
Policy_KL: 0.00115
Policy_SD: 0.541
Policy_lr_mult: 0.198
Steps: 1.18e+04
TotalSteps: 3.59e+07
VF_0_ExplainedVarNew: 0.977
VF_0_ExplainedVarOld: 0.973
VF_0_Loss : 5.7e-05


ADV1:  0.0004944813424539124 0.005174795038341465 0.03

cs_angles | -0.0006  0.0030 |  0.0759  0.0763 | -0.9954 -0.9764 |  0.9846  0.9447
optical_flow |  0.0000  0.0000 |  0.0232  0.0230 | -1.0525 -1.1466 |  1.0919  1.0480
v_err    | -0.0105 |  0.0576 | -0.4522 |  0.1132
landing_rewards |    9.58 |    2.00 |    0.00 |   10.00
landing_margin |   -0.03 |    0.01 |   -0.07 |    0.03
tracking_rewards |  -16.65 |    3.88 |  -31.84 |   -9.39
steps    |     380 |      20 |     328 |     417
***** Episode 97997, Mean R = -11.7  Std R = 4.6  Min R = -22.7
PolicyLoss: -0.0348
Policy_Beta: 0.1
Policy_Entropy: 0.18
Policy_KL: 0.000796
Policy_SD: 0.53
Policy_lr_mult: 0.198
Steps: 1.19e+04
TotalSteps: 3.6e+07
VF_0_ExplainedVarNew: 0.972
VF_0_ExplainedVarOld: 0.969
VF_0_Loss : 8.03e-05


Dynamics: Max Disturbance (m/s^2):  [0.00138293 0.00181235 0.00221757] 0.0031803638227355514
ADV1:  0.0039580426225799435 0.005223247756184881 0.05011827603279956 -0.0649009058423839
ADV2:  -0.044620214941565615 0.8732706733835696 3.0 -3.0
Policy  Gradients: u/sd/Max/C Ma

attitude |   -0.10    0.00   -0.17 |    1.15    0.63    1.86 |   -3.14   -1.54   -3.14 |    3.14    1.53    3.14
w        |    0.00    0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.01   -0.14 |    0.63    1.86 |   -1.42   -3.13 |    1.37    3.11
w_f      |    0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.02 |    0.02    0.02    0.02
w_rewards |    0.00 |    0.00 |    0.00 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.23 |    0.25 |    0.00 |    1.67
seeker_angles |   -0.00    0.00 |    0.08    0.08 |   -0.98   -0.99 |    0.89    0.97
cs_angles | -0.0003  0.0011 |  0.0752  0.0802 | -0.9797 -0.9857 |  0.8940  0.9731
optical_flow | -0.0001 -0.0001 |  0.0240  0.0222 | -1.1793 -1.1381 |  1.1009  1.1092
v_err    | -0.0103 |  0.0575 | -0.4515 |  0.0953
landing_rewards |    9.77 |    1.49 |    0.00 |   10.00
landing_margin |   -0

w        |    0.00    0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.04    0.12 |    0.68    1.79 |   -1.48   -3.14 |    1.52    3.13
w_f      |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.02 |    0.03    0.03    0.02
w_rewards |    0.00 |    0.00 |    0.00 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.23 |    0.25 |    0.00 |    1.49
seeker_angles |   -0.00    0.00 |    0.08    0.08 |   -0.98   -0.95 |    0.99    0.98
cs_angles | -0.0013  0.0025 |  0.0759  0.0762 | -0.9842 -0.9456 |  0.9943  0.9841
optical_flow | -0.0001  0.0001 |  0.0252  0.0231 | -1.2475 -1.0740 |  1.1592  1.1522
v_err    | -0.0100 |  0.0579 | -0.4518 |  0.1016
landing_rewards |    9.58 |    2.00 |    0.00 |   10.00
landing_margin |   -0.02 |    0.01 |   -0.05 |    0.03
tracking_rewards |  -16.64 |    3.80 |  -31.12 |   -9.62
steps    |     380 |  

attitude |    0.03    0.02    0.18 |    1.16    0.66    1.87 |   -3.14   -1.56   -3.14 |    3.14    1.55    3.14
w        |    0.00    0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.03    0.27 |    0.65    1.86 |   -1.42   -3.11 |    1.51    3.12
w_f      |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.02   -0.02   -0.03 |    0.03    0.02    0.02
w_rewards |    0.00 |    0.00 |    0.00 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.23 |    0.25 |    0.00 |    1.40
seeker_angles |    0.00    0.00 |    0.07    0.08 |   -0.97   -0.99 |    1.00    0.99
cs_angles |  0.0018  0.0043 |  0.0747  0.0802 | -0.9651 -0.9931 |  0.9996  0.9876
optical_flow | -0.0000  0.0001 |  0.0239  0.0225 | -1.1933 -1.1204 |  1.1338  1.0350
v_err    | -0.0103 |  0.0581 | -0.4516 |  0.1078
landing_rewards |    9.52 |    2.15 |    0.00 |   10.00
landing_margin |   -0

attitude |    0.08   -0.05   -0.11 |    1.12    0.63    1.82 |   -3.14   -1.57   -3.14 |    3.14    1.55    3.14
w        |    0.00    0.00    0.00 |    0.00    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.04   -0.01 |    0.64    1.83 |   -1.48   -3.10 |    1.45    3.14
w_f      |    0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.02   -0.03   -0.02 |    0.03    0.02    0.02
w_rewards |    0.00 |    0.00 |    0.00 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.23 |    0.26 |    0.00 |    1.37
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -0.98   -0.99 |    0.97    1.00
cs_angles |  0.0001  0.0009 |  0.0765  0.0824 | -0.9822 -0.9868 |  0.9736  0.9951
optical_flow | -0.0000  0.0001 |  0.0233  0.0232 | -1.1509 -1.0556 |  1.1221  1.2092
v_err    | -0.0105 |  0.0580 | -0.4508 |  0.1073
landing_rewards |    9.71 |    1.68 |    0.00 |   10.00
landing_margin |   -0

w        |    0.00    0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.00   -0.12 |    0.64    1.76 |   -1.54   -3.10 |    1.51    3.14
w_f      |    0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.02 |    0.03    0.02    0.02
w_rewards |    0.00 |    0.00 |    0.00 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.23 |    0.25 |    0.00 |    1.59
seeker_angles |    0.00   -0.00 |    0.08    0.08 |   -1.00   -0.98 |    0.98    1.00
cs_angles |  0.0020 -0.0003 |  0.0763  0.0789 | -0.9978 -0.9761 |  0.9811  0.9983
optical_flow | -0.0000  0.0001 |  0.0244  0.0234 | -1.1800 -1.0289 |  0.9931  1.2081
v_err    | -0.0107 |  0.0585 | -0.4524 |  0.0931
landing_rewards |    9.81 |    1.38 |    0.00 |   10.00
landing_margin |   -0.03 |    0.01 |   -0.05 |    0.01
tracking_rewards |  -16.53 |    4.28 |  -37.30 |   -8.82
steps    |     376 |  

attitude |    0.09    0.01   -0.01 |    1.17    0.63    1.82 |   -3.14   -1.56   -3.14 |    3.14    1.57    3.14
w        |    0.00    0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.03   -0.02 |    0.63    1.82 |   -1.45   -3.14 |    1.52    3.13
w_f      |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.02 |    0.02    0.02    0.02
w_rewards |   -0.00 |    0.00 |   -0.01 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.23 |    0.25 |    0.00 |    1.89
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -1.00   -0.99 |    0.99    1.00
cs_angles |  0.0022  0.0042 |  0.0765  0.0765 | -0.9968 -0.9915 |  0.9929  0.9977
optical_flow |  0.0001 -0.0001 |  0.0228  0.0226 | -1.0195 -1.0414 |  1.1034  1.1932
v_err    | -0.0103 |  0.0581 | -0.4527 |  0.1096
landing_rewards |    9.65 |    1.85 |    0.00 |   10.00
landing_margin |   -0

w        |    0.00    0.00   -0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.01    0.05 |    0.63    1.80 |   -1.46   -3.14 |    1.52    3.12
w_f      |    0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.02   -0.02   -0.02 |    0.03    0.02    0.02
w_rewards |    0.00 |    0.00 |    0.00 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.23 |    0.25 |    0.00 |    1.37
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -0.96   -1.00 |    0.99    0.99
cs_angles |  0.0023  0.0032 |  0.0768  0.0785 | -0.9618 -0.9967 |  0.9915  0.9900
optical_flow |  0.0000 -0.0001 |  0.0232  0.0244 | -1.0982 -1.1761 |  1.0649  1.2008
v_err    | -0.0104 |  0.0585 | -0.4524 |  0.1054
landing_rewards |    9.68 |    1.77 |    0.00 |   10.00
landing_margin |   -0.03 |    0.01 |   -0.06 |    0.02
tracking_rewards |  -16.66 |    3.97 |  -31.21 |   -9.67
steps    |     377 |  

w        |    0.00    0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.01    0.03 |    0.68    1.79 |   -1.48   -3.14 |    1.48    3.14
w_f      |    0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.02   -0.02   -0.02 |    0.02    0.02    0.02
w_rewards |    0.00 |    0.00 |    0.00 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.23 |    0.25 |    0.00 |    1.55
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -1.00   -0.98 |    1.00    0.98
cs_angles |  0.0031  0.0016 |  0.0781  0.0767 | -0.9950 -0.9760 |  0.9977  0.9848
optical_flow | -0.0000  0.0000 |  0.0232  0.0229 | -0.9714 -0.9606 |  1.1195  0.9735
v_err    | -0.0105 |  0.0584 | -0.4520 |  0.1095
landing_rewards |    9.81 |    1.38 |    0.00 |   10.00
landing_margin |   -0.03 |    0.01 |   -0.06 |    0.01
tracking_rewards |  -16.73 |    4.23 |  -44.99 |   -9.60
steps    |     376 |  

thrust   |    0.00    0.00   -0.00 |    0.67    0.68    0.68 |   -3.45   -3.30   -3.40 |    3.41    3.45    3.43
norm_thrust |    0.88 |    0.76 |    0.00 |    3.46
fuel     |    1.49 |    0.18 |    1.13 |    2.18
rewards  |  -11.29 |    4.77 |  -34.47 |   -3.50
fuel_rewards |   -4.27 |    0.52 |   -6.25 |   -3.24
glideslope_rewards |    0.00 |    0.00 |    0.00 |    0.00
glideslope_penalty |    0.00 |    0.00 |    0.00 |    0.00
glideslope |    2.90 |   13.32 |    0.01 |  321.91
norm_af  |    1.74 |    0.85 |    0.15 |    3.26
norm_wf  |    0.01 |    0.01 |    0.00 |    0.03
rh_penalty |    0.00 |    0.00 |    0.00 |    0.00
att_rewards |    0.00 |    0.00 |    0.00 |    0.00
att_penalty |    0.00 |    0.00 |    0.00 |    0.00
attitude |    0.06    0.01   -0.04 |    1.15    0.69    1.82 |   -3.14   -1.57   -3.14 |    3.14    1.56    3.14
w        |    0.00    0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.02   -0.05 |    0.69

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.5204   1.2364   5.6113  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0016   0.0008   0.0031   5.4889   2.1784   2.1397
Update Cnt = 3260    ET =    916.4   Stats:  Mean, Std, Min, Max
r_f      |    0.21  -10.96   11.68 |  179.90  171.78  201.49 | -397.96 -384.18 -396.46 |  388.99  378.28  399.12
v_f      |   -0.00    0.00   -0.00 |    0.04    0.04    0.05 |   -0.09   -0.09   -0.09 |    0.10    0.11    0.10
r_i      |   -5.15  -24.47   34.90 |  666.19  651.82  782.18 |-1289.23-1314.70-1283.12 | 1234.60 1324.69 1271.78
v_i      |    0.00    0.00   -0.00 |    0.04    0.04    0.05 |   -0.09   -0.09   -0.09 |    0.09    0.09    0.09
norm_rf  |    0.16 |    0.07 |    0.02 |    0.45
norm_vf  |    0.08 |    0.01 |    0.04 |    0.12
gs_f     |    1.40 |    2.80 |    0.01 |   33.95
thrust   |   -0.00   -0.00   -0.00 |    0.67    0.68    0.67 |   -3.31   -3.44   -3.46 |    3.34    3.41    3.42
norm_thrust |    

ADV1:  -0.0006419061329206078 0.009293799602183126 0.029935269292914457 -0.06476826194854121
ADV2:  0.03510333635718541 0.8333006708482241 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.6681   1.1166   5.6836  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0014   0.0008   0.0033   5.4889   2.1784   2.1397
***** Episode 101376, Mean R = -10.6  Std R = 5.5  Min R = -25.6
PolicyLoss: -0.0347
Policy_Beta: 0.1
Policy_Entropy: 0.183
Policy_KL: 0.000807
Policy_SD: 0.525
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 3.73e+07
VF_0_ExplainedVarNew: 0.961
VF_0_ExplainedVarOld: 0.955
VF_0_Loss : 0.000247


ADV1:  0.0022479260230119746 0.006803985776800043 0.054517494781214204 -0.05049656858307666
ADV2:  -0.0038569201441113104 0.8649658444754968 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   5.1023   3.4352  14.8488  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0028   0.0018   0.0060   5.4889   2.1784 

***** Episode 101624, Mean R = -11.4  Std R = 4.6  Min R = -23.6
PolicyLoss: -0.0328
Policy_Beta: 0.1
Policy_Entropy: 0.183
Policy_KL: 0.000855
Policy_SD: 0.525
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 3.74e+07
VF_0_ExplainedVarNew: 0.974
VF_0_ExplainedVarOld: 0.97
VF_0_Loss : 0.000172


ADV1:  -3.736692408869866e-05 0.005646490091167928 0.05917483391921241 -0.05645844936926514
ADV2:  0.0025061070729238857 0.9069420536070161 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.3063   1.3672   6.0364  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0007   0.0004   0.0018   5.4889   2.1784   2.1397
***** Episode 101655, Mean R = -10.4  Std R = 3.6  Min R = -19.8
PolicyLoss: -0.00463
Policy_Beta: 0.1
Policy_Entropy: 0.182
Policy_KL: 0.00068
Policy_SD: 0.521
Policy_lr_mult: 0.198
Steps: 1.18e+04
TotalSteps: 3.74e+07
VF_0_ExplainedVarNew: 0.985
VF_0_ExplainedVarOld: 0.982
VF_0_Loss : 0.000108


ADV1:  0.0015772656740878832 0.00568398252760016

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.3480   0.5366   3.4464  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0010   0.0006   0.0025   5.4889   2.1784   2.1397
***** Episode 101903, Mean R = -11.0  Std R = 5.5  Min R = -26.1
PolicyLoss: -0.0338
Policy_Beta: 0.1
Policy_Entropy: 0.182
Policy_KL: 0.00209
Policy_SD: 0.531
Policy_lr_mult: 0.198
Steps: 1.15e+04
TotalSteps: 3.75e+07
VF_0_ExplainedVarNew: 0.977
VF_0_ExplainedVarOld: 0.975
VF_0_Loss : 0.000213


ADV1:  -0.001988403048087238 0.008782690032947111 0.030293692391206058 -0.06094723314881256
ADV2:  0.04558414291068375 0.8360339209354137 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.7622   1.2740   6.5936  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0023   0.0014   0.0051   5.4889   2.1784   2.1397
***** Episode 101934, Mean R = -12.4  Std R = 5.0  Min R = -27.4
PolicyLoss: -0.0342
Policy_Beta: 0.1
Policy_Entropy: 0.183
Policy_KL: 0.00104


ADV1:  0.0023547665098753463 0.005240234845020479 0.044403224700258176 -0.03534457631219662
ADV2:  -0.03835532649278139 0.9243999921758688 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.8576   0.8393   4.3461  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0027   0.0017   0.0061   5.4889   2.1784   2.1397
***** Episode 102182, Mean R = -10.0  Std R = 3.5  Min R = -17.2
PolicyLoss: 0.000863
Policy_Beta: 0.1
Policy_Entropy: 0.181
Policy_KL: 0.000716
Policy_SD: 0.526
Policy_lr_mult: 0.198
Steps: 1.18e+04
TotalSteps: 3.76e+07
VF_0_ExplainedVarNew: 0.987
VF_0_ExplainedVarOld: 0.984
VF_0_Loss : 0.000309


ADV1:  -0.0010197025108987145 0.00673225920555355 0.05417154242301919 -0.052299182640650754
ADV2:  0.0311611780714577 0.8452386675366684 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.3340   1.0442   5.9576  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0010   0.0007   0.0026   5.4889   2.1784   2

***** Episode 102430, Mean R = -11.6  Std R = 4.7  Min R = -25.0
PolicyLoss: -0.0165
Policy_Beta: 0.1
Policy_Entropy: 0.182
Policy_KL: 0.00077
Policy_SD: 0.528
Policy_lr_mult: 0.198
Steps: 1.19e+04
TotalSteps: 3.77e+07
VF_0_ExplainedVarNew: 0.991
VF_0_ExplainedVarOld: 0.988
VF_0_Loss : 0.00339


ADV1:  -0.0019305196411897566 0.007731265381139242 0.047382562089695324 -0.05104510553141206
ADV2:  0.038814331514110186 0.862084932499647 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.0617   0.9270   4.3636  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0023   0.0014   0.0050   5.4889   2.1784   2.1397
***** Episode 102461, Mean R = -12.7  Std R = 5.5  Min R = -24.2
PolicyLoss: -0.025
Policy_Beta: 0.1
Policy_Entropy: 0.181
Policy_KL: 0.00112
Policy_SD: 0.543
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 3.77e+07
VF_0_ExplainedVarNew: 0.979
VF_0_ExplainedVarOld: 0.976
VF_0_Loss : 0.0025


ADV1:  0.0016754536317777145 0.00736859992836074 0.033

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.5171   1.7962   7.3064  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0029   0.0019   0.0073   5.4889   2.1784   2.1397
***** Episode 102709, Mean R = -11.4  Std R = 5.2  Min R = -26.0
PolicyLoss: -0.0118
Policy_Beta: 0.1
Policy_Entropy: 0.181
Policy_KL: 0.000904
Policy_SD: 0.535
Policy_lr_mult: 0.198
Steps: 1.18e+04
TotalSteps: 3.78e+07
VF_0_ExplainedVarNew: 0.993
VF_0_ExplainedVarOld: 0.988
VF_0_Loss : 0.000415


ADV1:  -0.00012007570098591957 0.007711227777895162 0.03954157625400176 -0.07118539890672124
ADV2:  0.032262831619726366 0.7999026158384362 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   3.9462   2.2561  11.6088  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0009   0.0005   0.0021   5.4889   2.1784   2.1397
***** Episode 102740, Mean R = -10.7  Std R = 4.7  Min R = -24.1
PolicyLoss: -0.0359
Policy_Beta: 0.1
Policy_Entropy: 0.182
Policy_KL: 0.000

ADV1:  0.0005856133804275121 0.0068922835798638895 0.04818745355543885 -0.059297129457406915
ADV2:  0.01725797734364211 0.8435015631221089 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.1717   0.5264   2.8005  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0007   0.0004   0.0015   5.4889   2.1784   2.1397
***** Episode 102988, Mean R = -10.7  Std R = 5.4  Min R = -30.1
PolicyLoss: -0.0265
Policy_Beta: 0.1
Policy_Entropy: 0.179
Policy_KL: 0.000753
Policy_SD: 0.528
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 3.79e+07
VF_0_ExplainedVarNew: 0.982
VF_0_ExplainedVarOld: 0.977
VF_0_Loss : 0.000173


ADV1:  -0.0020838826837088257 0.007587400095743476 0.07713883253703657 -0.060003536750620104
ADV2:  0.046270536993111656 0.8129555750266045 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.0406   1.2579   6.1458  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0026   0.0016   0.0054   5.4889   2.1784  

seeker_angles |    0.00    0.00 |    0.07    0.08 |   -0.99   -0.99 |    0.98    0.98
cs_angles |  0.0045  0.0005 |  0.0736  0.0798 | -0.9902 -0.9937 |  0.9773  0.9842
optical_flow |  0.0000 -0.0000 |  0.0224  0.0220 | -1.0956 -1.2367 |  1.0140  1.2561
v_err    | -0.0102 |  0.0584 | -0.4528 |  0.1022
landing_rewards |    9.74 |    1.59 |    0.00 |   10.00
landing_margin |   -0.02 |    0.01 |   -0.07 |    0.02
tracking_rewards |  -16.49 |    4.78 |  -45.46 |   -9.40
steps    |     378 |      20 |     334 |     418
***** Episode 103267, Mean R = -10.8  Std R = 4.6  Min R = -20.3
PolicyLoss: -0.0272
Policy_Beta: 0.1
Policy_Entropy: 0.179
Policy_KL: 0.00106
Policy_SD: 0.539
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 3.8e+07
VF_0_ExplainedVarNew: 0.983
VF_0_ExplainedVarOld: 0.98
VF_0_Loss : 0.00078


ADV1:  0.0020567516685206975 0.005634565558276192 0.04902424192741811 -0.06603633246542334
ADV2:  -0.02631960274395472 0.8745008727015943 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u

w        |    0.00    0.00   -0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.05   -0.22 |    0.66    1.84 |   -1.55   -3.14 |    1.48    3.14
w_f      |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.02 |    0.03    0.02    0.02
w_rewards |    0.00 |    0.00 |    0.00 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.22 |    0.25 |    0.00 |    1.43
seeker_angles |    0.00    0.00 |    0.07    0.08 |   -1.00   -0.94 |    0.99    0.98
cs_angles |  0.0040  0.0015 |  0.0742  0.0764 | -0.9964 -0.9386 |  0.9890  0.9772
optical_flow |  0.0000  0.0000 |  0.0231  0.0214 | -1.2016 -1.1853 |  1.0646  0.9412
v_err    | -0.0103 |  0.0584 | -0.4521 |  0.0978
landing_rewards |    9.84 |    1.26 |    0.00 |   10.00
landing_margin |   -0.03 |    0.01 |   -0.06 |    0.01
tracking_rewards |  -15.93 |    3.68 |  -27.76 |   -8.60
steps    |     378 |  

w        |    0.00    0.00   -0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.04    0.14 |    0.64    1.96 |   -1.39   -3.13 |    1.53    3.11
w_f      |    0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.02   -0.02   -0.02 |    0.03    0.02    0.02
w_rewards |    0.00 |    0.00 |    0.00 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.23 |    0.25 |    0.00 |    1.58
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -0.86   -0.97 |    0.99    1.00
cs_angles |  0.0034  0.0010 |  0.0771  0.0773 | -0.8579 -0.9722 |  0.9878  0.9988
optical_flow | -0.0001 -0.0000 |  0.0218  0.0213 | -0.9939 -1.2499 |  1.0470  0.9418
v_err    | -0.0103 |  0.0582 | -0.4526 |  0.1028
landing_rewards |    9.71 |    1.68 |    0.00 |   10.00
landing_margin |   -0.03 |    0.01 |   -0.06 |    0.01
tracking_rewards |  -16.36 |    4.37 |  -38.70 |   -9.29
steps    |     378 |  

w        |    0.00    0.00   -0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.03   -0.13 |    0.66    1.82 |   -1.57   -3.12 |    1.47    3.12
w_f      |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.02 |    0.03    0.02    0.02
w_rewards |    0.00 |    0.00 |    0.00 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.22 |    0.25 |    0.00 |    1.51
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -1.00   -0.98 |    1.00    0.99
cs_angles |  0.0010  0.0045 |  0.0772  0.0782 | -0.9976 -0.9758 |  0.9966  0.9903
optical_flow |  0.0001 -0.0000 |  0.0245  0.0232 | -0.9982 -1.0254 |  1.1174  1.0799
v_err    | -0.0102 |  0.0579 | -0.4525 |  0.0963
landing_rewards |    9.74 |    1.59 |    0.00 |   10.00
landing_margin |   -0.03 |    0.01 |   -0.05 |    0.01
tracking_rewards |  -16.39 |    4.15 |  -31.71 |   -9.24
steps    |     379 |  

attitude |   -0.03    0.00    0.04 |    1.08    0.66    1.76 |   -3.14   -1.52   -3.14 |    3.14    1.56    3.14
w        |    0.00    0.00   -0.00 |    0.00    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.01   -0.06 |    0.66    1.75 |   -1.51   -3.14 |    1.48    3.13
w_f      |    0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.02   -0.02   -0.02 |    0.03    0.03    0.02
w_rewards |    0.00 |    0.00 |    0.00 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.22 |    0.25 |    0.00 |    1.50
seeker_angles |    0.00    0.00 |    0.07    0.08 |   -0.99   -0.99 |    0.97    0.98
cs_angles |  0.0009  0.0031 |  0.0740  0.0763 | -0.9933 -0.9868 |  0.9743  0.9839
optical_flow |  0.0001  0.0000 |  0.0226  0.0224 | -1.0636 -1.1610 |  1.1569  1.1684
v_err    | -0.0101 |  0.0580 | -0.4523 |  0.0980
landing_rewards |    9.55 |    2.08 |    0.00 |   10.00
landing_margin |   -0

thrust   |   -0.00   -0.01    0.00 |    0.67    0.67    0.67 |   -3.37   -3.41   -3.44 |    3.42    3.41    3.46
norm_thrust |    0.87 |    0.76 |    0.00 |    3.46
fuel     |    1.50 |    0.18 |    1.12 |    2.12
rewards  |  -10.51 |    4.76 |  -45.70 |   -2.74
fuel_rewards |   -4.29 |    0.53 |   -6.05 |   -3.21
glideslope_rewards |    0.00 |    0.00 |    0.00 |    0.00
glideslope_penalty |    0.00 |    0.00 |    0.00 |    0.00
glideslope |    3.19 |   13.85 |    0.00 |  311.12
norm_af  |    1.67 |    0.88 |    0.04 |    3.38
norm_wf  |    0.01 |    0.01 |    0.00 |    0.03
rh_penalty |    0.00 |    0.00 |    0.00 |    0.00
att_rewards |    0.00 |    0.00 |    0.00 |    0.00
att_penalty |    0.00 |    0.00 |    0.00 |    0.00
attitude |   -0.07   -0.00   -0.05 |    1.14    0.67    1.75 |   -3.14   -1.53   -3.14 |    3.14    1.54    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.01   -0.02 |    0.67

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.0336   0.7040   3.4688  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0014   0.0008   0.0030   5.4889   2.1784   2.1397
Update Cnt = 3390    ET =   1077.1   Stats:  Mean, Std, Min, Max
r_f      |    3.89   -5.50   -1.01 |  191.06  161.03  204.69 | -394.09 -361.21 -365.02 |  375.08  392.94  399.28
v_f      |    0.00    0.00   -0.00 |    0.04    0.04    0.05 |   -0.10   -0.09   -0.09 |    0.10    0.09    0.11
r_i      |  -10.86    6.74   42.71 |  691.03  605.42  804.43 |-1294.35-1329.38-1293.25 | 1341.05 1379.91 1358.06
v_i      |    0.00    0.00   -0.00 |    0.04    0.04    0.05 |   -0.09   -0.09   -0.10 |    0.08    0.09    0.10
norm_rf  |    0.17 |    0.07 |    0.03 |    0.39
norm_vf  |    0.08 |    0.01 |    0.04 |    0.12
gs_f     |    1.78 |    3.64 |    0.01 |   41.30
thrust   |    0.00   -0.00   -0.00 |    0.66    0.68    0.67 |   -3.43   -3.40   -3.45 |    3.43    3.41    3.45
norm_thrust |    

ADV1:  -3.089966718894367e-05 0.004807430751991356 0.038250502719125556 -0.03528155508350772
ADV2:  -0.0016851806823140266 0.9044340888924518 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   3.8625   1.9463   8.6330  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0003   0.0002   0.0008   5.4889   2.1784   2.1397
***** Episode 105406, Mean R = -10.2  Std R = 3.1  Min R = -16.9
PolicyLoss: -0.00116
Policy_Beta: 0.1
Policy_Entropy: 0.183
Policy_KL: 0.000827
Policy_SD: 0.519
Policy_lr_mult: 0.198
Steps: 1.18e+04
TotalSteps: 3.88e+07
VF_0_ExplainedVarNew: 0.99
VF_0_ExplainedVarOld: 0.988
VF_0_Loss : 0.000178


ADV1:  -0.0011895768019940397 0.007924836645724982 0.07503137506135554 -0.060677405086664825
ADV2:  0.037893016749002965 0.7922680893848674 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   3.5353   1.5441   7.7180  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0014   0.0008   0.0031   5.4889   2.178

***** Episode 105654, Mean R = -11.9  Std R = 6.3  Min R = -36.7
PolicyLoss: -0.03
Policy_Beta: 0.1
Policy_Entropy: 0.184
Policy_KL: 0.000825
Policy_SD: 0.535
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 3.89e+07
VF_0_ExplainedVarNew: 0.981
VF_0_ExplainedVarOld: 0.978
VF_0_Loss : 0.000539


ADV1:  -0.0005897469020002389 0.00823413428904901 0.06873829492958511 -0.054585235541713815
ADV2:  0.033926187269359025 0.8270711891759932 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   3.3580   1.2767   6.1748  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0012   0.0006   0.0022   5.4889   2.1784   2.1397
***** Episode 105685, Mean R = -9.4  Std R = 5.0  Min R = -25.2
PolicyLoss: -0.0335
Policy_Beta: 0.1
Policy_Entropy: 0.181
Policy_KL: 0.00125
Policy_SD: 0.517
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 3.89e+07
VF_0_ExplainedVarNew: 0.966
VF_0_ExplainedVarOld: 0.961
VF_0_Loss : 0.000956


Dynamics: Max Disturbance (m/s^2):  [0.00138293 0.00

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.7830   0.8815   4.0072  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0005   0.0003   0.0013   5.4889   2.1784   2.1397
***** Episode 105933, Mean R = -11.8  Std R = 6.9  Min R = -33.7
PolicyLoss: -0.0378
Policy_Beta: 0.1
Policy_Entropy: 0.183
Policy_KL: 0.000861
Policy_SD: 0.534
Policy_lr_mult: 0.198
Steps: 1.18e+04
TotalSteps: 3.9e+07
VF_0_ExplainedVarNew: 0.975
VF_0_ExplainedVarOld: 0.97
VF_0_Loss : 0.00145


ADV1:  0.002669035433216991 0.006020085739366924 0.060048623627888154 -0.070138213023692
ADV2:  -0.028215606801817127 0.8326841530950535 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   4.0944   2.6217  11.8892  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0037   0.0023   0.0079   5.4889   2.1784   2.1397
***** Episode 105964, Mean R = -10.4  Std R = 4.5  Min R = -21.8
PolicyLoss: -0.00555
Policy_Beta: 0.1
Policy_Entropy: 0.184
Policy_KL: 0.000719
P

ADV1:  -0.0007400992423546013 0.007141157925597714 0.033546921019840636 -0.07071253027435481
ADV2:  0.04024370126908802 0.7847901572088408 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.5731   1.0801   4.8983  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0008   0.0004   0.0019   5.4889   2.1784   2.1397
***** Episode 106212, Mean R = -10.7  Std R = 6.4  Min R = -33.7
PolicyLoss: -0.0379
Policy_Beta: 0.1
Policy_Entropy: 0.181
Policy_KL: 0.000532
Policy_SD: 0.523
Policy_lr_mult: 0.198
Steps: 1.15e+04
TotalSteps: 3.91e+07
VF_0_ExplainedVarNew: 0.98
VF_0_ExplainedVarOld: 0.978
VF_0_Loss : 0.000776


Dynamics: Max Disturbance (m/s^2):  [0.00138293 0.00181235 0.00221757] 0.0031803638227355514
ADV1:  0.0008191829770545688 0.006927813993496677 0.030568374980027346 -0.05564621289571126
ADV2:  0.017223587972838853 0.8559115838492531 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.7012   0.8565   4.5392  24.5266  15.5251  10.0673
ValF

***** Episode 106460, Mean R = -11.4  Std R = 4.5  Min R = -25.0
PolicyLoss: -0.0253
Policy_Beta: 0.1
Policy_Entropy: 0.183
Policy_KL: 0.000867
Policy_SD: 0.533
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 3.92e+07
VF_0_ExplainedVarNew: 0.99
VF_0_ExplainedVarOld: 0.986
VF_0_Loss : 0.00314


ADV1:  -0.002497756908716416 0.009211360853242095 0.05430385873191029 -0.07627652776885946
ADV2:  0.04775343501264387 0.8474821172663258 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   3.2591   1.9166   9.4771  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0032   0.0019   0.0066   5.4889   2.1784   2.1397
***** Episode 106491, Mean R = -11.7  Std R = 5.5  Min R = -26.8
PolicyLoss: -0.0287
Policy_Beta: 0.1
Policy_Entropy: 0.183
Policy_KL: 0.000623
Policy_SD: 0.535
Policy_lr_mult: 0.198
Steps: 1.18e+04
TotalSteps: 3.92e+07
VF_0_ExplainedVarNew: 0.965
VF_0_ExplainedVarOld: 0.959
VF_0_Loss : 0.000874


Dynamics: Max Disturbance (m/s^2):  [0.00138293 0.00

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   3.1030   2.0364   8.4360  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0016   0.0010   0.0037   5.4889   2.1784   2.1397
***** Episode 106739, Mean R = -10.6  Std R = 3.5  Min R = -18.7
PolicyLoss: -0.0263
Policy_Beta: 0.1
Policy_Entropy: 0.185
Policy_KL: 0.000863
Policy_SD: 0.518
Policy_lr_mult: 0.198
Steps: 1.18e+04
TotalSteps: 3.93e+07
VF_0_ExplainedVarNew: 0.982
VF_0_ExplainedVarOld: 0.977
VF_0_Loss : 3.82e-05


Dynamics: Max Disturbance (m/s^2):  [0.00138293 0.00181235 0.00221757] 0.0031803638227355514
ADV1:  0.00021811759456116773 0.009135416832819623 0.06062681123404007 -0.05398419414616713
ADV2:  0.0191205730182221 0.8666056125190472 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.9217   0.9197   3.9018  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0005   0.0003   0.0012   5.4889   2.1784   2.1397
***** Episode 106770, Mean R = -12.2  Std R = 5.1 

ADV1:  -0.0006304698411396836 0.0067065161084970525 0.059745471204229794 -0.0773130254323981
ADV2:  0.03790570446792501 0.7925421064394137 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.7111   0.9241   4.9109  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0009   0.0005   0.0019   5.4889   2.1784   2.1397
***** Episode 107018, Mean R = -10.8  Std R = 4.5  Min R = -21.3
PolicyLoss: -0.0354
Policy_Beta: 0.1
Policy_Entropy: 0.184
Policy_KL: 0.00098
Policy_SD: 0.533
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 3.94e+07
VF_0_ExplainedVarNew: 0.981
VF_0_ExplainedVarOld: 0.978
VF_0_Loss : 4.22e-05


Dynamics: Max Disturbance (m/s^2):  [0.00138293 0.00181235 0.00221757] 0.0031803638227355514
ADV1:  -7.218949331043908e-05 0.005513096425150192 0.03644951861282847 -0.037752130016774355
ADV2:  0.011374327090183808 0.8920824942014951 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   4.2990   2.1859  10.1146  24.5266  15.5251  10.0673
Val

cs_angles |  0.0011  0.0027 |  0.0743  0.0772 | -0.9841 -0.9445 |  0.9958  0.9687
optical_flow |  0.0001  0.0001 |  0.0227  0.0223 | -1.2724 -1.0584 |  1.2015  0.9870
v_err    | -0.0097 |  0.0584 | -0.4524 |  0.1013
landing_rewards |    9.71 |    1.68 |    0.00 |   10.00
landing_margin |   -0.02 |    0.01 |   -0.06 |    0.02
tracking_rewards |  -16.31 |    4.37 |  -42.72 |   -9.08
steps    |     377 |      20 |     334 |     418
***** Episode 107297, Mean R = -9.7  Std R = 5.5  Min R = -27.9
PolicyLoss: -0.0152
Policy_Beta: 0.1
Policy_Entropy: 0.183
Policy_KL: 0.000752
Policy_SD: 0.519
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 3.95e+07
VF_0_ExplainedVarNew: 0.987
VF_0_ExplainedVarOld: 0.981
VF_0_Loss : 2.48e-05


ADV1:  0.001822966237738062 0.005588190880443338 0.04854571181646522 -0.03463488711885804
ADV2:  -0.021411011964170248 0.8980101724330549 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.0302   1.2800   6.0490  24.5266  15.5251  10.0673
ValFun  Gradients: 

w        |    0.00    0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.02    0.07 |    0.68    1.78 |   -1.56   -3.08 |    1.49    3.12
w_f      |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.02 |    0.03    0.03    0.02
w_rewards |    0.00 |    0.00 |    0.00 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.22 |    0.25 |    0.00 |    1.45
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -0.99   -0.95 |    0.99    0.98
cs_angles |  0.0020  0.0003 |  0.0764  0.0801 | -0.9936 -0.9496 |  0.9878  0.9780
optical_flow | -0.0001  0.0000 |  0.0224  0.0210 | -1.3122 -0.9082 |  0.9981  1.0383
v_err    | -0.0097 |  0.0585 | -0.4530 |  0.1068
landing_rewards |    9.71 |    1.68 |    0.00 |   10.00
landing_margin |   -0.02 |    0.01 |   -0.06 |    0.02
tracking_rewards |  -16.49 |    4.42 |  -38.96 |   -9.02
steps    |     377 |  

attitude |   -0.01   -0.00    0.01 |    1.13    0.67    1.79 |   -3.14   -1.55   -3.14 |    3.14    1.55    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.01    0.02 |    0.68    1.79 |   -1.43   -3.11 |    1.53    3.13
w_f      |    0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.02 |    0.03    0.03    0.02
w_rewards |    0.00 |    0.00 |    0.00 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.22 |    0.25 |    0.00 |    1.63
seeker_angles |    0.00    0.00 |    0.07    0.08 |   -0.99   -0.97 |    1.00    0.99
cs_angles |  0.0032  0.0049 |  0.0748  0.0778 | -0.9939 -0.9744 |  0.9986  0.9903
optical_flow |  0.0000  0.0001 |  0.0234  0.0238 | -1.1878 -1.2706 |  1.3107  1.2139
v_err    | -0.0098 |  0.0586 | -0.4534 |  0.1216
landing_rewards |    9.65 |    1.85 |    0.00 |   10.00
landing_margin |   -0

attitude |   -0.07    0.02   -0.27 |    1.19    0.69    1.84 |   -3.14   -1.55   -3.14 |    3.14    1.52    3.14
w        |    0.00    0.00   -0.00 |    0.00    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.02   -0.33 |    0.69    1.82 |   -1.53   -3.13 |    1.41    3.08
w_f      |    0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.02 |    0.03    0.03    0.02
w_rewards |    0.00 |    0.00 |    0.00 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.22 |    0.25 |    0.00 |    1.51
seeker_angles |    0.00    0.00 |    0.08    0.07 |   -1.00   -0.99 |    0.99    1.00
cs_angles |  0.0025  0.0020 |  0.0752  0.0750 | -0.9997 -0.9879 |  0.9944  0.9961
optical_flow |  0.0001 -0.0000 |  0.0220  0.0216 | -0.9719 -1.0681 |  1.1887  1.1557
v_err    | -0.0100 |  0.0583 | -0.4516 |  0.0985
landing_rewards |    9.61 |    1.93 |    0.00 |   10.00
landing_margin |   -0

thrust   |   -0.00    0.00    0.00 |    0.67    0.68    0.67 |   -3.40   -3.46   -3.45 |    3.43    3.45    3.40
norm_thrust |    0.88 |    0.76 |    0.00 |    3.46
fuel     |    1.50 |    0.18 |    1.10 |    2.13
rewards  |  -11.02 |    4.65 |  -30.87 |   -3.54
fuel_rewards |   -4.29 |    0.51 |   -6.09 |   -3.15
glideslope_rewards |    0.00 |    0.00 |    0.00 |    0.00
glideslope_penalty |    0.00 |    0.00 |    0.00 |    0.00
glideslope |    2.92 |   12.97 |    0.00 |  312.53
norm_af  |    1.80 |    0.89 |    0.02 |    3.25
norm_wf  |    0.01 |    0.01 |    0.00 |    0.04
rh_penalty |    0.00 |    0.00 |    0.00 |    0.00
att_rewards |    0.00 |    0.00 |    0.00 |    0.00
att_penalty |    0.00 |    0.00 |    0.00 |    0.00
attitude |    0.06    0.01    0.15 |    1.25    0.71    1.88 |   -3.14   -1.56   -3.14 |    3.14    1.57    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.00    0.14 |    0.72

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   4.2277   3.4071  12.6926  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0002   0.0001   0.0004   5.4889   2.1784   2.1397
Update Cnt = 3510    ET =   1170.9   Stats:  Mean, Std, Min, Max
r_f      |  -31.31   -4.17    2.57 |  194.64  168.41  193.46 | -383.52 -385.62 -394.39 |  394.24  388.45  373.56
v_f      |    0.00    0.00    0.00 |    0.04    0.04    0.05 |   -0.09   -0.10   -0.09 |    0.10    0.10    0.11
r_i      | -104.68  -40.39    0.26 |  718.06  643.45  743.03 |-1354.29-1292.81-1313.28 | 1272.48 1357.60 1334.00
v_i      |    0.01    0.00    0.00 |    0.05    0.04    0.05 |   -0.10   -0.10   -0.09 |    0.09    0.09    0.10
norm_rf  |    0.17 |    0.07 |    0.02 |    0.38
norm_vf  |    0.08 |    0.01 |    0.05 |    0.11
gs_f     |    1.51 |    5.25 |    0.01 |   86.88
thrust   |   -0.00   -0.00   -0.00 |    0.66    0.67    0.67 |   -3.42   -3.39   -3.43 |    3.38    3.40    3.44
norm_thrust |    

ADV1:  0.0005356839114794638 0.0068453731661185955 0.05997508365041554 -0.06381821297392648
ADV2:  0.020070897721642757 0.7925237501562405 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.4290   0.6700   2.9643  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0007   0.0004   0.0017   5.4889   2.1784   2.1397
***** Episode 109126, Mean R = -12.2  Std R = 5.6  Min R = -30.3
PolicyLoss: -0.0296
Policy_Beta: 0.1
Policy_Entropy: 0.184
Policy_KL: 0.000723
Policy_SD: 0.537
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 4.02e+07
VF_0_ExplainedVarNew: 0.985
VF_0_ExplainedVarOld: 0.982
VF_0_Loss : 7.26e-05


Dynamics: Max Disturbance (m/s^2):  [0.00138293 0.00181235 0.00221757] 0.0031803638227355514
ADV1:  -0.0009465146887248424 0.006613557659843036 0.055306338333728944 -0.05980270189768622
ADV2:  0.04352346098695141 0.7869020666958069 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.1889   0.4539   2.3293  24.5266  15.5251  10.0673
Val

***** Episode 109374, Mean R = -11.0  Std R = 4.6  Min R = -23.1
PolicyLoss: -0.0298
Policy_Beta: 0.1
Policy_Entropy: 0.18
Policy_KL: 0.000922
Policy_SD: 0.539
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 4.03e+07
VF_0_ExplainedVarNew: 0.977
VF_0_ExplainedVarOld: 0.972
VF_0_Loss : 0.000131


ADV1:  -0.00011032062289843208 0.008373922565367982 0.07875809341041906 -0.07517130135665351
ADV2:  0.024642019721492697 0.8240462582925677 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   3.4997   1.8261   7.7198  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0002   0.0002   0.0005   5.4889   2.1784   2.1397
***** Episode 109405, Mean R = -11.2  Std R = 4.6  Min R = -22.8
PolicyLoss: -0.0281
Policy_Beta: 0.1
Policy_Entropy: 0.182
Policy_KL: 0.000726
Policy_SD: 0.537
Policy_lr_mult: 0.198
Steps: 1.18e+04
TotalSteps: 4.03e+07
VF_0_ExplainedVarNew: 0.972
VF_0_ExplainedVarOld: 0.967
VF_0_Loss : 9.64e-05


Dynamics: Max Disturbance (m/s^2):  [0.00138293 

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.9474   1.6423   8.7417  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0026   0.0016   0.0062   5.4889   2.1784   2.1397
***** Episode 109653, Mean R = -11.7  Std R = 5.8  Min R = -30.4
PolicyLoss: -0.0356
Policy_Beta: 0.1
Policy_Entropy: 0.183
Policy_KL: 0.000944
Policy_SD: 0.538
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 4.04e+07
VF_0_ExplainedVarNew: 0.974
VF_0_ExplainedVarOld: 0.971
VF_0_Loss : 0.000273


Dynamics: Max Disturbance (m/s^2):  [0.00138293 0.00181235 0.00221757] 0.0031803638227355514
ADV1:  0.0019368704806129828 0.0050469350678121186 0.036040655304011515 -0.052592287221328915
ADV2:  -0.017012804079613173 0.9140077338682495 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.7730   1.1665   6.0934  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0020   0.0013   0.0050   5.4889   2.1784   2.1397
***** Episode 109684, Mean R = -11.0  Std R =

ADV1:  0.00012130071611033304 0.006183693122194075 0.025846436617221864 -0.05150462766567407
ADV2:  0.02967970746253794 0.8060287033691818 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.2327   1.2101   6.6030  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0005   0.0003   0.0012   5.4889   2.1784   2.1397
***** Episode 109932, Mean R = -9.4  Std R = 3.5  Min R = -20.3
PolicyLoss: -0.0362
Policy_Beta: 0.1
Policy_Entropy: 0.184
Policy_KL: 0.00106
Policy_SD: 0.512
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 4.05e+07
VF_0_ExplainedVarNew: 0.978
VF_0_ExplainedVarOld: 0.977
VF_0_Loss : 0.000413


Dynamics: Max Disturbance (m/s^2):  [0.00138293 0.00181235 0.00221757] 0.0031803638227355514
ADV1:  -0.002721605414553247 0.006968110952268142 0.028013073928212284 -0.052396411387715856
ADV2:  0.051395586257675575 0.8399586428620055 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.3288   0.9131   4.5843  24.5266  15.5251  10.0673
ValF

***** Episode 110180, Mean R = -10.8  Std R = 5.2  Min R = -23.6
PolicyLoss: -0.0306
Policy_Beta: 0.1
Policy_Entropy: 0.184
Policy_KL: 0.000774
Policy_SD: 0.521
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 4.06e+07
VF_0_ExplainedVarNew: 0.977
VF_0_ExplainedVarOld: 0.974
VF_0_Loss : 5.41e-05


ADV1:  -0.00038934966604846176 0.009373126048452345 0.04064348665039197 -0.07755258353429059
ADV2:  0.029831142318039315 0.8490459373052297 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   3.0111   1.9067  10.2260  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0005   0.0003   0.0011   5.4889   2.1784   2.1397
***** Episode 110211, Mean R = -11.2  Std R = 4.5  Min R = -22.0
PolicyLoss: -0.0317
Policy_Beta: 0.1
Policy_Entropy: 0.184
Policy_KL: 0.000807
Policy_SD: 0.521
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 4.06e+07
VF_0_ExplainedVarNew: 0.96
VF_0_ExplainedVarOld: 0.956
VF_0_Loss : 8.7e-05


Dynamics: Max Disturbance (m/s^2):  [0.00138293 0

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   4.9745   4.0455  15.8997  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0009   0.0005   0.0019   5.4889   2.1784   2.1397
***** Episode 110459, Mean R = -10.6  Std R = 4.5  Min R = -22.3
PolicyLoss: -0.00488
Policy_Beta: 0.1
Policy_Entropy: 0.185
Policy_KL: 0.000588
Policy_SD: 0.525
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 4.07e+07
VF_0_ExplainedVarNew: 0.989
VF_0_ExplainedVarOld: 0.986
VF_0_Loss : 6.16e-05


Dynamics: Max Disturbance (m/s^2):  [0.00138293 0.00181235 0.00221757] 0.0031803638227355514
ADV1:  -0.0010435399485570563 0.006912519433046527 0.09763650263006679 -0.05556840310457484
ADV2:  0.027032371687826788 0.8460134128999414 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.0937   1.6005   5.9940  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0012   0.0008   0.0028   5.4889   2.1784   2.1397
***** Episode 110490, Mean R = -11.2  Std R = 4

ADV1:  -0.0009302994687203917 0.006883741771612637 0.04058000052259919 -0.05501577081965686
ADV2:  0.03010472500761236 0.8425338121591831 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.1933   0.7193   4.0213  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0016   0.0008   0.0031   5.4889   2.1784   2.1397
***** Episode 110738, Mean R = -11.7  Std R = 4.9  Min R = -24.7
PolicyLoss: -0.0252
Policy_Beta: 0.1
Policy_Entropy: 0.187
Policy_KL: 0.00097
Policy_SD: 0.528
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 4.08e+07
VF_0_ExplainedVarNew: 0.983
VF_0_ExplainedVarOld: 0.979
VF_0_Loss : 3.92e-05


Dynamics: Max Disturbance (m/s^2):  [0.00138293 0.00181235 0.00221757] 0.0031803638227355514
ADV1:  0.00029561673927154704 0.008228516193713729 0.042680244326769506 -0.05869428338061984
ADV2:  0.023503127794936064 0.8477979878582139 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.6316   0.9856   4.5623  24.5266  15.5251  10.0673
ValF

cs_angles |  0.0020  0.0020 |  0.0731  0.0741 | -0.9535 -0.9968 |  0.9962  0.9750
optical_flow |  0.0000 -0.0001 |  0.0222  0.0241 | -0.9487 -1.1685 |  1.1594  1.0028
v_err    | -0.0104 |  0.0586 | -0.4536 |  0.1122
landing_rewards |    9.48 |    2.21 |    0.00 |   10.00
landing_margin |   -0.02 |    0.01 |   -0.05 |    0.03
tracking_rewards |  -15.89 |    3.59 |  -31.10 |   -9.14
steps    |     376 |      20 |     334 |     417
***** Episode 111017, Mean R = -10.2  Std R = 4.2  Min R = -22.8
PolicyLoss: -0.0212
Policy_Beta: 0.1
Policy_Entropy: 0.184
Policy_KL: 0.000827
Policy_SD: 0.534
Policy_lr_mult: 0.198
Steps: 1.18e+04
TotalSteps: 4.09e+07
VF_0_ExplainedVarNew: 0.962
VF_0_ExplainedVarOld: 0.954
VF_0_Loss : 0.00021


ADV1:  0.00025216922893486326 0.00678145019374635 0.04507403936648563 -0.06792080711747156
ADV2:  0.027982167856899214 0.7917039396438015 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.7542   0.9642   5.3475  24.5266  15.5251  10.0673
ValFun  Gradients: 

attitude |   -0.01    0.04    0.04 |    1.23    0.67    1.87 |   -3.14   -1.57   -3.14 |    3.14    1.54    3.14
w        |    0.00    0.00    0.00 |    0.00    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.03    0.06 |    0.67    1.87 |   -1.53   -3.14 |    1.42    3.13
w_f      |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.02 |    0.04    0.02    0.02
w_rewards |    0.00 |    0.00 |    0.00 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.23 |    0.26 |    0.00 |    1.42
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -1.00   -1.00 |    1.00    1.00
cs_angles |  0.0025  0.0025 |  0.0760  0.0788 | -0.9995 -0.9958 |  0.9969  0.9975
optical_flow | -0.0000  0.0001 |  0.0239  0.0224 | -1.2340 -1.2790 |  1.2329  1.0528
v_err    | -0.0104 |  0.0586 | -0.4515 |  0.1047
landing_rewards |    9.58 |    2.00 |    0.00 |   10.00
landing_margin |   -0

attitude |   -0.04   -0.00    0.08 |    1.23    0.66    1.91 |   -3.14   -1.57   -3.14 |    3.14    1.52    3.14
w        |    0.00   -0.00    0.00 |    0.00    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.00    0.09 |    0.66    1.90 |   -1.48   -3.13 |    1.47    3.14
w_f      |    0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.02 |    0.02    0.02    0.02
w_rewards |    0.00 |    0.00 |    0.00 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.22 |    0.25 |    0.00 |    1.35
seeker_angles |    0.00    0.00 |    0.07    0.08 |   -1.00   -0.95 |    1.00    0.96
cs_angles |  0.0021  0.0039 |  0.0733  0.0768 | -0.9997 -0.9547 |  0.9992  0.9622
optical_flow | -0.0001  0.0000 |  0.0212  0.0214 | -1.3262 -0.9584 |  0.9611  1.1187
v_err    | -0.0107 |  0.0585 | -0.4533 |  0.0968
landing_rewards |    9.52 |    2.15 |    0.00 |   10.00
landing_margin |   -0

attitude |    0.01    0.01    0.21 |    1.23    0.67    1.92 |   -3.14   -1.55   -3.14 |    3.14    1.54    3.14
w        |    0.00    0.00   -0.00 |    0.00    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.01    0.22 |    0.67    1.92 |   -1.54   -3.13 |    1.48    3.14
w_f      |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.02 |    0.02    0.03    0.02
w_rewards |    0.00 |    0.00 |    0.00 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.23 |    0.25 |    0.00 |    1.64
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -0.98   -0.90 |    0.99    0.98
cs_angles |  0.0035  0.0030 |  0.0773  0.0797 | -0.9813 -0.8973 |  0.9927  0.9849
optical_flow |  0.0000  0.0000 |  0.0231  0.0220 | -1.1240 -0.8804 |  1.0985  1.1731
v_err    | -0.0107 |  0.0585 | -0.4522 |  0.0957
landing_rewards |    9.94 |    0.80 |    0.00 |   10.00
landing_margin |   -0

attitude |    0.09    0.08    0.11 |    1.15    0.63    1.87 |   -3.14   -1.57   -3.14 |    3.14    1.56    3.14
w        |    0.00    0.00    0.00 |    0.00    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.08    0.14 |    0.63    1.88 |   -1.43   -3.11 |    1.46    3.14
w_f      |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.02 |    0.03    0.02    0.02
w_rewards |    0.00 |    0.00 |    0.00 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.22 |    0.25 |    0.00 |    1.51
seeker_angles |    0.00    0.00 |    0.07    0.08 |   -0.96   -1.00 |    0.99    1.00
cs_angles |  0.0008  0.0029 |  0.0745  0.0771 | -0.9595 -0.9961 |  0.9937  0.9975
optical_flow | -0.0000 -0.0000 |  0.0224  0.0238 | -1.0897 -1.1055 |  1.0669  1.0032
v_err    | -0.0108 |  0.0591 | -0.4532 |  0.0917
landing_rewards |    9.74 |    1.59 |    0.00 |   10.00
landing_margin |   -0

thrust   |   -0.00    0.00   -0.00 |    0.67    0.68    0.67 |   -3.30   -3.46   -3.45 |    3.35    3.46    3.44
norm_thrust |    0.88 |    0.76 |    0.00 |    3.46
fuel     |    1.50 |    0.18 |    1.04 |    2.16
rewards  |  -10.69 |    4.62 |  -40.43 |   -3.50
fuel_rewards |   -4.29 |    0.52 |   -6.19 |   -2.97
glideslope_rewards |    0.00 |    0.00 |    0.00 |    0.00
glideslope_penalty |    0.00 |    0.00 |    0.00 |    0.00
glideslope |    2.98 |   12.77 |    0.01 |  496.88
norm_af  |    1.76 |    0.95 |    0.06 |    3.27
norm_wf  |    0.01 |    0.01 |    0.00 |    0.03
rh_penalty |    0.00 |    0.00 |    0.00 |    0.00
att_rewards |    0.00 |    0.00 |    0.00 |    0.00
att_penalty |    0.00 |    0.00 |    0.00 |    0.00
attitude |    0.02   -0.01    0.07 |    1.23    0.65    1.88 |   -3.14   -1.56   -3.14 |    3.14    1.57    3.14
w        |    0.00    0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.02    0.06 |    0.66

ADV1:  -0.00013660643614252466 0.005251230992305219 0.046421141138006605 -0.039511248057822024
ADV2:  -0.0005010352417065705 0.9188253265007634 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   4.0713   2.4738  10.4874  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0004   0.0002   0.0007   5.4889   2.1784   2.1397
Update Cnt = 3640    ET =   1072.6   Stats:  Mean, Std, Min, Max
r_f      |   -5.30  -17.25   -6.75 |  183.54  173.12  204.90 | -383.17 -392.18 -395.69 |  368.61  378.12  379.57
v_f      |    0.00    0.01   -0.00 |    0.04    0.04    0.05 |   -0.09   -0.09   -0.09 |    0.10    0.09    0.09
r_i      |  -15.84  -76.02    4.05 |  680.02  648.50  771.08 |-1297.71-1354.75-1367.04 | 1318.13 1252.76 1294.10
v_i      |    0.00    0.00    0.00 |    0.04    0.04    0.05 |   -0.10   -0.09   -0.10 |    0.09    0.09    0.09
norm_rf  |    0.17 |    0.07 |    0.03 |    0.52
norm_vf  |    0.07 |    0.01 |    0.04 |    0.11
gs_f     |    1.37 |    2.

Dynamics: Max Disturbance (m/s^2):  [0.00138293 0.00181235 0.00221757] 0.0031803638227355514
ADV1:  -0.0005819923626741515 0.005098181067446766 0.06170930574435779 -0.042349901931704736
ADV2:  0.0030587165364392554 0.8636819397354099 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.2295   0.6770   3.7963  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0014   0.0007   0.0027   5.4889   2.1784   2.1397
***** Episode 113156, Mean R = -9.7  Std R = 4.7  Min R = -24.6
PolicyLoss: 0.00346
Policy_Beta: 0.1
Policy_Entropy: 0.186
Policy_KL: 0.000679
Policy_SD: 0.523
Policy_lr_mult: 0.198
Steps: 1.18e+04
TotalSteps: 4.17e+07
VF_0_ExplainedVarNew: 0.99
VF_0_ExplainedVarOld: 0.986
VF_0_Loss : 1.97e-05


ADV1:  0.00020979740439992672 0.005030919550241594 0.04829953191410147 -0.03555490893124347
ADV2:  -0.0008765745405756132 0.9166767409984207 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   6.4300   4.9627  17.7038  24.5266  15.5251  10.0673
V

ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0040   0.0023   0.0079   5.4889   2.1784   2.1397
***** Episode 113404, Mean R = -10.0  Std R = 3.8  Min R = -18.2
PolicyLoss: -0.0277
Policy_Beta: 0.1
Policy_Entropy: 0.189
Policy_KL: 0.000853
Policy_SD: 0.516
Policy_lr_mult: 0.198
Steps: 1.18e+04
TotalSteps: 4.18e+07
VF_0_ExplainedVarNew: 0.98
VF_0_ExplainedVarOld: 0.977
VF_0_Loss : 5.4e-05


ADV1:  0.002076927404287503 0.005024384892880948 0.03631355003489933 -0.08669429567075931
ADV2:  -0.01623719333084402 0.841100978954214 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.3912   0.5256   3.1503  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0022   0.0013   0.0054   5.4889   2.1784   2.1397
***** Episode 113435, Mean R = -9.5  Std R = 3.9  Min R = -22.4
PolicyLoss: -0.0181
Policy_Beta: 0.1
Policy_Entropy: 0.187
Policy_KL: 0.000923
Policy_SD: 0.509
Policy_lr_mult: 0.198
Steps: 1.19e+04
TotalSteps: 4.18e+07
VF_0_ExplainedVarNew: 0.99
VF_

ADV1:  0.002053476158489553 0.00482313516303057 0.050603504790416254 -0.056415451460025634
ADV2:  -0.03070700339993643 0.8980196005006242 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   5.8211   4.3027  15.3362  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0024   0.0015   0.0053   5.4889   2.1784   2.1397
***** Episode 113683, Mean R = -9.8  Std R = 3.2  Min R = -18.7
PolicyLoss: -0.00465
Policy_Beta: 0.1
Policy_Entropy: 0.187
Policy_KL: 0.000888
Policy_SD: 0.526
Policy_lr_mult: 0.198
Steps: 1.15e+04
TotalSteps: 4.19e+07
VF_0_ExplainedVarNew: 0.99
VF_0_ExplainedVarOld: 0.988
VF_0_Loss : 0.000186


ADV1:  -0.002045182765528093 0.004891517938525467 0.028344706298587347 -0.056188002649849744
ADV2:  0.037637055770402175 0.8857148005127242 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.5436   0.8464   4.7206  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0024   0.0015   0.0054   5.4889   2.1784   2

***** Episode 113931, Mean R = -10.0  Std R = 4.3  Min R = -20.9
PolicyLoss: -0.00333
Policy_Beta: 0.1
Policy_Entropy: 0.187
Policy_KL: 0.00089
Policy_SD: 0.511
Policy_lr_mult: 0.198
Steps: 1.18e+04
TotalSteps: 4.2e+07
VF_0_ExplainedVarNew: 0.99
VF_0_ExplainedVarOld: 0.987
VF_0_Loss : 0.000298


ADV1:  -0.001887036475310363 0.007251725671642787 0.03125781841267483 -0.09525606241183804
ADV2:  0.04291206382234533 0.8143306695605993 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.6008   1.6473   8.3861  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0027   0.0016   0.0053   5.4889   2.1784   2.1397
***** Episode 113962, Mean R = -10.9  Std R = 4.4  Min R = -22.5
PolicyLoss: -0.0311
Policy_Beta: 0.1
Policy_Entropy: 0.187
Policy_KL: 0.000669
Policy_SD: 0.521
Policy_lr_mult: 0.198
Steps: 1.15e+04
TotalSteps: 4.2e+07
VF_0_ExplainedVarNew: 0.98
VF_0_ExplainedVarOld: 0.976
VF_0_Loss : 0.000654


ADV1:  0.002171314660265501 0.006386116783396 0.045858

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.7481   0.7279   3.6067  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0007   0.0005   0.0016   5.4889   2.1784   2.1397
***** Episode 114210, Mean R = -11.1  Std R = 4.0  Min R = -19.8
PolicyLoss: -0.0201
Policy_Beta: 0.1
Policy_Entropy: 0.186
Policy_KL: 0.000652
Policy_SD: 0.524
Policy_lr_mult: 0.198
Steps: 1.19e+04
TotalSteps: 4.21e+07
VF_0_ExplainedVarNew: 0.989
VF_0_ExplainedVarOld: 0.987
VF_0_Loss : 0.00053


ADV1:  -0.0007194145552916794 0.005611223221290699 0.048923214561095746 -0.051598485484628254
ADV2:  0.0066454708982572 0.8760451848604492 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.2026   0.4659   3.1790  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0009   0.0005   0.0019   5.4889   2.1784   2.1397
***** Episode 114241, Mean R = -11.2  Std R = 4.3  Min R = -18.9
PolicyLoss: -0.00216
Policy_Beta: 0.1
Policy_Entropy: 0.185
Policy_KL: 0.0009

ADV1:  0.00019133591149340305 0.00738084765014402 0.10068400621695861 -0.10988059461160904
ADV2:  0.016246825507808413 0.841463959620969 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.4207   0.7911   4.1000  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0003   0.0002   0.0008   5.4889   2.1784   2.1397
***** Episode 114489, Mean R = -12.0  Std R = 6.9  Min R = -30.0
PolicyLoss: -0.0217
Policy_Beta: 0.1
Policy_Entropy: 0.185
Policy_KL: 0.00094
Policy_SD: 0.532
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 4.22e+07
VF_0_ExplainedVarNew: 0.986
VF_0_ExplainedVarOld: 0.979
VF_0_Loss : 7.62e-05


ADV1:  0.0030780448800870183 0.005303564745202451 0.07885408179505116 -0.03395888755662374
ADV2:  -0.047361851960171515 0.9002092081744205 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   8.5217   6.1833  18.0775  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0046   0.0024   0.0080   5.4889   2.1784   2.1

***** Episode 114737, Mean R = -10.3  Std R = 4.4  Min R = -18.0
PolicyLoss: 0.00813
Policy_Beta: 0.1
Policy_Entropy: 0.187
Policy_KL: 0.000646
Policy_SD: 0.522
Policy_lr_mult: 0.198
Steps: 1.18e+04
TotalSteps: 4.23e+07
VF_0_ExplainedVarNew: 0.989
VF_0_ExplainedVarOld: 0.984
VF_0_Loss : 0.000314


ADV1:  -0.0005755351095423942 0.005083928529665981 0.038563616601322015 -0.07689460626332312
ADV2:  0.014741708169749967 0.8794699243048218 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.7553   0.7082   3.6281  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0005   0.0004   0.0015   5.4889   2.1784   2.1397
***** Episode 114768, Mean R = -9.1  Std R = 3.4  Min R = -17.4
PolicyLoss: -0.0102
Policy_Beta: 0.1
Policy_Entropy: 0.186
Policy_KL: 0.00115
Policy_SD: 0.522
Policy_lr_mult: 0.198
Steps: 1.15e+04
TotalSteps: 4.23e+07
VF_0_ExplainedVarNew: 0.988
VF_0_ExplainedVarOld: 0.985
VF_0_Loss : 0.000222


ADV1:  0.0003639497493438546 0.005160667372735684

cs_angles |  0.0045  0.0033 |  0.0754  0.0773 | -0.9931 -0.9981 |  0.9976  0.9907
optical_flow |  0.0000  0.0000 |  0.0223  0.0221 | -1.1779 -1.2356 |  1.1989  0.9695
v_err    | -0.0102 |  0.0586 | -0.4517 |  0.0967
landing_rewards |    9.77 |    1.49 |    0.00 |   10.00
landing_margin |   -0.03 |    0.01 |   -0.06 |    0.02
tracking_rewards |  -16.28 |    4.44 |  -49.50 |   -9.55
steps    |     377 |      20 |     336 |     420
***** Episode 115047, Mean R = -10.9  Std R = 5.1  Min R = -29.3
PolicyLoss: -0.0174
Policy_Beta: 0.1
Policy_Entropy: 0.185
Policy_KL: 0.00104
Policy_SD: 0.523
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 4.24e+07
VF_0_ExplainedVarNew: 0.979
VF_0_ExplainedVarOld: 0.974
VF_0_Loss : 0.00286


ADV1:  -0.00014107825427328363 0.0074529393688819055 0.03342953747046801 -0.11143122268559191
ADV2:  0.026537377638417806 0.8287240825414227 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.8466   1.5645   8.3153  24.5266  15.5251  10.0673
ValFun  Gradients

theta_cv |    0.22 |    0.25 |    0.00 |    1.48
seeker_angles |    0.01    0.00 |    0.07    0.08 |   -0.99   -1.00 |    0.98    0.98
cs_angles |  0.0051  0.0026 |  0.0729  0.0819 | -0.9866 -0.9980 |  0.9766  0.9776
optical_flow |  0.0001 -0.0000 |  0.0225  0.0223 | -0.9437 -1.1185 |  1.0162  1.1306
v_err    | -0.0100 |  0.0582 | -0.4521 |  0.4931
landing_rewards |    9.74 |    1.59 |    0.00 |   10.00
landing_margin |    0.97 |   17.53 |   -0.06 |  309.08
tracking_rewards |  -16.28 |    4.51 |  -56.07 |   -8.75
steps    |     376 |      23 |     190 |     421
***** Episode 115357, Mean R = -11.5  Std R = 5.2  Min R = -28.1
PolicyLoss: -0.0244
Policy_Beta: 0.1
Policy_Entropy: 0.183
Policy_KL: 0.000701
Policy_SD: 0.529
Policy_lr_mult: 0.198
Steps: 1.18e+04
TotalSteps: 4.26e+07
VF_0_ExplainedVarNew: 0.981
VF_0_ExplainedVarOld: 0.978
VF_0_Loss : 4.35e-05


ADV1:  0.0010363430006610434 0.005920919962088725 0.039265647912053225 -0.05184701934162189
ADV2:  -0.0022154811300097916 0.914914561

attitude |    0.04    0.02    0.11 |    1.14    0.67    1.79 |   -3.14   -1.54   -3.14 |    3.14    1.53    3.14
w        |    0.00    0.00   -0.00 |    0.00    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.02    0.11 |    0.67    1.80 |   -1.54   -3.14 |    1.52    3.14
w_f      |    0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.04   -0.02   -0.02 |    0.03    0.02    0.02
w_rewards |    0.00 |    0.00 |    0.00 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.22 |    0.25 |    0.00 |    1.69
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -0.98   -1.00 |    0.99    0.97
cs_angles |  0.0042  0.0024 |  0.0759  0.0783 | -0.9786 -0.9953 |  0.9893  0.9726
optical_flow |  0.0000 -0.0000 |  0.0232  0.0223 | -1.1943 -1.1662 |  1.1687  1.0439
v_err    | -0.0101 |  0.0580 | -0.4526 |  0.0992
landing_rewards |    9.77 |    1.49 |    0.00 |   10.00
landing_margin |   -0

w        |    0.00    0.00    0.00 |    0.00    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.06    0.00 |    0.65    1.82 |   -1.45   -3.14 |    1.48    3.13
w_f      |    0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.03   -0.02 |    0.03    0.02    0.02
w_rewards |    0.00 |    0.00 |    0.00 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.22 |    0.25 |    0.00 |    1.49
seeker_angles |    0.00   -0.00 |    0.08    0.08 |   -1.00   -1.00 |    0.99    0.99
cs_angles |  0.0042 -0.0023 |  0.0758  0.0750 | -0.9959 -0.9983 |  0.9862  0.9878
optical_flow |  0.0001  0.0001 |  0.0229  0.0223 | -1.2128 -1.0964 |  1.1570  1.1794
v_err    | -0.0102 |  0.0583 | -0.4537 |  0.0945
landing_rewards |    9.87 |    1.13 |    0.00 |   10.00
landing_margin |   -0.03 |    0.01 |   -0.06 |    0.01
tracking_rewards |  -16.01 |    3.77 |  -31.06 |   -9.21
steps    |     379 |  

attitude |   -0.01    0.08   -0.08 |    1.20    0.65    1.86 |   -3.14   -1.54   -3.14 |    3.14    1.56    3.14
w        |    0.00    0.00    0.00 |    0.00    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.10   -0.07 |    0.65    1.85 |   -1.38   -3.14 |    1.56    3.13
w_f      |    0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.02 |    0.03    0.03    0.02
w_rewards |    0.00 |    0.00 |    0.00 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.22 |    0.25 |    0.00 |    1.56
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -0.99   -0.99 |    1.00    0.98
cs_angles |  0.0016  0.0023 |  0.0767  0.0759 | -0.9858 -0.9923 |  0.9994  0.9798
optical_flow | -0.0000 -0.0000 |  0.0237  0.0226 | -1.4170 -1.0777 |  1.2841  1.0838
v_err    | -0.0103 |  0.0588 | -0.4507 |  0.0990
landing_rewards |    9.87 |    1.13 |    0.00 |   10.00
landing_margin |   -0

attitude |    0.03   -0.02   -0.05 |    1.13    0.67    1.80 |   -3.14   -1.48   -3.14 |    3.14    1.57    3.14
w        |    0.00    0.00    0.00 |    0.00    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.03   -0.04 |    0.67    1.79 |   -1.35   -3.14 |    1.47    3.12
w_f      |    0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.03 |    0.03    0.03    0.03
w_rewards |    0.00 |    0.00 |    0.00 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.23 |    0.26 |    0.00 |    1.53
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -0.95   -0.98 |    0.99    0.99
cs_angles |  0.0030  0.0038 |  0.0766  0.0808 | -0.9453 -0.9812 |  0.9945  0.9924
optical_flow |  0.0000  0.0001 |  0.0223  0.0221 | -1.0987 -1.1194 |  1.0130  1.0247
v_err    | -0.0103 |  0.0587 | -0.4524 |  0.1025
landing_rewards |    9.81 |    1.38 |    0.00 |   10.00
landing_margin |   -0

w        |    0.00    0.00    0.00 |    0.00    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.03   -0.06 |    0.65    1.86 |   -1.47   -3.12 |    1.49    3.12
w_f      |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.02 |    0.02    0.03    0.02
w_rewards |    0.00 |    0.00 |    0.00 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.23 |    0.26 |    0.00 |    1.53
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -0.99   -0.99 |    0.98    0.99
cs_angles |  0.0029  0.0018 |  0.0804  0.0797 | -0.9944 -0.9868 |  0.9792  0.9905
optical_flow | -0.0001  0.0000 |  0.0216  0.0213 | -1.0981 -1.1666 |  1.0670  0.9170
v_err    | -0.0102 |  0.0586 | -0.4536 |  0.1038
landing_rewards |    9.68 |    1.77 |    0.00 |   10.00
landing_margin |   -0.02 |    0.01 |   -0.06 |    0.02
tracking_rewards |  -16.78 |    4.20 |  -39.46 |  -10.09
steps    |     377 |  

w        |    0.00    0.00    0.00 |    0.00    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.04   -0.12 |    0.61    1.91 |   -1.55   -3.13 |    1.45    3.12
w_f      |    0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.01 |    0.03    0.03    0.04
w_rewards |    0.00 |    0.00 |    0.00 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.22 |    0.25 |    0.00 |    1.45
seeker_angles |    0.00    0.00 |    0.08    0.07 |   -0.97   -1.00 |    0.98    0.99
cs_angles |  0.0031  0.0011 |  0.0759  0.0742 | -0.9733 -0.9989 |  0.9816  0.9930
optical_flow |  0.0001  0.0001 |  0.0223  0.0229 | -1.0018 -0.9440 |  1.1173  1.1038
v_err    | -0.0103 |  0.0587 | -0.4529 |  0.0966
landing_rewards |    9.68 |    1.77 |    0.00 |   10.00
landing_margin |   -0.02 |    0.01 |   -0.06 |    0.02
tracking_rewards |  -16.02 |    3.96 |  -34.23 |   -8.73
steps    |     378 |  

attitude |   -0.05   -0.04   -0.02 |    1.26    0.69    1.88 |   -3.14   -1.54   -3.14 |    3.14    1.56    3.14
w        |    0.00    0.00    0.00 |    0.00    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.04   -0.06 |    0.68    1.89 |   -1.47   -3.14 |    1.44    3.12
w_f      |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.02 |    0.02    0.03    0.03
w_rewards |   -0.00 |    0.00 |   -0.00 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.22 |    0.25 |    0.00 |    1.52
seeker_angles |    0.00    0.00 |    0.07    0.08 |   -0.99   -0.94 |    0.99    1.00
cs_angles |  0.0043  0.0041 |  0.0730  0.0758 | -0.9911 -0.9402 |  0.9916  0.9955
optical_flow | -0.0000  0.0001 |  0.0229  0.0221 | -1.1242 -1.1137 |  1.0667  1.1647
v_err    | -0.0101 |  0.0584 | -0.4517 |  0.1075
landing_rewards |    9.71 |    1.68 |    0.00 |   10.00
landing_margin |   -0

w        |    0.00    0.00    0.00 |    0.00    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.00   -0.11 |    0.66    1.78 |   -1.41   -3.13 |    1.49    3.13
w_f      |    0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.01   -0.02 |    0.02    0.02    0.02
w_rewards |    0.00 |    0.00 |    0.00 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.22 |    0.25 |    0.00 |    1.52
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -0.93   -1.00 |    0.98    1.00
cs_angles |  0.0024  0.0027 |  0.0765  0.0767 | -0.9322 -0.9981 |  0.9838  0.9998
optical_flow |  0.0001  0.0001 |  0.0232  0.0219 | -1.1035 -1.1377 |  0.9618  0.9472
v_err    | -0.0099 |  0.0581 | -0.4588 |  0.1098
landing_rewards |    9.71 |    1.68 |    0.00 |   10.00
landing_margin |   -0.02 |    0.01 |   -0.07 |    0.01
tracking_rewards |  -16.37 |    4.22 |  -40.05 |   -9.58
steps    |     379 |  

thrust   |    0.00   -0.00   -0.00 |    0.66    0.68    0.68 |   -3.44   -3.45   -3.40 |    3.45    3.37    3.39
norm_thrust |    0.88 |    0.76 |    0.00 |    3.46
fuel     |    1.49 |    0.18 |    1.00 |    2.14
rewards  |  -10.72 |    5.31 |  -53.46 |   -3.42
fuel_rewards |   -4.26 |    0.52 |   -6.13 |   -2.86
glideslope_rewards |    0.00 |    0.00 |    0.00 |    0.00
glideslope_penalty |    0.00 |    0.00 |    0.00 |    0.00
glideslope |    3.23 |   13.29 |    0.00 |  396.70
norm_af  |    1.71 |    0.95 |    0.04 |    3.36
norm_wf  |    0.01 |    0.01 |    0.00 |    0.03
rh_penalty |    0.00 |    0.00 |    0.00 |    0.00
att_rewards |    0.00 |    0.00 |    0.00 |    0.00
att_penalty |    0.00 |    0.00 |    0.00 |    0.00
attitude |   -0.02    0.01    0.28 |    1.23    0.66    1.83 |   -3.14   -1.56   -3.14 |    3.14    1.57    3.14
w        |    0.00    0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.02    0.20 |    0.67

ADV1:  0.00020761646738108407 0.005538785645435137 0.0492527490819783 -0.055824488021200214
ADV2:  0.005762446489925569 0.8940243912166501 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.2588   1.1111   4.9335  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0006   0.0003   0.0012   5.4889   2.1784   2.1397
Update Cnt = 3820    ET =    993.8   Stats:  Mean, Std, Min, Max
r_f      |  -12.87   -8.88   11.54 |  175.61  163.47  209.98 | -379.69 -369.73 -370.38 |  367.84  394.44  385.46
v_f      |    0.01   -0.00   -0.00 |    0.04    0.04    0.05 |   -0.10   -0.09   -0.10 |    0.10    0.08    0.09
r_i      |  -75.45    6.19   22.71 |  663.79  618.22  803.49 |-1327.88-1262.78-1293.39 | 1319.88 1309.58 1307.17
v_i      |    0.00   -0.00   -0.00 |    0.04    0.04    0.05 |   -0.09   -0.10   -0.09 |    0.09    0.09    0.10
norm_rf  |    0.16 |    0.07 |    0.03 |    0.49
norm_vf  |    0.08 |    0.01 |    0.04 |    0.11
gs_f     |    1.52 |    2.26 | 

***** Episode 118705, Mean R = -10.4  Std R = 3.6  Min R = -22.4
PolicyLoss: -0.0216
Policy_Beta: 0.1
Policy_Entropy: 0.187
Policy_KL: 0.000921
Policy_SD: 0.528
Policy_lr_mult: 0.198
Steps: 1.14e+04
TotalSteps: 4.38e+07
VF_0_ExplainedVarNew: 0.988
VF_0_ExplainedVarOld: 0.982
VF_0_Loss : 3.47e-05


ADV1:  -0.001703062024949134 0.005468190598402244 0.07129016658786586 -0.03490051674032629
ADV2:  0.02249584122837901 0.9114197608354718 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.1490   0.8612   4.4448  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0019   0.0012   0.0045   5.4889   2.1784   2.1397
***** Episode 118736, Mean R = -10.9  Std R = 5.3  Min R = -24.9
PolicyLoss: -0.00135
Policy_Beta: 0.1
Policy_Entropy: 0.186
Policy_KL: 0.000887
Policy_SD: 0.535
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 4.38e+07
VF_0_ExplainedVarNew: 0.99
VF_0_ExplainedVarOld: 0.986
VF_0_Loss : 5.02e-05


ADV1:  -0.002369354736736781 0.009865853856416276 

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.6465   0.2367   1.1287  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0022   0.0013   0.0050   5.4889   2.1784   2.1397
***** Episode 118984, Mean R = -11.4  Std R = 5.2  Min R = -29.9
PolicyLoss: -0.0334
Policy_Beta: 0.1
Policy_Entropy: 0.186
Policy_KL: 0.000599
Policy_SD: 0.542
Policy_lr_mult: 0.198
Steps: 1.15e+04
TotalSteps: 4.39e+07
VF_0_ExplainedVarNew: 0.978
VF_0_ExplainedVarOld: 0.976
VF_0_Loss : 0.000109


ADV1:  6.283686253751356e-05 0.005215961444008013 0.029442296822865845 -0.056159702000610434
ADV2:  0.022100085039685663 0.8485458314373714 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.4495   0.6249   3.1998  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0008   0.0005   0.0020   5.4889   2.1784   2.1397
***** Episode 119015, Mean R = -10.0  Std R = 5.7  Min R = -31.6
PolicyLoss: -0.0273
Policy_Beta: 0.1
Policy_Entropy: 0.189
Policy_KL: 0.000

ADV1:  -0.0009881301394899819 0.008215446544733452 0.03354702816300609 -0.06287532862508234
ADV2:  0.03331116611716802 0.8513816849920538 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.9903   1.3388   6.8244  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0011   0.0006   0.0025   5.4889   2.1784   2.1397
***** Episode 119263, Mean R = -11.0  Std R = 5.2  Min R = -24.8
PolicyLoss: -0.03
Policy_Beta: 0.1
Policy_Entropy: 0.187
Policy_KL: 0.00106
Policy_SD: 0.526
Policy_lr_mult: 0.198
Steps: 1.15e+04
TotalSteps: 4.4e+07
VF_0_ExplainedVarNew: 0.972
VF_0_ExplainedVarOld: 0.969
VF_0_Loss : 0.000115


ADV1:  -0.0004895181168705963 0.006876956440649977 0.03378612536105435 -0.05191643773192989
ADV2:  0.021671586635821413 0.8765755869070628 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   3.0132   1.1726   5.5995  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0009   0.0005   0.0019   5.4889   2.1784   2.139

***** Episode 119511, Mean R = -11.0  Std R = 5.5  Min R = -22.2
PolicyLoss: -0.0314
Policy_Beta: 0.1
Policy_Entropy: 0.187
Policy_KL: 0.000794
Policy_SD: 0.526
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 4.41e+07
VF_0_ExplainedVarNew: 0.981
VF_0_ExplainedVarOld: 0.978
VF_0_Loss : 4.49e-05


ADV1:  -0.0015525760033783115 0.007909329601651287 0.03973796033571747 -0.10208320700611151
ADV2:  0.047297538061461905 0.7719957318417503 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.0550   0.8686   4.4040  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0019   0.0012   0.0042   5.4889   2.1784   2.1397
***** Episode 119542, Mean R = -11.6  Std R = 7.1  Min R = -39.8
PolicyLoss: -0.0372
Policy_Beta: 0.1
Policy_Entropy: 0.186
Policy_KL: 0.001
Policy_SD: 0.54
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 4.41e+07
VF_0_ExplainedVarNew: 0.98
VF_0_ExplainedVarOld: 0.975
VF_0_Loss : 5.16e-05


ADV1:  -0.0012857488134607646 0.010125887610792757 0.

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   4.1377   2.8329  11.4467  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0019   0.0011   0.0047   5.4889   2.1784   2.1397
***** Episode 119790, Mean R = -11.3  Std R = 4.6  Min R = -23.2
PolicyLoss: -0.0102
Policy_Beta: 0.1
Policy_Entropy: 0.188
Policy_KL: 0.00111
Policy_SD: 0.531
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 4.42e+07
VF_0_ExplainedVarNew: 0.988
VF_0_ExplainedVarOld: 0.984
VF_0_Loss : 0.00116


ADV1:  0.0005693727664750979 0.005197299830767494 0.04540588831070619 -0.03403566052163809
ADV2:  -0.008513029841811036 0.9122052577772681 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   3.6109   2.2121  10.0381  24.5266  15.5251  10.0673
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0011   0.0006   0.0023   5.4889   2.1784   2.1397
***** Episode 119821, Mean R = -9.8  Std R = 4.0  Min R = -20.6
PolicyLoss: -0.00236
Policy_Beta: 0.1
Policy_Entropy: 0.187
Policy_KL: 0.001
Po

In [6]:
# Save the policy's current parameters by calling policy.save_params with
# `fname` as the name/tag for this run.
# NOTE(review): where and in what format the parameters are written is decided
# inside save_params, which is not visible in this notebook — confirm before
# relying on a particular file location or extension.
# NOTE(review): the tag presumably encodes the experiment configuration and a
# repeat index — confirm against the project's naming convention.
fname = "optimize_WATTVW_FOV-AR=5-RPT3"
policy.save_params(fname)


In [5]:
# Run a batch evaluation of `agent` through env.test_policy_batch with
# test_mode enabled.
# NOTE(review): 5000 is presumably the number of test episodes and print_every
# the reporting interval — confirm against Env.test_policy_batch.
# NOTE(review): the recorded output of this cell ends in KeyboardInterrupt, so
# the evaluation was stopped by hand and no final statistics are shown here.
# NOTE(review): this cell carries execution count 5 while the save cell placed
# before it carries 6, i.e. the cells were last run out of document order;
# re-run top to bottom on a fresh kernel before trusting the saved outputs.
env.test_policy_batch(agent,5000,print_every=100,test_mode=True)

worked 1


KeyboardInterrupt: 