# Test Recurrent Policy with Extreme Parameter Variation 

In [1]:
import numpy as np
import os,sys



sys.path.append('../../../RL_lib/Agents')
sys.path.append('../../../RL_lib/Policies/PPO')
sys.path.append('../../../RL_lib/Policies/Common')
sys.path.append('../../../RL_lib/Utils')
sys.path.append('../../../Env')
sys.path.append('../../../Imaging')


%load_ext autoreload
%load_ext autoreload
%autoreload 2
%matplotlib nbagg
import os
print(os.getcwd())

The autoreload extension is already loaded. To reload it, use:
  %reload_ext autoreload
/Users/briangaudet/Study/Subjects/MachineLearning/Projects/Asteroid_CPO_seeker-master/Experiments/Extended/Optimize_HF


In [2]:
%%html
<style>
/* Let output areas grow with their content, capped at max-height. */
.output_wrapper, .output {
    height:auto !important;
    max-height:1000px;  /* your desired max-height here */
}
/* Remove the drop shadow on scrolling output areas.  The vendor-prefixed
   property needs its leading dash and is listed before the standard one. */
.output_scroll {
    -webkit-box-shadow:none !important;
    box-shadow:none !important;
}
</style>

# Optimize Policy

In [3]:
from env import Env
import env_utils as envu
from dynamics_model import Dynamics_model
from lander_model import Lander_model
from ic_gen import Landing_icgen
import rl_utils
import attitude_utils as attu
import optics_utils as optu
from arch_policy_vf import Arch

from policy_ppo import Policy
from softmax_pd import Softmax_pd as PD
from value_function import Value_function

import policy_nets as policy_nets
import valfunc_nets as valfunc_nets


from agent import Agent


import torch.nn as nn

from flat_constraint import Flat_constraint
from glideslope_constraint import Glideslope_constraint
from rh_constraint import RH_constraint
from no_attitude_constraint import Attitude_constraint
from w_constraint import W_constraint
from reward_attitude import Reward
from asteroid_hfr import Asteroid

from thruster_model_cubesat import Thruster_model

from sensor import Sensor
from seeker import Seeker

# ---- Target body ------------------------------------------------------------
landing_site_range = 0.0
# None means no landing-site override is handed to Asteroid; a fixed site such
# as np.asarray([-250.,0.,0.]) was used here previously.
landing_site = None

asteroid_model = Asteroid(
    landing_site_override=landing_site,
    omega_range=(1e-5, 5e-4),
)

# Attitude parameterization object passed to the seeker and sensor below.
ap = attu.Quaternion_attitude()

# ---- Seeker -----------------------------------------------------------------
C_cb = optu.rotate_optical_axis(0.0, 0.0, np.pi)
r_cb = np.asarray([0, 0, 0])
fov = envu.deg2rad(90)  # presumably a 90 degree field of view -- confirm in env_utils

seeker = Seeker(
    attitude_parameterization=ap,
    C_cb=C_cb,
    r_cb=r_cb,
    radome_slope_bounds=(-0.05, 0.05),
    range_bias=(-0.05, 0.05),
    fov=fov,
    debug=False,
)

# ---- Sensor wrapping the seeker ----------------------------------------------
sensor = Sensor(
    seeker,
    attitude_parameterization=ap,
    use_range=True,
    apf_tau1=300,
    use_dp=False,
    landing_site_range=landing_site_range,
    pool_type='max',
    state_type=Sensor.optflow_state_range_dp1,
)

# Show the tracking function before and after explicitly selecting track_func1.
print(sensor.track_func)
sensor.track_func = sensor.track_func1
print(sensor.track_func)
# Logger handed to both the environment and the agent.
logger = rl_utils.Logger()

# Dynamics and actuator models.
dynamics_model = Dynamics_model(h=2)
thruster_model = Thruster_model(pulsed=True, scale=1.0, offset=0.4)

# Lander built on the asteroid, thruster and sensor models.
lander_model = Lander_model(
    asteroid_model,
    thruster_model,
    attitude_parameterization=ap,
    sensor=sensor,
    landing_site_range=landing_site_range,
    com_range=(-0.10, 0.10),
    attitude_bias=0.05,
    omega_bias=0.05,
)

# Select which of the lander's state functions supplies the agent's observation.
lander_model.get_state_agent = lander_model.get_state_agent_sensor_att_w2

# Network I/O sizes: each of the action_dim action components has
# actions_per_dim logits, so the policy network emits their product.
obs_dim, action_dim, actions_per_dim = 13, 12, 2
logit_dim = actions_per_dim * action_dim

# Passed as recurrent_steps to the policy/value networks and the agent.
recurrent_steps = 60

# Reward shaping coefficients and landing limits.
reward_object = Reward(
    landing_rlimit=2,
    landing_vlimit=0.1,
    tracking_bias=0.01,
    fov_coeff=-50.,
    att_coeff=-0.20,
    tracking_coeff=-0.5,
    magv_coeff=-1.0,
    fuel_coeff=-0.10,
    landing_coeff=10.0,
)

# Constraint objects (constructed in the same order as before).
glideslope_constraint = Glideslope_constraint(gs_limit=-1.0)
# NOTE(review): shape_constraint is not referenced again in the visible part of
# this notebook -- confirm whether it should be passed to Env.
shape_constraint = Flat_constraint()
attitude_constraint = Attitude_constraint(ap)
w_constraint = W_constraint(w_limit=(0.1,) * 3, w_margin=(0.05,) * 3)
rh_constraint = RH_constraint(rh_limit=150)

# Symmetric bound used for the lander_wll / lander_wul limits below.
wi = 0.05

# Initial-condition generator for each episode.
ic_gen = Landing_icgen(
    (800, 1000),
    p_engine_fail=0.5,
    engine_fail_scale=(0.5, 1.0),
    lander_wll=(-wi,) * 3,
    lander_wul=(wi,) * 3,
    attitude_parameterization=ap,
    position_error=(0, np.pi / 4),
    heading_error=(0, np.pi / 8),
    attitude_error=(0, np.pi / 16),
    min_mass=450,
    max_mass=500,
    mag_v=(0.05, 0.1),
    debug=False,
    inertia_uncertainty_diag=10.0,
    inertia_uncertainty_offdiag=1.0,
)

# Environment tying together the IC generator, lander, dynamics, reward and
# constraints.
env = Env(
    ic_gen,
    lander_model,
    dynamics_model,
    logger,
    landing_site_range=landing_site_range,
    debug_done=False,
    reward_object=reward_object,
    glideslope_constraint=glideslope_constraint,
    attitude_constraint=attitude_constraint,
    w_constraint=w_constraint,
    rh_constraint=rh_constraint,
    tf_limit=5000.0,
    print_every=10,
    nav_period=6,
)

# Display the initial-condition generator via its show() method.
env.ic_gen.show()

arch = Arch()

# Recurrent (GRU1) policy network with the Softmax_pd action distribution
# (imported as PD).
policy = Policy(
    policy_nets.GRU1(obs_dim, logit_dim, recurrent_steps=recurrent_steps),
    PD(action_dim, actions_per_dim),
    shuffle=False,
    kl_targ=0.001,
    epochs=20,
    beta=0.1,
    servo_kl=True,
    max_grad_norm=30,
    scale_vector_obs=True,
    init_func=rl_utils.xn_init,
)

# Recurrent (GRU1) value function using the same recurrent_steps as the policy.
value_function = Value_function(
    valfunc_nets.GRU1(obs_dim, recurrent_steps=recurrent_steps),
    scale_obs=True,
    shuffle=False,
    batch_size=9999999,
    max_grad_norm=30,
    verbose=False,
)

# Agent wiring policy, value function, environment and logger together.
agent = Agent(
    arch,
    policy,
    value_function,
    None,
    env,
    logger,
    policy_episodes=30,
    policy_steps=3000,
    gamma1=0.95,
    gamma2=0.995,
    recurrent_steps=recurrent_steps,
    monitor=env.rl_stats,
)

# Long-running training call; presumably the argument is an episode budget --
# confirm against Agent.train.
agent.train(120000)

Quaternion_attitude
Euler321 Attitude
C_cb: 
[[ 1.0000000e+00  0.0000000e+00 -0.0000000e+00]
 [ 0.0000000e+00 -1.0000000e+00  1.2246468e-16]
 [ 0.0000000e+00 -1.2246468e-16 -1.0000000e+00]]
[ 0.0000000e+00 -1.2246468e-16 -1.0000000e+00]
using max  pooling
V4: Output State type:  <function Sensor.optflow_state_range_dp1 at 0x1371e5488>
<bound method Sensor.track_func1 of <sensor.Sensor object at 0x126080748>>
<bound method Sensor.track_func1 of <sensor.Sensor object at 0x126080748>>
6dof dynamics model 
thruster model: 
Inertia Tensor:  [[333.33333333   0.           0.        ]
 [  0.         333.33333333   0.        ]
 [  0.           0.         333.33333333]]
Lander Model: 
Reward_terminal equator
queue fixed
Flat Constraint
Attitude Constraint
Rotational Velocity Constraint
Position Hysterises Constraint


<IPython.core.display.Javascript object>

<IPython.core.display.Javascript object>

<IPython.core.display.Javascript object>

<IPython.core.display.Javascript object>

<IPython.core.display.Javascript object>

<IPython.core.display.Javascript object>

<IPython.core.display.Javascript object>

lander env RHL
Landing_icgen:
[[-1.]
 [ 1.]]
Policy with vectorized sample
	xn_init: layer  Linear(in_features=13, out_features=130, bias=True)
	xn_init: layer  GRUCell(130, 176)
	xn_init: layer  Linear(in_features=176, out_features=240, bias=True)
	xn_init: layer  Linear(in_features=240, out_features=24, bias=True)
Policy: recurrent steps > 1, disabling shuffle
	Test Mode:          False
	Clip Param:         0.1
	Shuffle :           False
	Shuffle by Chunks:  False
	Max Grad Norm:      30
	Recurrent Steps:    60
	Rollout Limit:      1
	Advantage Func:     <advantage_utils.Adv_default object at 0x1392412e8>
	Advantage Norm:     <function Adv_normalizer.apply at 0x136473488>
	PD:                 <softmax_pd.Softmax_pd object at 0x139272cf8>
	Loss Function:      <bound method Policy.calc_loss1 of <policy_ppo.Policy object at 0x139241128>>
Value Funtion
	xn_init: layer  Linear(in_features=13, out_features=130, bias=True)
	xn_init: layer  GRUCell(130, 25)
	xn_init: layer  Linear(in_feature

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0908   0.0137   0.1112   0.1706   0.1185   0.0326
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.1323   0.0499   0.2223   6.6368   2.2852   2.4929
***** Episode 232, Mean R = -248.7  Std R = 118.8  Min R = -614.5
PolicyLoss: -0.0162
Policy_Beta: 0.0667
Policy_Entropy: 0.000338
Policy_KL: 0.00171
Policy_SD: 0.955
Policy_lr_mult: 1
Steps: 4.16e+03
TotalSteps: 2.31e+04
VF_0_ExplainedVarNew: 0.0481
VF_0_ExplainedVarOld: 0.0348
VF_0_Loss : 0.791


ADV1:  0.10459785547816118 0.7741979399083201 0.9317905397950565 -3.7207600916509547
ADV2:  -0.00210972955699054 0.8600819829588422 0.972768306354263 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0949   0.0179   0.1160   0.1706   0.1185   0.0326
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.1509   0.0668   0.2718   6.6368   2.2852   2.4929
***** Episode 263, Mean R = -290.3  Std R = 116.5  Min R = -527.8
PolicyLoss: -0.0272
Policy_Beta: 0.0667
Policy_Entropy: 0.000339
Po

*** RH VIO  CNT:  100
ADV1:  0.055398244378806596 0.4403399680610698 0.6630137868314778 -3.971694825425465
ADV2:  0.03778105678180067 0.7028407378969423 1.3239704794576028 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0631   0.0148   0.0865   0.1929   0.1292   0.0422
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0567   0.0273   0.1207   6.6368   2.2852   2.4929
***** Episode 511, Mean R = -433.3  Std R = 192.2  Min R = -866.0
PolicyLoss: -0.0537
Policy_Beta: 0.0667
Policy_Entropy: 0.000358
Policy_KL: 0.0013
Policy_SD: 0.956
Policy_lr_mult: 1
Steps: 9.9e+03
TotalSteps: 8.63e+04
VF_0_ExplainedVarNew: 0.223
VF_0_ExplainedVarOld: 0.192
VF_0_Loss : 0.192


ADV1:  -0.059338713334235016 0.3975504991163678 1.0014410096614967 -4.070309733637911
ADV2:  0.05469723629728681 0.7128271624576608 2.577041343464021 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0677   0.0216   0.0982   0.1929   0.1292   0.0422
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0631   0.0

***** Episode 759, Mean R = -462.7  Std R = 162.2  Min R = -751.4
PolicyLoss: -0.0404
Policy_Beta: 0.0667
Policy_Entropy: 0.000376
Policy_KL: 0.000983
Policy_SD: 0.955
Policy_lr_mult: 1
Steps: 1.09e+04
TotalSteps: 1.71e+05
VF_0_ExplainedVarNew: 0.458
VF_0_ExplainedVarOld: 0.426
VF_0_Loss : 0.108


ADV1:  -0.008678341446833002 0.2265202295287919 1.5706581449508668 -3.706275672342862
ADV2:  0.024481564437715892 0.800616136110015 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0942   0.0295   0.1505   0.1929   0.1292   0.0422
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0233   0.0078   0.0356   6.6368   2.2852   2.4929
***** Episode 790, Mean R = -504.2  Std R = 164.6  Min R = -936.5
PolicyLoss: -0.0263
Policy_Beta: 0.0667
Policy_Entropy: 0.000382
Policy_KL: 0.000934
Policy_SD: 0.955
Policy_lr_mult: 1
Steps: 1.23e+04
TotalSteps: 1.83e+05
VF_0_ExplainedVarNew: 0.56
VF_0_ExplainedVarOld: 0.523
VF_0_Loss : 0.0678


ADV1:  0.004670805776760575 0.18720475258761113 0.46930

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0917   0.0251   0.1491   0.1929   0.1292   0.0422
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0256   0.0111   0.0506   6.6368   2.2852   2.4929
***** Episode 1038, Mean R = -428.7  Std R = 183.0  Min R = -1026.3
PolicyLoss: -0.0349
Policy_Beta: 0.0667
Policy_Entropy: 0.000392
Policy_KL: 0.000958
Policy_SD: 0.954
Policy_lr_mult: 1
Steps: 1.02e+04
TotalSteps: 2.72e+05
VF_0_ExplainedVarNew: 0.619
VF_0_ExplainedVarOld: 0.6
VF_0_Loss : 0.0651


ADV1:  0.018500421167286868 0.17160929696929308 1.903180686632792 -1.2867001944487515
ADV2:  0.0027601305985034542 0.8309633319220854 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0881   0.0107   0.1075   0.1929   0.1292   0.0422
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0242   0.0101   0.0499   6.6368   2.2852   2.4929
***** Episode 1069, Mean R = -470.8  Std R = 194.8  Min R = -867.4
PolicyLoss: -0.0155
Policy_Beta: 0.0667
Policy_Entropy: 0.000388
Policy_KL: 0.

ADV1:  0.02166605419479835 0.1807659100089284 1.0195194466908772 -1.2875519392124177
ADV2:  0.012858463993422673 0.8505687239562314 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.1140   0.0314   0.1868   0.2810   0.1468   0.0589
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0308   0.0147   0.0691   6.6368   2.2852   2.4929
***** Episode 1317, Mean R = -458.5  Std R = 208.5  Min R = -982.0
PolicyLoss: -0.0285
Policy_Beta: 0.0667
Policy_Entropy: 0.000402
Policy_KL: 0.00111
Policy_SD: 0.953
Policy_lr_mult: 1
Steps: 1.12e+04
TotalSteps: 3.73e+05
VF_0_ExplainedVarNew: 0.693
VF_0_ExplainedVarOld: 0.662
VF_0_Loss : 0.0489


ADV1:  -0.01954149229253297 0.1585797165492669 0.4414117802930553 -1.3777487285956225
ADV2:  0.034215372193230814 0.8490963026069152 2.8146570006665006 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0984   0.0202   0.1457   0.2810   0.1468   0.0589
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0237   0.0116   0.0542   6.6368   2.2852

optical_flow |  0.0000 -0.0000 |  0.0021  0.0021 | -0.0146 -0.0181 |  0.0286  0.0206
v_err    | -0.4481 |  0.1720 | -1.1589 |  0.7669
landing_rewards |    0.00 |    0.00 |    0.00 |    0.00
landing_margin |  858.67 |  281.42 |   87.46 | 1430.65
tracking_rewards | -407.81 |  154.86 | -893.93 | -150.83
steps    |     386 |     142 |     138 |     834
***** Episode 1596, Mean R = -475.2  Std R = 138.1  Min R = -901.1
PolicyLoss: -0.0148
Policy_Beta: 0.0667
Policy_Entropy: 0.000445
Policy_KL: 0.00134
Policy_SD: 0.955
Policy_lr_mult: 1
Steps: 1.24e+04
TotalSteps: 4.82e+05
VF_0_ExplainedVarNew: 0.794
VF_0_ExplainedVarOld: 0.772
VF_0_Loss : 0.0517


ADV1:  0.0007537251928602936 0.15874918689243825 1.3522370131810506 -1.338937284151715
ADV2:  0.019257109983073322 0.8282971026168868 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.1853   0.0546   0.3096   0.3096   0.1853   0.0589
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0201   0.0056   0.0348   6.6368   2.2852   2.4929


w        |   -0.00    0.00   -0.00 |    0.02    0.02    0.02 |   -0.10   -0.08   -0.10 |    0.08    0.09    0.08
a_f      |   -0.05   -0.21 |    0.71    1.80 |   -1.45   -3.13 |    1.34    3.13
w_f      |   -0.00    0.00   -0.00 |    0.02    0.02    0.02 |   -0.08   -0.06   -0.06 |    0.06    0.05    0.05
w_rewards |   -1.09 |    1.06 |   -7.11 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |  -38.55 |   21.01 |  -50.00 |    0.00
theta_cv |    1.39 |    0.67 |    0.00 |    3.13
seeker_angles |    0.04   -0.02 |    0.36    0.34 |   -1.00   -1.00 |    1.00    1.00
cs_angles |  0.0427 -0.0195 |  0.3550  0.3408 | -1.0000 -0.9999 |  1.0000  0.9997
optical_flow |  0.0006 -0.0002 |  0.0030  0.0033 | -0.0245 -0.2183 |  0.0505  0.0487
v_err    | -0.3280 |  0.2079 | -1.2344 |  0.9280
landing_rewards |    0.00 |    0.00 |    0.00 |    0.00
landing_margin |  633.59 |  280.56 |   23.09 | 1228.38
tracking_rewards | -315.54 |  123.60 | -853.74 | -125.94
steps    |     355 |  

attitude |    0.05   -0.00    0.01 |    1.50    0.68    1.74 |   -3.14   -1.57   -3.14 |    3.14    1.56    3.14
w        |   -0.00    0.00    0.00 |    0.02    0.02    0.02 |   -0.09   -0.08   -0.08 |    0.10    0.10    0.09
a_f      |    0.00   -0.02 |    0.66    1.72 |   -1.50   -3.13 |    1.51    3.06
w_f      |   -0.00    0.00    0.00 |    0.02    0.02    0.02 |   -0.06   -0.05   -0.05 |    0.10    0.05    0.06
w_rewards |   -0.55 |    0.60 |   -4.16 |    0.00
w_penalty |   -0.32 |    5.67 | -100.00 |    0.00
fov_penalty |  -43.55 |   16.76 |  -50.00 |    0.00
theta_cv |    1.15 |    0.59 |    0.00 |    3.12
seeker_angles |    0.04   -0.03 |    0.33    0.34 |   -1.00   -1.00 |    1.00    1.00
cs_angles |  0.0444 -0.0324 |  0.3334  0.3441 | -1.0000 -0.9999 |  1.0000  1.0000
optical_flow |  0.0008 -0.0003 |  0.0038  0.0038 | -0.0684 -0.0606 |  0.0418  0.0342
v_err    | -0.1994 |  0.2259 | -0.9664 |  1.0459
landing_rewards |    0.00 |    0.00 |    0.00 |    0.00
landing_margin |  494

attitude |    0.03    0.02   -0.03 |    1.41    0.67    1.82 |   -3.14   -1.56   -3.14 |    3.14    1.56    3.14
w        |   -0.00    0.00    0.00 |    0.02    0.02    0.02 |   -0.09   -0.06   -0.07 |    0.09    0.09    0.09
a_f      |    0.04   -0.15 |    0.67    1.82 |   -1.52   -3.14 |    1.52    3.10
w_f      |   -0.00   -0.00   -0.00 |    0.02    0.02    0.02 |   -0.06   -0.06   -0.05 |    0.05    0.06    0.04
w_rewards |   -0.39 |    0.44 |   -2.47 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |  -47.26 |   11.38 |  -50.00 |    0.00
theta_cv |    0.95 |    0.53 |    0.00 |    3.10
seeker_angles |    0.06   -0.02 |    0.33    0.33 |   -1.00   -1.00 |    1.00    1.00
cs_angles |  0.0566 -0.0224 |  0.3338  0.3318 | -0.9998 -0.9998 |  0.9999  1.0000
optical_flow |  0.0012 -0.0005 |  0.0044  0.0044 | -0.0347 -0.0496 |  0.0818  0.1005
v_err    | -0.1401 |  0.2224 | -1.1599 |  1.1562
landing_rewards |    0.00 |    0.00 |    0.00 |    0.00
landing_margin |  419

attitude |    0.06   -0.01    0.10 |    1.36    0.67    1.92 |   -3.14   -1.57   -3.14 |    3.14    1.56    3.14
w        |   -0.00    0.00    0.00 |    0.02    0.02    0.02 |   -0.09   -0.07   -0.08 |    0.08    0.09    0.09
a_f      |   -0.01    0.10 |    0.66    1.91 |   -1.43   -3.11 |    1.51    3.11
w_f      |   -0.00   -0.00   -0.00 |    0.02    0.02    0.02 |   -0.05   -0.04   -0.04 |    0.05    0.04    0.04
w_rewards |   -0.49 |    0.52 |   -2.52 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |  -46.13 |   13.36 |  -50.00 |    0.00
theta_cv |    0.79 |    0.46 |    0.00 |    3.12
seeker_angles |    0.09   -0.02 |    0.33    0.34 |   -1.00   -1.00 |    1.00    1.00
cs_angles |  0.0860 -0.0205 |  0.3319  0.3409 | -0.9989 -1.0000 |  0.9998  0.9990
optical_flow |  0.0016 -0.0006 |  0.0045  0.0046 | -0.0523 -0.0784 |  0.0740  0.0666
v_err    | -0.0939 |  0.1965 | -1.0119 |  0.7602
landing_rewards |    0.00 |    0.00 |    0.00 |    0.00
landing_margin |  372

w        |   -0.00    0.00    0.00 |    0.02    0.02    0.02 |   -0.09   -0.06   -0.08 |    0.07    0.09    0.09
a_f      |   -0.09    0.01 |    0.66    1.88 |   -1.50   -3.14 |    1.45    3.13
w_f      |   -0.00    0.00   -0.00 |    0.01    0.01    0.02 |   -0.04   -0.04   -0.05 |    0.04    0.04    0.05
w_rewards |   -0.53 |    0.52 |   -2.73 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |  -48.06 |    9.65 |  -50.00 |    0.00
theta_cv |    0.70 |    0.41 |    0.00 |    3.13
seeker_angles |    0.05   -0.02 |    0.33    0.33 |   -1.00   -1.00 |    1.00    1.00
cs_angles |  0.0522 -0.0154 |  0.3305  0.3288 | -0.9998 -0.9999 |  0.9998  0.9997
optical_flow |  0.0013 -0.0006 |  0.0051  0.0051 | -0.1374 -0.2427 |  0.0613  0.0582
v_err    | -0.0743 |  0.1653 | -0.6335 |  0.8150
landing_rewards |    0.00 |    0.00 |    0.00 |    0.00
landing_margin |  328.73 |  152.55 |   10.44 |  821.11
tracking_rewards | -117.23 |   20.17 | -199.00 |  -70.64
steps    |     263 |  

w        |   -0.00    0.00    0.00 |    0.02    0.02    0.02 |   -0.08   -0.05   -0.08 |    0.07    0.10    0.09
a_f      |    0.06    0.09 |    0.65    1.90 |   -1.47   -3.13 |    1.47    3.13
w_f      |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.04   -0.03   -0.04 |    0.04    0.04    0.04
w_rewards |   -0.71 |    0.57 |   -2.74 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |  -47.58 |   10.73 |  -50.00 |    0.00
theta_cv |    0.65 |    0.38 |    0.00 |    3.13
seeker_angles |    0.07   -0.01 |    0.34    0.34 |   -1.00   -1.00 |    1.00    1.00
cs_angles |  0.0708 -0.0083 |  0.3410  0.3418 | -0.9998 -1.0000 |  1.0000  0.9998
optical_flow |  0.0012 -0.0003 |  0.0061  0.0057 | -0.1631 -0.1485 |  0.0815  0.1833
v_err    | -0.0675 |  0.1433 | -0.6312 |  0.6094
landing_rewards |    0.00 |    0.00 |    0.00 |    0.00
landing_margin |  297.40 |  154.03 |   15.13 |  698.95
tracking_rewards | -110.33 |   21.97 | -203.08 |  -72.42
steps    |     270 |  

norm_wf  |    0.02 |    0.01 |    0.00 |    0.06
rh_penalty |    0.00 |    0.00 |    0.00 |    0.00
att_rewards |    0.00 |    0.00 |    0.00 |    0.00
att_penalty |    0.00 |    0.00 |    0.00 |    0.00
attitude |   -0.05    0.02   -0.22 |    1.25    0.66    1.85 |   -3.14   -1.56   -3.14 |    3.14    1.56    3.14
w        |   -0.00    0.00    0.00 |    0.02    0.02    0.02 |   -0.09   -0.06   -0.08 |    0.06    0.10    0.10
a_f      |    0.02   -0.18 |    0.66    1.84 |   -1.41   -3.14 |    1.51    3.14
w_f      |    0.00   -0.00    0.00 |    0.01    0.01    0.01 |   -0.04   -0.04   -0.03 |    0.05    0.04    0.03
w_rewards |   -0.86 |    0.59 |   -2.72 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |  -47.90 |   10.02 |  -50.00 |    0.00
theta_cv |    0.61 |    0.37 |    0.00 |    3.09
seeker_angles |    0.04    0.02 |    0.34    0.34 |   -1.00   -1.00 |    1.00    1.00
cs_angles |  0.0392  0.0219 |  0.3388  0.3399 | -0.9997 -0.9989 |  1.0000  0.9998
optical

attitude |   -0.11   -0.04    0.15 |    1.26    0.68    1.82 |   -3.14   -1.57   -3.14 |    3.14    1.57    3.14
w        |   -0.00    0.00    0.00 |    0.02    0.02    0.01 |   -0.10   -0.06   -0.07 |    0.05    0.10    0.10
a_f      |   -0.04    0.15 |    0.70    1.81 |   -1.55   -3.11 |    1.43    3.11
w_f      |    0.00   -0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.03   -0.03 |    0.04    0.10    0.04
w_rewards |   -0.82 |    0.51 |   -2.84 |    0.00
w_penalty |   -0.32 |    5.67 | -100.00 |    0.00
fov_penalty |  -48.87 |    7.43 |  -50.00 |    0.00
theta_cv |    0.59 |    0.36 |    0.00 |    3.13
seeker_angles |   -0.00    0.03 |    0.32    0.32 |   -1.00   -1.00 |    1.00    1.00
cs_angles | -0.0039  0.0298 |  0.3224  0.3234 | -0.9999 -0.9997 |  0.9998  1.0000
optical_flow |  0.0003  0.0006 |  0.0071  0.0068 | -0.0886 -0.1936 |  0.1355  0.2167
v_err    | -0.0416 |  0.1284 | -0.5661 |  0.5845
landing_rewards |    0.00 |    0.00 |    0.00 |    0.00
landing_margin |  223

w        |   -0.00    0.00    0.00 |    0.01    0.02    0.01 |   -0.10   -0.05   -0.08 |    0.07    0.10    0.10
a_f      |   -0.00   -0.03 |    0.63    1.79 |   -1.39   -3.13 |    1.47    3.10
w_f      |   -0.00    0.00   -0.00 |    0.02    0.01    0.01 |   -0.10   -0.04   -0.03 |    0.04    0.10    0.03
w_rewards |   -0.85 |    0.54 |   -2.47 |   -0.01
w_penalty |   -0.65 |    8.01 | -100.00 |    0.00
fov_penalty |  -48.71 |    7.93 |  -50.00 |    0.00
theta_cv |    0.59 |    0.36 |    0.00 |    3.13
seeker_angles |   -0.01    0.01 |    0.31    0.33 |   -1.00   -1.00 |    1.00    1.00
cs_angles | -0.0102  0.0122 |  0.3128  0.3259 | -0.9997 -1.0000 |  1.0000  1.0000
optical_flow |  0.0004  0.0004 |  0.0085  0.0086 | -0.2747 -0.2655 |  0.2549  0.1750
v_err    | -0.0384 |  0.1221 | -0.5590 |  0.5934
landing_rewards |    0.00 |    0.00 |    0.00 |    0.00
landing_margin |  198.47 |  139.49 |   10.54 |  981.25
tracking_rewards |  -95.78 |   18.80 | -152.25 |  -10.30
steps    |     288 |  

w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.09   -0.06   -0.07 |    0.07    0.10    0.09
a_f      |   -0.00   -0.08 |    0.68    1.77 |   -1.44   -3.14 |    1.44    3.13
w_f      |    0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.05   -0.03   -0.04 |    0.04    0.03    0.04
w_rewards |   -0.83 |    0.48 |   -2.74 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |  -48.71 |    7.93 |  -50.00 |    0.00
theta_cv |    0.60 |    0.36 |    0.00 |    3.12
seeker_angles |   -0.01    0.01 |    0.31    0.32 |   -1.00   -1.00 |    1.00    1.00
cs_angles | -0.0099  0.0117 |  0.3133  0.3231 | -0.9993 -0.9996 |  0.9998  1.0000
optical_flow |  0.0004  0.0005 |  0.0087  0.0086 | -0.3000 -0.4492 |  0.1043  0.1527
v_err    | -0.0358 |  0.1163 | -0.5999 |  0.7369
landing_rewards |    0.00 |    0.00 |    0.00 |    0.00
landing_margin |  185.47 |  122.67 |    0.06 |  623.32
tracking_rewards |  -93.57 |   18.34 | -160.24 |  -53.55
steps    |     292 |  

w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.09   -0.05   -0.06 |    0.06    0.10    0.10
a_f      |   -0.02   -0.05 |    0.71    1.87 |   -1.44   -3.13 |    1.50    3.14
w_f      |   -0.00   -0.00    0.00 |    0.01    0.01    0.01 |   -0.04   -0.03   -0.03 |    0.03    0.03    0.03
w_rewards |   -0.88 |    0.52 |   -2.34 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |  -45.81 |   13.86 |  -50.00 |    0.00
theta_cv |    0.61 |    0.36 |    0.00 |    3.12
seeker_angles |   -0.01   -0.02 |    0.31    0.32 |   -1.00   -1.00 |    1.00    1.00
cs_angles | -0.0091 -0.0203 |  0.3105  0.3173 | -0.9997 -0.9999 |  0.9998  1.0000
optical_flow | -0.0002  0.0003 |  0.0092  0.0094 | -0.2937 -0.1773 |  0.3369  0.3982
v_err    | -0.0315 |  0.1106 | -0.5304 |  0.9881
landing_rewards |    0.00 |    0.00 |    0.00 |    0.00
landing_margin |  167.43 |  122.04 |    5.72 |  554.32
tracking_rewards |  -92.97 |   18.60 | -162.62 |  -57.72
steps    |     301 |  

w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.09   -0.05   -0.08 |    0.06    0.10    0.10
a_f      |    0.03   -0.07 |    0.66    1.91 |   -1.44   -3.12 |    1.42    3.14
w_f      |    0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.03   -0.03 |    0.03    0.10    0.03
w_rewards |   -0.91 |    0.56 |   -3.07 |   -0.02
w_penalty |   -0.32 |    5.67 | -100.00 |    0.00
fov_penalty |  -45.65 |   14.10 |  -50.00 |    0.00
theta_cv |    0.63 |    0.37 |    0.00 |    3.13
seeker_angles |   -0.00   -0.02 |    0.31    0.32 |   -1.00   -1.00 |    1.00    1.00
cs_angles | -0.0016 -0.0226 |  0.3090  0.3216 | -1.0000 -0.9999 |  0.9998  0.9997
optical_flow | -0.0000  0.0004 |  0.0101  0.0099 | -0.1591 -0.2314 |  0.2309  0.1241
v_err    | -0.0315 |  0.1047 | -0.5032 |  0.5823
landing_rewards |    0.00 |    0.00 |    0.00 |    0.00
landing_margin |  161.20 |  126.79 |   13.64 |  962.44
tracking_rewards |  -91.94 |   17.20 | -139.25 |  -11.75
steps    |     303 |  

w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.09   -0.05   -0.07 |    0.06    0.10    0.10
a_f      |    0.06    0.29 |    0.64    1.90 |   -1.40   -3.13 |    1.45    3.14
w_f      |    0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.03   -0.03 |    0.04    0.05    0.10
w_rewards |   -0.93 |    0.55 |   -3.23 |    0.00
w_penalty |   -0.32 |    5.67 | -100.00 |    0.00
fov_penalty |  -44.35 |   15.82 |  -50.00 |    0.00
theta_cv |    0.61 |    0.36 |    0.00 |    3.14
seeker_angles |   -0.01   -0.02 |    0.31    0.32 |   -1.00   -1.00 |    1.00    1.00
cs_angles | -0.0060 -0.0240 |  0.3099  0.3164 | -1.0000 -0.9999 |  0.9998  1.0000
optical_flow | -0.0004  0.0003 |  0.0104  0.0113 | -0.1980 -0.8099 |  0.4472  0.3518
v_err    | -0.0278 |  0.1032 | -0.6588 |  0.7176
landing_rewards |    0.00 |    0.00 |    0.00 |    0.00
landing_margin |  143.38 |  115.53 |    3.10 |  903.08
tracking_rewards |  -91.63 |   19.35 | -162.95 |   -7.84
steps    |     309 |  

attitude |    0.05   -0.01   -0.08 |    1.26    0.68    1.87 |   -3.14   -1.57   -3.14 |    3.14    1.57    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.09   -0.05   -0.05 |    0.06    0.10    0.10
a_f      |   -0.04   -0.05 |    0.68    1.85 |   -1.53   -3.14 |    1.45    3.11
w_f      |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.03   -0.03 |    0.03    0.10    0.10
w_rewards |   -0.92 |    0.54 |   -2.81 |   -0.01
w_penalty |   -0.97 |    9.79 | -100.00 |    0.00
fov_penalty |  -45.81 |   13.86 |  -50.00 |    0.00
theta_cv |    0.62 |    0.35 |    0.00 |    3.13
seeker_angles |    0.00   -0.03 |    0.31    0.31 |   -1.00   -1.00 |    1.00    1.00
cs_angles |  0.0030 -0.0259 |  0.3103  0.3064 | -0.9999 -0.9995 |  0.9999  0.9997
optical_flow | -0.0001  0.0001 |  0.0116  0.0105 | -0.2354 -0.2347 |  0.8362  0.3230
v_err    | -0.0267 |  0.0965 | -0.5157 |  0.6759
landing_rewards |    0.00 |    0.00 |    0.00 |    0.00
landing_margin |  143

w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.09   -0.05   -0.07 |    0.09    0.10    0.10
a_f      |   -0.01    0.13 |    0.62    1.84 |   -1.45   -3.12 |    1.48    3.14
w_f      |    0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.03   -0.03 |    0.09    0.04    0.03
w_rewards |   -0.92 |    0.52 |   -4.44 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |  -45.65 |   14.10 |  -50.00 |    0.00
theta_cv |    0.62 |    0.35 |    0.00 |    3.10
seeker_angles |    0.00    0.01 |    0.31    0.30 |   -1.00   -1.00 |    1.00    1.00
cs_angles |  0.0030  0.0112 |  0.3111  0.3003 | -0.9999 -1.0000 |  0.9994  0.9995
optical_flow |  0.0001 -0.0001 |  0.0117  0.0110 | -0.5524 -0.3602 |  0.2340  0.2185
v_err    | -0.0248 |  0.0967 | -0.5038 |  0.7298
landing_rewards |    0.00 |    0.00 |    0.00 |    0.00
landing_margin |  132.10 |  102.26 |    1.00 |  456.88
tracking_rewards |  -87.41 |   17.36 | -140.48 |  -54.27
steps    |     308 |  

attitude |   -0.07    0.01   -0.01 |    1.30    0.69    1.89 |   -3.14   -1.56   -3.14 |    3.14    1.56    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.10   -0.05   -0.05 |    0.05    0.09    0.09
a_f      |    0.01   -0.08 |    0.70    1.89 |   -1.34   -3.13 |    1.48    3.13
w_f      |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.04   -0.03 |    0.04    0.03    0.04
w_rewards |   -0.89 |    0.48 |   -2.33 |   -0.01
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |  -42.58 |   17.77 |  -50.00 |    0.00
theta_cv |    0.62 |    0.35 |    0.00 |    3.03
seeker_angles |    0.01    0.02 |    0.31    0.31 |   -1.00   -1.00 |    1.00    1.00
cs_angles |  0.0136  0.0162 |  0.3064  0.3104 | -0.9997 -0.9995 |  0.9998  1.0000
optical_flow | -0.0000  0.0001 |  0.0124  0.0120 | -0.5573 -1.0613 |  1.0373  0.3945
v_err    | -0.0208 |  0.0948 | -0.6266 |  0.8058
landing_rewards |    0.00 |    0.00 |    0.00 |    0.00
landing_margin |  130

thrust   |   -0.00   -0.00    0.00 |    0.99    1.00    1.00 |   -3.37   -3.41   -3.43 |    3.44    3.43    3.45
norm_thrust |    1.58 |    0.68 |    0.00 |    3.46
fuel     |    4.40 |    0.68 |    0.19 |    5.55
rewards  | -147.23 |   21.48 | -230.79 |  -69.43
fuel_rewards |  -12.60 |    1.94 |  -15.87 |   -0.56
glideslope_rewards |    0.00 |    0.00 |    0.00 |    0.00
glideslope_penalty |    0.00 |    0.00 |    0.00 |    0.00
glideslope |    3.59 |   15.49 |    0.01 |  149.95
norm_af  |    1.75 |    0.88 |    0.01 |    3.28
norm_wf  |    0.02 |    0.01 |    0.00 |    0.11
rh_penalty |    0.00 |    0.00 |    0.00 |    0.00
att_rewards |    0.00 |    0.00 |    0.00 |    0.00
att_penalty |    0.00 |    0.00 |    0.00 |    0.00
attitude |   -0.03    0.06   -0.00 |    1.23    0.68    1.86 |   -3.14   -1.57   -3.14 |    3.14    1.57    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.10   -0.05   -0.05 |    0.05    0.10    0.10
a_f      |    0.07   -0.04 |    0.67

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.3338   0.0912   0.5478   0.9962   0.5001   0.2145
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0217   0.0092   0.0450   6.6368   2.2852   2.4929
Update Cnt = 230    ET =   1065.7   Stats:  Mean, Std, Min, Max
r_f      |  -14.18   22.36    3.43 |  229.13  217.00  246.16 | -718.44 -539.44 -750.78 |  496.03  592.92  600.36
v_f      |    0.01   -0.04   -0.01 |    0.31    0.30    0.30 |   -0.73   -0.87   -0.72 |    0.98    1.04    0.88
r_i      |  -48.18   92.10   17.10 |  684.39  674.72  739.38 |-1337.39-1348.37-1338.64 | 1260.38 1313.13 1358.83
v_i      |    0.00   -0.01   -0.00 |    0.04    0.04    0.05 |   -0.09   -0.09   -0.10 |    0.10    0.10    0.10
norm_rf  |  103.63 |   95.37 |    1.43 |  500.40
norm_vf  |    0.49 |    0.19 |    0.12 |    1.22
gs_f     |    0.98 |    1.22 |    0.04 |   11.76
thrust   |    0.01   -0.01    0.00 |    1.00    1.00    0.99 |   -3.43   -3.43   -3.46 |    3.28    3.30    3.41
norm_thrust |    1

ADV1:  -0.00641533490189037 0.169146862289554 2.2681173356374105 -1.709478051662447
ADV2:  0.003965137899140981 0.7219301075335364 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.3353   0.0659   0.5288   1.1842   0.6387   0.2251
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0206   0.0047   0.0326   6.6368   2.2852   2.4929
***** Episode 7455, Mean R = -151.3  Std R = 18.8  Min R = -189.7
PolicyLoss: -0.00382
Policy_Beta: 0.0667
Policy_Entropy: 0.00501
Policy_KL: 0.00112
Policy_SD: 0.942
Policy_lr_mult: 1
Steps: 9.87e+03
TotalSteps: 2.23e+06
VF_0_ExplainedVarNew: 0.87
VF_0_ExplainedVarOld: 0.817
VF_0_Loss : 0.0588


ADV1:  0.018905628778476534 0.13920397420099512 2.262232360839844 -1.049866060215931
ADV2:  -0.018892078246493686 0.7095125998290405 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.3772   0.1475   0.8975   1.1842   0.6387   0.2251
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0311   0.0136   0.0643   6.6368   2.2852   2.4929
Update C

ADV1:  0.010484767886122336 0.1887585741334534 2.4496281719207764 -1.1819759321212788
ADV2:  -0.019605344457098006 0.745136993457199 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.4018   0.1549   0.7751   1.3823   0.6387   0.2634
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0216   0.0088   0.0432   6.6368   2.2852   2.4929
***** Episode 7734, Mean R = -141.3  Std R = 23.1  Min R = -182.1
PolicyLoss: 0.0126
Policy_Beta: 0.0667
Policy_Entropy: 0.0051
Policy_KL: 0.00099
Policy_SD: 0.939
Policy_lr_mult: 1
Steps: 1.04e+04
TotalSteps: 2.32e+06
VF_0_ExplainedVarNew: 0.803
VF_0_ExplainedVarOld: 0.745
VF_0_Loss : 0.063


ADV1:  -0.0055900814772537055 0.15577895678443526 1.7917086304066356 -1.2853276671561762
ADV2:  -0.01031039148292071 0.7451211152025404 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.4730   0.1435   0.7630   1.3823   0.6387   0.2634
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0216   0.0092   0.0449   6.6368   2.2852   2.4929
***** 

ADV1:  0.025403872016662388 0.23441140398529148 2.311352071762085 -1.4192871973408239
ADV2:  -0.04665392030917327 0.7176984080778266 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.4099   0.1452   0.7990   1.3823   0.6387   0.2634
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0290   0.0195   0.0841   6.6368   2.2852   2.4929
***** Episode 8013, Mean R = -137.9  Std R = 29.1  Min R = -191.5
PolicyLoss: 0.0364
Policy_Beta: 0.0667
Policy_Entropy: 0.0054
Policy_KL: 0.000869
Policy_SD: 0.938
Policy_lr_mult: 1
Steps: 1.04e+04
TotalSteps: 2.41e+06
VF_0_ExplainedVarNew: 0.701
VF_0_ExplainedVarOld: 0.568
VF_0_Loss : 0.0761


ADV1:  0.029207174097449502 0.22426772102676765 2.1168439640230994 -1.5676143773396833
ADV2:  -0.036384749752993176 0.751900903708574 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.6699   0.2306   1.2650   1.3823   0.6699   0.2634
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0418   0.0223   0.1089   6.6368   2.2852   2.4929
***** 

Dynamics: Max Disturbance (m/s^2):  [0.00118519 0.00130788 0.00135945] 0.0022278467605863807
ADV1:  7.364075673127681e-05 0.18893543113154385 2.24760085105896 -1.5847313427925132
ADV2:  -0.020603695729163873 0.7216059519748661 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.4491   0.1520   0.8422   1.4274   0.7253   0.3144
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0168   0.0060   0.0279   6.6368   2.2852   2.4929
***** Episode 8292, Mean R = -127.3  Std R = 31.0  Min R = -188.2
PolicyLoss: 0.0193
Policy_Beta: 0.0667
Policy_Entropy: 0.00551
Policy_KL: 0.00123
Policy_SD: 0.938
Policy_lr_mult: 1
Steps: 1.03e+04
TotalSteps: 2.5e+06
VF_0_ExplainedVarNew: 0.771
VF_0_ExplainedVarOld: 0.712
VF_0_Loss : 0.0704


ADV1:  0.02561687328944146 0.2382079985448424 2.3365447025293027 -1.5809906442960124
ADV2:  -0.040559603760850695 0.7050229185481874 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.2857   0.1167   0.5271   1.4274   0.7253   0.3144
ValFun  Gradients

Dynamics: Max Disturbance (m/s^2):  [0.00118519 0.00130788 0.00135945] 0.0022278467605863807
ADV1:  0.0118228817806753 0.207195700166509 1.9730855450549096 -1.3475920878645105
ADV2:  -0.031580643857914634 0.7368984059918415 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.2492   0.0671   0.3805   1.4274   0.7253   0.3144
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0199   0.0068   0.0367   6.6368   2.2852   2.4929
***** Episode 8571, Mean R = -125.8  Std R = 26.2  Min R = -163.0
PolicyLoss: 0.0257
Policy_Beta: 0.0667
Policy_Entropy: 0.00569
Policy_KL: 0.00112
Policy_SD: 0.936
Policy_lr_mult: 1
Steps: 1.04e+04
TotalSteps: 2.6e+06
VF_0_ExplainedVarNew: 0.667
VF_0_ExplainedVarOld: 0.618
VF_0_Loss : 0.0691


ADV1:  -0.030702873890737677 0.1977632248461635 2.2114568328857422 -1.813979180653892
ADV2:  0.024474138521378058 0.7160387904305299 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.3828   0.1263   0.7466   1.4274   0.7253   0.3144
ValFun  Gradients: u

ADV1:  0.009746857184375575 0.17449315657148864 2.009087619781494 -1.6132877196077469
ADV2:  -0.024423003832797663 0.7253640668583569 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.5892   0.2057   1.0909   1.4274   0.7253   0.3144
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0193   0.0079   0.0389   6.6368   2.2852   2.4929
***** Episode 8850, Mean R = -139.4  Std R = 26.4  Min R = -185.9
PolicyLoss: 0.0175
Policy_Beta: 0.0667
Policy_Entropy: 0.00604
Policy_KL: 0.000905
Policy_SD: 0.936
Policy_lr_mult: 1
Steps: 1.06e+04
TotalSteps: 2.69e+06
VF_0_ExplainedVarNew: 0.812
VF_0_ExplainedVarOld: 0.777
VF_0_Loss : 0.0698


Dynamics: Max Disturbance (m/s^2):  [0.00118519 0.00130788 0.00135945] 0.0022278467605863807
ADV1:  0.030117566937904346 0.19861660924416366 2.2832967109855065 -1.259314479827883
ADV2:  -0.05534236080363703 0.6636809612138301 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.4801   0.1930   0.9881   1.4274   0.7253   0.3144
ValFun  Gradien

ADV1:  0.025147226957496473 0.2382640808816443 2.055839595794678 -1.7324181811014832
ADV2:  -0.03161382350064047 0.731986117447147 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.4687   0.1375   0.7589   1.4274   0.7253   0.3144
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0413   0.0214   0.1112   6.6368   2.2852   2.4929
***** Episode 9129, Mean R = -133.5  Std R = 31.7  Min R = -192.2
PolicyLoss: 0.0209
Policy_Beta: 0.0667
Policy_Entropy: 0.00665
Policy_KL: 0.00103
Policy_SD: 0.934
Policy_lr_mult: 1
Steps: 1.08e+04
TotalSteps: 2.79e+06
VF_0_ExplainedVarNew: 0.621
VF_0_ExplainedVarOld: 0.5
VF_0_Loss : 0.0796


Dynamics: Max Disturbance (m/s^2):  [0.00118519 0.00130788 0.00135945] 0.0022278467605863807
ADV1:  0.02619004784153367 0.21599381058985864 2.212460345952239 -1.6237884173684778
ADV2:  -0.03463528617253252 0.7291091478809021 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.3627   0.1043   0.5191   1.4274   0.7253   0.3144
ValFun  Gradients: u/s

ADV1:  0.005562740173939579 0.20862519695605528 1.7386910009384156 -1.943034381866457
ADV2:  0.005284379931116274 0.7377512599472135 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.5261   0.1946   1.1708   1.4274   0.7253   0.3144
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0258   0.0069   0.0378   6.6368   2.2852   2.4929
***** Episode 9408, Mean R = -128.9  Std R = 33.4  Min R = -170.8
PolicyLoss: -0.0119
Policy_Beta: 0.0667
Policy_Entropy: 0.00703
Policy_KL: 0.0011
Policy_SD: 0.936
Policy_lr_mult: 1
Steps: 1.04e+04
TotalSteps: 2.89e+06
VF_0_ExplainedVarNew: 0.766
VF_0_ExplainedVarOld: 0.647
VF_0_Loss : 0.0616


ADV1:  0.007441703514404279 0.18065707891669322 1.7741831297054926 -1.940465898513796
ADV2:  0.0066740011385206886 0.7504929563734792 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.4189   0.1490   0.8492   1.4274   0.7253   0.3144
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0228   0.0070   0.0401   6.6368   2.2852   2.4929
***** 

ADV1:  -0.013647135018993022 0.23239745386928218 2.0279667059580486 -4.671266507054404
ADV2:  0.023713905050967356 0.6936254377075295 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.4174   0.1106   0.7272   1.4274   0.7253   0.3144
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0320   0.0126   0.0549   6.6368   2.2852   2.4929
***** Episode 9687, Mean R = -117.3  Std R = 34.1  Min R = -180.6
PolicyLoss: -0.024
Policy_Beta: 0.0667
Policy_Entropy: 0.0072
Policy_KL: 0.00124
Policy_SD: 0.931
Policy_lr_mult: 1
Steps: 1.07e+04
TotalSteps: 2.98e+06
VF_0_ExplainedVarNew: 0.545
VF_0_ExplainedVarOld: 0.48
VF_0_Loss : 0.0663


ADV1:  -0.018564814141977755 0.20741790465241336 1.394520370165507 -1.9308984267128007
ADV2:  0.032599922298160916 0.7609464388973753 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.4694   0.1807   0.8229   1.4274   0.7253   0.3144
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0356   0.0149   0.0657   6.6368   2.2852   2.4929
***** E

theta_cv |    0.57 |    0.32 |    0.00 |    3.04
seeker_angles |   -0.00    0.02 |    0.26    0.27 |   -1.00   -1.00 |    1.00    1.00
cs_angles | -0.0002  0.0203 |  0.2579  0.2719 | -0.9994 -0.9997 |  0.9993  0.9990
optical_flow |  0.0002  0.0001 |  0.0208  0.0211 | -1.0087 -1.2429 |  0.9478  0.9696
v_err    | -0.0145 |  0.0757 | -0.5131 |  0.7228
landing_rewards |    0.90 |    2.87 |    0.00 |   10.00
landing_margin |   32.02 |   76.84 |   -0.06 |  869.80
tracking_rewards |  -80.41 |   18.19 | -131.81 |   -9.57
steps    |     350 |      38 |      14 |     411
***** Episode 9966, Mean R = -123.1  Std R = 42.2  Min R = -211.3
PolicyLoss: -0.0212
Policy_Beta: 0.0667
Policy_Entropy: 0.00797
Policy_KL: 0.00104
Policy_SD: 0.931
Policy_lr_mult: 1
Steps: 1.07e+04
TotalSteps: 3.08e+06
VF_0_ExplainedVarNew: 0.721
VF_0_ExplainedVarOld: 0.588
VF_0_Loss : 0.05


ADV1:  0.00025012557646569166 0.1940225640783589 2.4352410411834717 -2.002643139362337
ADV2:  0.021547348780088862 0.7139464835673538 3.

w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.09   -0.05   -0.05 |    0.06    0.08    0.08
a_f      |    0.00   -0.24 |    0.69    1.78 |   -1.48   -3.13 |    1.52    3.14
w_f      |    0.00    0.00    0.00 |    0.01    0.02    0.02 |   -0.03   -0.04   -0.05 |    0.03    0.06    0.06
w_rewards |   -0.65 |    0.38 |   -1.72 |   -0.02
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |  -22.42 |   24.87 |  -50.00 |    0.00
theta_cv |    0.56 |    0.30 |    0.00 |    2.90
seeker_angles |   -0.00    0.01 |    0.24    0.26 |   -1.00   -1.00 |    1.00    1.00
cs_angles | -0.0020  0.0097 |  0.2373  0.2612 | -0.9994 -0.9995 |  0.9996  1.0000
optical_flow |  0.0002  0.0003 |  0.0190  0.0232 | -0.8688 -1.0576 |  0.8541  0.7853
v_err    | -0.0130 |  0.0728 | -0.4999 |  0.5106
landing_rewards |    1.39 |    3.46 |    0.00 |   10.00
landing_margin |   25.90 |   65.57 |   -0.06 |  418.48
tracking_rewards |  -78.19 |   16.73 | -145.13 |  -44.12
steps    |     356 |  

w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.10   -0.05   -0.06 |    0.06    0.09    0.09
a_f      |   -0.01   -0.03 |    0.71    1.75 |   -1.45   -3.10 |    1.49    3.12
w_f      |    0.00   -0.00   -0.00 |    0.01    0.02    0.02 |   -0.04   -0.05   -0.06 |    0.03    0.05    0.05
w_rewards |   -0.74 |    0.52 |   -3.20 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |  -21.13 |   24.70 |  -50.00 |    0.00
theta_cv |    0.55 |    0.29 |    0.00 |    3.08
seeker_angles |   -0.01    0.01 |    0.23    0.25 |   -1.00   -1.00 |    1.00    1.00
cs_angles | -0.0085  0.0055 |  0.2323  0.2473 | -0.9977 -0.9997 |  0.9998  0.9995
optical_flow |  0.0001  0.0003 |  0.0209  0.0243 | -0.9653 -1.4082 |  0.7858  0.8480
v_err    | -0.0125 |  0.0726 | -0.4997 |  0.5004
landing_rewards |    1.81 |    3.85 |    0.00 |   10.00
landing_margin |   14.94 |   43.94 |   -0.08 |  346.80
tracking_rewards |  -76.27 |   16.51 | -120.74 |  -41.36
steps    |     359 |  

attitude |   -0.02    0.05   -0.06 |    1.34    0.66    1.92 |   -3.14   -1.56   -3.14 |    3.14    1.57    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.10   -0.05   -0.05 |    0.06    0.09    0.09
a_f      |    0.06   -0.07 |    0.66    1.85 |   -1.50   -3.13 |    1.50    3.12
w_f      |    0.00    0.00    0.00 |    0.01    0.02    0.02 |   -0.04   -0.05   -0.05 |    0.04    0.04    0.05
w_rewards |   -0.71 |    0.45 |   -2.32 |   -0.01
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |  -14.68 |   22.77 |  -50.00 |    0.00
theta_cv |    0.54 |    0.29 |    0.00 |    2.97
seeker_angles |   -0.02    0.01 |    0.22    0.24 |   -1.00   -1.00 |    1.00    1.00
cs_angles | -0.0161  0.0114 |  0.2209  0.2362 | -1.0000 -0.9990 |  0.9982  0.9987
optical_flow |  0.0001  0.0003 |  0.0224  0.0255 | -0.8161 -1.5546 |  1.2931  1.1061
v_err    | -0.0115 |  0.0716 | -0.5375 |  0.4626
landing_rewards |    2.42 |    4.28 |    0.00 |   10.00
landing_margin |    8

attitude |    0.02    0.02   -0.02 |    1.18    0.67    1.86 |   -3.14   -1.57   -3.14 |    3.14    1.57    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.09   -0.05   -0.06 |    0.05    0.10    0.09
a_f      |    0.05   -0.15 |    0.69    1.84 |   -1.53   -3.13 |    1.45    3.12
w_f      |    0.00    0.00    0.00 |    0.01    0.02    0.02 |   -0.03   -0.05   -0.04 |    0.04    0.07    0.05
w_rewards |   -0.66 |    0.48 |   -2.50 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |  -10.81 |   20.58 |  -50.00 |    0.00
theta_cv |    0.51 |    0.29 |    0.00 |    2.83
seeker_angles |   -0.02   -0.00 |    0.20    0.22 |   -0.99   -1.00 |    0.99    1.00
cs_angles | -0.0242 -0.0040 |  0.1995  0.2232 | -0.9936 -1.0000 |  0.9924  0.9997
optical_flow |  0.0003  0.0001 |  0.0223  0.0252 | -0.6963 -1.0827 |  0.8997  1.0042
v_err    | -0.0099 |  0.0710 | -0.4801 |  0.3387
landing_rewards |    3.42 |    4.74 |    0.00 |   10.00
landing_margin |    4

w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.08   -0.05   -0.06 |    0.07    0.09    0.08
a_f      |    0.00    0.12 |    0.64    1.83 |   -1.38   -3.13 |    1.48    3.13
w_f      |    0.00   -0.00   -0.00 |    0.01    0.02    0.02 |   -0.03   -0.05   -0.06 |    0.04    0.06    0.05
w_rewards |   -0.62 |    0.44 |   -2.11 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |   -8.23 |   18.54 |  -50.00 |    0.00
theta_cv |    0.49 |    0.29 |    0.00 |    2.93
seeker_angles |   -0.02    0.01 |    0.20    0.20 |   -1.00   -0.98 |    1.00    1.00
cs_angles | -0.0153  0.0121 |  0.1957  0.2024 | -0.9975 -0.9843 |  0.9957  0.9981
optical_flow |  0.0002  0.0005 |  0.0244  0.0265 | -1.1731 -1.2027 |  1.0373  1.4992
v_err    | -0.0089 |  0.0696 | -0.5002 |  0.4787
landing_rewards |    4.03 |    4.91 |    0.00 |   10.00
landing_margin |    3.65 |   22.37 |   -0.08 |  382.73
tracking_rewards |  -66.65 |   17.15 | -125.45 |  -36.87
steps    |     367 |  

w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.10   -0.05   -0.05 |    0.06    0.09    0.08
a_f      |   -0.02    0.05 |    0.64    1.90 |   -1.51   -3.12 |    1.25    3.14
w_f      |    0.00   -0.00    0.00 |    0.01    0.02    0.02 |   -0.03   -0.04   -0.05 |    0.04    0.05    0.05
w_rewards |   -0.67 |    0.44 |   -2.01 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |   -3.87 |   13.36 |  -50.00 |    0.00
theta_cv |    0.48 |    0.29 |    0.00 |    2.79
seeker_angles |   -0.02    0.01 |    0.17    0.20 |   -1.00   -1.00 |    1.00    1.00
cs_angles | -0.0170  0.0058 |  0.1746  0.1990 | -0.9979 -0.9976 |  0.9997  0.9975
optical_flow |  0.0005  0.0005 |  0.0249  0.0254 | -1.0709 -0.8320 |  1.2411  1.2622
v_err    | -0.0087 |  0.0695 | -0.5011 |  0.5065
landing_rewards |    4.35 |    4.96 |    0.00 |   10.00
landing_margin |    4.59 |   41.16 |   -0.08 |  590.52
tracking_rewards |  -64.26 |   15.82 | -129.26 |  -37.99
steps    |     370 |  

glideslope |    2.94 |   13.04 |    0.01 |  211.87
norm_af  |    1.65 |    0.90 |    0.05 |    3.27
norm_wf  |    0.03 |    0.01 |    0.00 |    0.06
rh_penalty |    0.00 |    0.00 |    0.00 |    0.00
att_rewards |    0.00 |    0.00 |    0.00 |    0.00
att_penalty |    0.00 |    0.00 |    0.00 |    0.00
attitude |    0.01   -0.05    0.10 |    1.23    0.67    1.80 |   -3.14   -1.56   -3.14 |    3.14    1.57    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.09   -0.05   -0.05 |    0.06    0.08    0.08
a_f      |   -0.04    0.23 |    0.65    1.75 |   -1.52   -3.14 |    1.52    3.14
w_f      |    0.00    0.00    0.00 |    0.01    0.02    0.02 |   -0.04   -0.05   -0.05 |    0.03    0.05    0.05
w_rewards |   -0.61 |    0.40 |   -1.80 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |   -1.61 |    8.83 |  -50.00 |    0.00
theta_cv |    0.45 |    0.28 |    0.00 |    2.97
seeker_angles |   -0.03   -0.01 |    0.15    0.18 |   -1.00   -0.98 |    1.

w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.09   -0.05   -0.05 |    0.07    0.09    0.08
a_f      |    0.03    0.09 |    0.66    1.95 |   -1.45   -3.14 |    1.34    3.13
w_f      |    0.00   -0.00   -0.00 |    0.01    0.02    0.02 |   -0.03   -0.04   -0.05 |    0.04    0.05    0.05
w_rewards |   -0.61 |    0.43 |   -2.66 |   -0.01
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |   -1.61 |    8.83 |  -50.00 |    0.00
theta_cv |    0.47 |    0.28 |    0.00 |    2.72
seeker_angles |   -0.02   -0.02 |    0.16    0.17 |   -1.00   -0.99 |    1.00    1.00
cs_angles | -0.0214 -0.0206 |  0.1637  0.1696 | -0.9994 -0.9929 |  0.9972  0.9978
optical_flow |  0.0004  0.0004 |  0.0257  0.0261 | -0.9906 -1.0816 |  1.2210  0.9406
v_err    | -0.0128 |  0.0675 | -0.5103 |  0.3633
landing_rewards |    5.35 |    4.99 |    0.00 |   10.00
landing_margin |    3.54 |   54.94 |   -0.09 |  968.39
tracking_rewards |  -59.21 |   14.17 | -115.67 |  -33.67
steps    |     373 |  

w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.08   -0.05   -0.05 |    0.05    0.08    0.08
a_f      |    0.05   -0.04 |    0.65    1.87 |   -1.53   -3.12 |    1.52    3.13
w_f      |    0.00    0.00    0.00 |    0.01    0.02    0.02 |   -0.03   -0.04   -0.04 |    0.04    0.04    0.05
w_rewards |   -0.60 |    0.45 |   -2.00 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |   -0.65 |    5.64 |  -50.00 |    0.00
theta_cv |    0.45 |    0.28 |    0.00 |    3.05
seeker_angles |   -0.01   -0.01 |    0.15    0.16 |   -1.00   -1.00 |    1.00    1.00
cs_angles | -0.0099 -0.0112 |  0.1509  0.1593 | -0.9954 -0.9982 |  0.9971  0.9999
optical_flow |  0.0004  0.0002 |  0.0267  0.0273 | -1.0547 -1.1336 |  0.9533  1.0329
v_err    | -0.0113 |  0.0652 | -0.4999 |  0.4342
landing_rewards |    5.94 |    4.91 |    0.00 |   10.00
landing_margin |    1.39 |   22.10 |   -0.08 |  389.35
tracking_rewards |  -54.85 |   12.89 | -101.37 |  -32.04
steps    |     372 |  

norm_thrust |    1.43 |    0.68 |    0.00 |    3.46
fuel     |    3.65 |    0.25 |    3.07 |    4.37
rewards  |  -59.15 |   18.43 | -146.56 |  -30.00
fuel_rewards |  -10.45 |    0.71 |  -12.52 |   -8.77
glideslope_rewards |    0.00 |    0.00 |    0.00 |    0.00
glideslope_penalty |    0.00 |    0.00 |    0.00 |    0.00
glideslope |    2.87 |   12.81 |    0.01 |  166.02
norm_af  |    1.71 |    0.88 |    0.04 |    3.27
norm_wf  |    0.02 |    0.01 |    0.00 |    0.05
rh_penalty |    0.00 |    0.00 |    0.00 |    0.00
att_rewards |    0.00 |    0.00 |    0.00 |    0.00
att_penalty |    0.00 |    0.00 |    0.00 |    0.00
attitude |    0.02   -0.03    0.11 |    1.18    0.66    1.81 |   -3.14   -1.56   -3.14 |    3.14    1.56    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.09   -0.05   -0.06 |    0.05    0.08    0.08
a_f      |   -0.01   -0.11 |    0.67    1.80 |   -1.44   -3.13 |    1.51    3.10
w_f      |    0.00    0.00    0.00 |    0.01    0.02    0.02 |   -0.

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.1103   0.7244   3.3076   8.6145   4.1750   3.4057
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0047   0.0025   0.0107   6.6368   2.2852   2.4929
Update Cnt = 430    ET =    924.8   Stats:  Mean, Std, Min, Max
r_f      |  -10.09    2.81   20.34 |  188.16  160.59  203.95 | -405.61 -391.90 -394.14 |  382.80  391.81  389.05
v_f      |    0.01    0.00   -0.01 |    0.06    0.06    0.06 |   -0.16   -0.15   -0.17 |    0.38    0.15    0.15
r_i      |  -39.85   -5.95   67.87 |  665.57  629.97  791.27 |-1300.23-1294.06-1369.81 | 1315.75 1336.45 1337.88
v_i      |    0.00   -0.00   -0.00 |    0.04    0.04    0.05 |   -0.10   -0.09   -0.10 |    0.09    0.09    0.10
norm_rf  |    0.71 |    1.38 |    0.09 |   20.37
norm_vf  |    0.10 |    0.04 |    0.02 |    0.41
gs_f     |    1.30 |    1.72 |    0.01 |   12.28
thrust   |   -0.00    0.00   -0.00 |    0.88    0.91    0.89 |   -3.46   -3.46   -3.45 |    3.46    3.46    3.46
norm_thrust |    1

ADV1:  -0.001468020623637234 0.018620932753199988 0.1084344989061356 -0.10599499739841439
ADV2:  0.0002314145720231024 0.9340480111657108 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.8533   0.4117   2.2688   8.6145   4.1750   3.4057
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0022   0.0011   0.0050   6.6368   2.2852   2.4929
***** Episode 13655, Mean R = -51.6  Std R = 13.6  Min R = -98.9
PolicyLoss: 0.000565
Policy_Beta: 0.0667
Policy_Entropy: 0.0231
Policy_KL: 0.00096
Policy_SD: 0.816
Policy_lr_mult: 0.667
Steps: 1.17e+04
TotalSteps: 4.44e+06
VF_0_ExplainedVarNew: 0.93
VF_0_ExplainedVarOld: 0.925
VF_0_Loss : 0.00998


ADV1:  0.0025230615670917417 0.024269806374077524 0.28034090650011984 -0.17455400957186867
ADV2:  -0.0021080790746066664 0.8748589988663935 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.7369   0.3559   2.1795   8.6145   4.1750   3.4057
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0042   0.0023   0.0089   6.6368   2.2852 

***** Episode 13903, Mean R = -46.1  Std R = 16.3  Min R = -117.6
PolicyLoss: -0.0344
Policy_Beta: 0.0667
Policy_Entropy: 0.0252
Policy_KL: 0.000692
Policy_SD: 0.804
Policy_lr_mult: 0.667
Steps: 1.15e+04
TotalSteps: 4.53e+06
VF_0_ExplainedVarNew: 0.945
VF_0_ExplainedVarOld: 0.901
VF_0_Loss : 0.0133


ADV1:  -0.0061379167784832355 0.01798722590985759 0.10607972390368318 -0.14950172596758698
ADV2:  0.02884745937529142 0.9301826922183167 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.8051   0.4230   2.0214   8.6145   4.1750   3.4057
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0094   0.0058   0.0206   6.6368   2.2852   2.4929
***** Episode 13934, Mean R = -45.6  Std R = 7.8  Min R = -59.8
PolicyLoss: -0.00774
Policy_Beta: 0.0667
Policy_Entropy: 0.0247
Policy_KL: 0.0008
Policy_SD: 0.803
Policy_lr_mult: 0.667
Steps: 1.17e+04
TotalSteps: 4.54e+06
VF_0_ExplainedVarNew: 0.922
VF_0_ExplainedVarOld: 0.92
VF_0_Loss : 0.0126


ADV1:  -0.00021816901310793492 0.020576011317448

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.6620   0.2775   1.5781   8.6145   4.1750   3.4057
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0058   0.0033   0.0130   6.6368   2.2852   2.4929
***** Episode 14182, Mean R = -46.6  Std R = 13.1  Min R = -75.0
PolicyLoss: -0.0181
Policy_Beta: 0.0667
Policy_Entropy: 0.0287
Policy_KL: 0.000798
Policy_SD: 0.794
Policy_lr_mult: 0.667
Steps: 1.16e+04
TotalSteps: 4.64e+06
VF_0_ExplainedVarNew: 0.912
VF_0_ExplainedVarOld: 0.902
VF_0_Loss : 0.0132


ADV1:  -0.0007875083573061032 0.019198804136207878 0.12362587591012322 -0.1792550002696341
ADV2:  0.013004293705040651 0.9015476722654583 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.9081   1.8425   5.9181   8.6145   4.1750   3.4057
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0028   0.0016   0.0065   6.6368   2.2852   2.4929
***** Episode 14213, Mean R = -44.6  Std R = 9.7  Min R = -68.7
PolicyLoss: -0.014
Policy_Beta: 0.0667
Policy_Entropy: 0.0289
Policy_KL: 0.0

ADV1:  0.001565183087488199 0.017984652402947582 0.09139072283095512 -0.12290854086408196
ADV2:  -0.004759365304157757 0.9445257156639734 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.7492   0.3053   1.3568   8.6145   4.1750   3.4057
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0025   0.0014   0.0054   6.6368   2.2852   2.4929
***** Episode 14461, Mean R = -43.2  Std R = 8.8  Min R = -57.3
PolicyLoss: -0.00399
Policy_Beta: 0.0667
Policy_Entropy: 0.0304
Policy_KL: 0.00078
Policy_SD: 0.778
Policy_lr_mult: 0.667
Steps: 1.17e+04
TotalSteps: 4.74e+06
VF_0_ExplainedVarNew: 0.941
VF_0_ExplainedVarOld: 0.936
VF_0_Loss : 0.00868


ADV1:  -0.0002092014020355473 0.017829053702874794 0.09189868714395516 -0.13353260319925697
ADV2:  0.0036409753817065607 0.9339383596813655 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.7741   0.4099   1.9327   8.6145   4.1750   3.4057
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0010   0.0005   0.0022   6.6368   2.2852 

***** Episode 14709, Mean R = -40.4  Std R = 10.1  Min R = -68.1
PolicyLoss: -0.00519
Policy_Beta: 0.0667
Policy_Entropy: 0.0356
Policy_KL: 0.000941
Policy_SD: 0.756
Policy_lr_mult: 0.667
Steps: 1.16e+04
TotalSteps: 4.83e+06
VF_0_ExplainedVarNew: 0.949
VF_0_ExplainedVarOld: 0.947
VF_0_Loss : 0.011


ADV1:  -0.0016528136186239727 0.019346498952614668 0.1490621523328876 -0.09381238507696554
ADV2:  0.003235652420473692 0.9333750832342604 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.1730   0.6624   3.4836   8.6145   4.1750   3.4057
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0026   0.0014   0.0055   6.6368   2.2852   2.4929
***** Episode 14740, Mean R = -43.4  Std R = 11.9  Min R = -67.3
PolicyLoss: -0.000966
Policy_Beta: 0.0667
Policy_Entropy: 0.0362
Policy_KL: 0.000723
Policy_SD: 0.755
Policy_lr_mult: 0.667
Steps: 1.17e+04
TotalSteps: 4.85e+06
VF_0_ExplainedVarNew: 0.926
VF_0_ExplainedVarOld: 0.922
VF_0_Loss : 0.00875


ADV1:  0.00026904530837428914 0.0191263952

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.0502   0.6385   2.6911   8.6702   4.1750   3.4057
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0076   0.0053   0.0164   6.6368   2.2852   2.4929
***** Episode 14988, Mean R = -41.7  Std R = 9.2  Min R = -65.2
PolicyLoss: -0.0118
Policy_Beta: 0.0667
Policy_Entropy: 0.0405
Policy_KL: 0.000771
Policy_SD: 0.728
Policy_lr_mult: 0.667
Steps: 1.17e+04
TotalSteps: 4.94e+06
VF_0_ExplainedVarNew: 0.919
VF_0_ExplainedVarOld: 0.91
VF_0_Loss : 0.00915


ADV1:  0.003543069354833385 0.020634112544059394 0.1967234122851562 -0.15484278122139247
ADV2:  -0.007769211391690451 0.9306141257751457 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.8368   0.2885   1.4020   8.6702   4.1750   3.4057
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0045   0.0028   0.0108   6.6368   2.2852   2.4929
***** Episode 15019, Mean R = -47.2  Std R = 13.3  Min R = -88.6
PolicyLoss: -0.00585
Policy_Beta: 0.0667
Policy_Entropy: 0.0402
Policy_KL: 0.

ADV1:  0.0006657629820784499 0.019351779656500014 0.11800085812807087 -0.12529483880036435
ADV2:  -0.001031240764289286 0.9259061863176712 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.8689   0.4246   2.2221  11.3361   4.9073   3.5031
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0018   0.0009   0.0040   6.6368   2.2852   2.4929
***** Episode 15267, Mean R = -45.4  Std R = 11.0  Min R = -64.3
PolicyLoss: -0.0057
Policy_Beta: 0.0667
Policy_Entropy: 0.0425
Policy_KL: 0.000744
Policy_SD: 0.744
Policy_lr_mult: 0.667
Steps: 1.18e+04
TotalSteps: 5.04e+06
VF_0_ExplainedVarNew: 0.932
VF_0_ExplainedVarOld: 0.929
VF_0_Loss : 0.0119


ADV1:  -0.0003206720709386994 0.017497112692161573 0.10753419733993486 -0.1225625960452632
ADV2:  0.004284233789269802 0.9414952921217028 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   3.9501   3.0909   8.6396  11.3361   4.9073   3.5031
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0005   0.0002   0.0009   6.6368   2.2852  

seeker_angles |    0.00   -0.00 |    0.12    0.11 |   -1.00   -1.00 |    1.00    1.00
cs_angles |  0.0012 -0.0007 |  0.1196  0.1137 | -0.9967 -0.9986 |  0.9993  0.9967
optical_flow |  0.0001  0.0001 |  0.0272  0.0267 | -0.9215 -1.3756 |  1.1972  0.9063
v_err    | -0.0097 |  0.0600 | -0.4998 |  0.1835
landing_rewards |    6.52 |    4.76 |    0.00 |   10.00
landing_margin |   -0.01 |    0.03 |   -0.08 |    0.11
tracking_rewards |  -39.42 |    9.74 |  -86.59 |  -23.54
steps    |     377 |      20 |     334 |     421
***** Episode 15546, Mean R = -42.4  Std R = 14.0  Min R = -77.3
PolicyLoss: -0.00455
Policy_Beta: 0.1
Policy_Entropy: 0.048
Policy_KL: 0.00131
Policy_SD: 0.718
Policy_lr_mult: 0.667
Steps: 1.16e+04
TotalSteps: 5.15e+06
VF_0_ExplainedVarNew: 0.928
VF_0_ExplainedVarOld: 0.919
VF_0_Loss : 0.00913


ADV1:  0.000814234961161847 0.017060669938624307 0.11622769777914807 -0.1125836409147841
ADV2:  0.0004453485133481128 0.9150665082091594 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max

w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.08   -0.05   -0.05 |    0.06    0.08    0.08
a_f      |   -0.08    0.05 |    0.67    1.84 |   -1.45   -3.11 |    1.48    3.14
w_f      |    0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.05   -0.03 |    0.04    0.04    0.03
w_rewards |   -0.62 |    0.40 |   -2.02 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.38 |    0.29 |    0.00 |    2.80
seeker_angles |   -0.00   -0.00 |    0.11    0.11 |   -0.99   -1.00 |    1.00    1.00
cs_angles | -0.0029 -0.0020 |  0.1101  0.1070 | -0.9932 -0.9960 |  0.9989  0.9955
optical_flow |  0.0003  0.0001 |  0.0282  0.0260 | -1.3002 -0.9319 |  1.1442  1.0522
v_err    | -0.0090 |  0.0597 | -0.4761 |  0.1610
landing_rewards |    6.39 |    4.80 |    0.00 |   10.00
landing_margin |   -0.01 |    0.03 |   -0.08 |    0.08
tracking_rewards |  -36.97 |    7.59 |  -66.98 |  -23.96
steps    |     375 |  

attitude |    0.08   -0.05    0.01 |    1.20    0.68    1.86 |   -3.14   -1.57   -3.14 |    3.14    1.57    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.10   -0.05   -0.05 |    0.07    0.08    0.09
a_f      |   -0.04    0.06 |    0.67    1.85 |   -1.50   -3.14 |    1.50    3.14
w_f      |    0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.03   -0.04 |    0.04    0.04    0.03
w_rewards |   -0.66 |    0.42 |   -2.33 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.38 |    0.30 |    0.00 |    2.50
seeker_angles |    0.01    0.00 |    0.11    0.11 |   -1.00   -1.00 |    1.00    0.97
cs_angles |  0.0063  0.0049 |  0.1114  0.1123 | -0.9988 -0.9958 |  0.9978  0.9749
optical_flow |  0.0003 -0.0001 |  0.0275  0.0268 | -1.1622 -1.3567 |  0.9928  1.4253
v_err    | -0.0098 |  0.0603 | -0.4893 |  0.1858
landing_rewards |    6.16 |    4.86 |    0.00 |   10.00
landing_margin |   -0

w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.09   -0.05   -0.05 |    0.08    0.09    0.09
a_f      |   -0.05    0.08 |    0.63    1.85 |   -1.46   -3.12 |    1.41    3.13
w_f      |    0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.04   -0.03 |    0.04    0.04    0.03
w_rewards |   -0.67 |    0.45 |   -2.17 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.38 |    0.30 |    0.00 |    2.72
seeker_angles |    0.01    0.00 |    0.11    0.11 |   -0.99   -1.00 |    1.00    0.99
cs_angles |  0.0077  0.0025 |  0.1101  0.1081 | -0.9918 -0.9988 |  1.0000  0.9911
optical_flow |  0.0002  0.0001 |  0.0284  0.0262 | -1.2666 -0.8738 |  1.2284  1.3102
v_err    | -0.0096 |  0.0599 | -0.4997 |  0.1663
landing_rewards |    6.97 |    4.60 |    0.00 |   10.00
landing_margin |   -0.01 |    0.03 |   -0.08 |    0.09
tracking_rewards |  -36.48 |    8.15 |  -87.15 |  -22.81
steps    |     374 |  

norm_thrust |    1.12 |    0.72 |    0.00 |    3.46
fuel     |    2.11 |    0.25 |    1.47 |    3.07
rewards  |  -35.45 |   10.04 |  -72.53 |  -18.37
fuel_rewards |   -6.03 |    0.72 |   -8.80 |   -4.21
glideslope_rewards |    0.00 |    0.00 |    0.00 |    0.00
glideslope_penalty |    0.00 |    0.00 |    0.00 |    0.00
glideslope |    2.78 |   12.45 |    0.01 |  249.70
norm_af  |    1.73 |    0.89 |    0.05 |    3.27
norm_wf  |    0.02 |    0.01 |    0.01 |    0.05
rh_penalty |    0.00 |    0.00 |    0.00 |    0.00
att_rewards |    0.00 |    0.00 |    0.00 |    0.00
att_penalty |    0.00 |    0.00 |    0.00 |    0.00
attitude |   -0.05   -0.00   -0.13 |    1.27    0.69    1.86 |   -3.14   -1.56   -3.14 |    3.14    1.56    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.08   -0.05   -0.05 |    0.07    0.08    0.09
a_f      |    0.00   -0.20 |    0.68    1.81 |   -1.51   -3.14 |    1.55    3.10
w_f      |    0.00    0.00    0.00 |    0.01    0.02    0.01 |   -0.

ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0016   0.0009   0.0037   6.6368   2.2852   2.4929
Update Cnt = 550    ET =    907.4   Stats:  Mean, Std, Min, Max
r_f      |   -1.26  -23.74    1.16 |  189.36  178.71  198.62 | -382.56 -606.32 -385.11 |  388.24  371.44  387.31
v_f      |    0.00    0.01   -0.00 |    0.05    0.05    0.06 |   -0.15   -0.13   -0.14 |    0.33    0.36    0.16
r_i      |  -33.33  -69.63    3.74 |  693.68  659.57  760.92 |-1321.17-1231.13-1327.30 | 1364.90 1265.28 1279.16
v_i      |    0.00    0.00   -0.00 |    0.04    0.04    0.05 |   -0.10   -0.08   -0.10 |    0.10    0.10    0.10
norm_rf  |    1.65 |   18.89 |    0.12 |  333.76
norm_vf  |    0.09 |    0.04 |    0.03 |    0.51
gs_f     |    1.16 |    1.42 |    0.01 |   10.72
thrust   |   -0.00   -0.01   -0.00 |    0.77    0.78    0.77 |   -3.46   -3.39   -3.44 |    3.42    3.44    3.46
norm_thrust |    1.12 |    0.73 |    0.00 |    3.46
fuel     |    2.08 |    0.24 |    1.57 |    3.04
rewards  |  -36.08 |

ADV1:  -0.00028091542852721037 0.014380928464259922 0.08393158627994138 -0.11256205071287997
ADV2:  0.006601247036396959 0.9276433117456166 3.0 -3.0
 *** BROKE ***   7 0.004891369491815567
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :  11.2305   6.6061  17.7841  17.7841  11.2305   6.6061
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0009   0.0004   0.0018   6.6368   2.2852   2.4929
***** Episode 17375, Mean R = -33.6  Std R = 8.6  Min R = -52.7
PolicyLoss: 0.011
Policy_Beta: 0.0198
Policy_Entropy: 0.0765
Policy_KL: 0.00489
Policy_SD: 0.629
Policy_lr_mult: 0.444
Steps: 1.18e+04
TotalSteps: 5.84e+06
VF_0_ExplainedVarNew: 0.956
VF_0_ExplainedVarOld: 0.954
VF_0_Loss : 0.0108


ADV1:  0.0024622953260523034 0.01698783196644253 0.13571685827566132 -0.09554367038104694
ADV2:  -0.00868965629648607 0.8906127348216483 3.0 -3.0
 *** BROKE ***   11 0.004303773399442434
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :  12.6542   4.1832  17.0037  17.7841  12.6542   6.6061
ValFun  Gradients:

ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0104   0.0036   0.0184   6.6368   2.2852   2.4929
***** Episode 17623, Mean R = -31.8  Std R = 7.6  Min R = -51.3
PolicyLoss: -0.00279
Policy_Beta: 0.0759
Policy_Entropy: 0.0745
Policy_KL: 0.00058
Policy_SD: 0.64
Policy_lr_mult: 0.198
Steps: 1.15e+04
TotalSteps: 5.93e+06
VF_0_ExplainedVarNew: 0.965
VF_0_ExplainedVarOld: 0.964
VF_0_Loss : 0.00905


ADV1:  -0.001456944414993555 0.015149213670063019 0.07961230627544871 -0.1662448102528512
ADV2:  0.013080680439212745 0.9085934307023233 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.9291   0.4936   2.4707  17.7841  13.7419   6.6061
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0019   0.0010   0.0043   6.6368   2.2852   2.4929
***** Episode 17654, Mean R = -33.4  Std R = 8.9  Min R = -53.9
PolicyLoss: -0.0075
Policy_Beta: 0.0759
Policy_Entropy: 0.0737
Policy_KL: 0.000643
Policy_SD: 0.651
Policy_lr_mult: 0.198
Steps: 1.15e+04
TotalSteps: 5.94e+06
VF_0_ExplainedVarNew: 

ADV1:  -0.004858360201085977 0.0332921514484575 0.3030854462449864 -0.27751105764712514
ADV2:  0.008115618437605613 0.8521353714241787 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.7741   0.3215   1.6392  17.7841  13.7419   6.6061
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0061   0.0039   0.0155   6.6368   2.2852   2.4929
***** Episode 17902, Mean R = -37.0  Std R = 14.1  Min R = -72.8
PolicyLoss: -0.00251
Policy_Beta: 0.114
Policy_Entropy: 0.0754
Policy_KL: 0.0014
Policy_SD: 0.65
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 6.03e+06
VF_0_ExplainedVarNew: 0.912
VF_0_ExplainedVarOld: 0.825
VF_0_Loss : 0.0322


ADV1:  0.0011425758166637013 0.02194422347256933 0.1860113435563021 -0.16830584294192177
ADV2:  0.004122039346091396 0.8836170895874466 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.9054   0.4693   2.2544  17.7841  13.7419   6.6061
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0037   0.0019   0.0071   6.6368   2.2852   2.4929
*

ADV1:  -0.0019176316595021213 0.016278708320795136 0.11003423828379828 -0.12352608175539435
ADV2:  0.013122473428370836 0.9349509409094094 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.5665   0.2430   1.2479  17.7841  13.7419   6.6061
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0039   0.0016   0.0064   6.6368   2.2852   2.4929
***** Episode 18181, Mean R = -32.4  Std R = 9.2  Min R = -61.7
PolicyLoss: -0.00747
Policy_Beta: 0.114
Policy_Entropy: 0.0765
Policy_KL: 0.0011
Policy_SD: 0.631
Policy_lr_mult: 0.198
Steps: 1.18e+04
TotalSteps: 6.14e+06
VF_0_ExplainedVarNew: 0.939
VF_0_ExplainedVarOld: 0.935
VF_0_Loss : 0.0309


ADV1:  0.0027160422025516123 0.015003906148511867 0.11596024227502144 -0.0894290345712022
ADV2:  -0.006922210506452968 0.9160018154657403 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.9854   0.5110   2.3491  17.7841  13.7419   6.6061
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0058   0.0018   0.0095   6.6368   2.2852   2.

***** Episode 18429, Mean R = -34.1  Std R = 9.0  Min R = -56.9
PolicyLoss: -0.0111
Policy_Beta: 0.0759
Policy_Entropy: 0.0762
Policy_KL: 0.000618
Policy_SD: 0.645
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 6.23e+06
VF_0_ExplainedVarNew: 0.953
VF_0_ExplainedVarOld: 0.95
VF_0_Loss : 0.0284


ADV1:  -0.0007604254849132105 0.01646642902219789 0.09347613667448365 -0.13285332858358712
ADV2:  0.011282207622420815 0.9123684852102195 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.6931   0.3569   1.6839  17.7841  13.7419   6.6061
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0013   0.0006   0.0025   6.6368   2.2852   2.4929
***** Episode 18460, Mean R = -35.6  Std R = 10.3  Min R = -69.1
PolicyLoss: -0.0105
Policy_Beta: 0.0759
Policy_Entropy: 0.0771
Policy_KL: 0.00078
Policy_SD: 0.653
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 6.24e+06
VF_0_ExplainedVarNew: 0.953
VF_0_ExplainedVarOld: 0.949
VF_0_Loss : 0.0345


ADV1:  0.0007010927875920978 0.01629054055114537

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.8961   0.3638   1.9063  17.7841  13.7419   6.6061
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0038   0.0018   0.0064   6.6368   2.2852   2.4929
***** Episode 18708, Mean R = -32.7  Std R = 9.9  Min R = -53.5
PolicyLoss: -0.0115
Policy_Beta: 0.114
Policy_Entropy: 0.0772
Policy_KL: 0.00151
Policy_SD: 0.646
Policy_lr_mult: 0.198
Steps: 1.15e+04
TotalSteps: 6.33e+06
VF_0_ExplainedVarNew: 0.96
VF_0_ExplainedVarOld: 0.956
VF_0_Loss : 0.0312


ADV1:  -0.0007931759014474788 0.01753565433612148 0.12113214691040014 -0.22855721945719354
ADV2:  0.012894497997198938 0.8304369150191533 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.0147   0.4440   2.3713  17.7841  13.7419   6.6061
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0013   0.0007   0.0029   6.6368   2.2852   2.4929
***** Episode 18739, Mean R = -32.7  Std R = 7.8  Min R = -54.1
PolicyLoss: -0.0132
Policy_Beta: 0.114
Policy_Entropy: 0.0775
Policy_KL: 0.00155

ADV1:  0.0038258700807374713 0.015379288725860814 0.07018994599580769 -0.09029191567357164
ADV2:  -0.012418916674044083 0.936825573362902 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.0534   0.6086   3.1131  17.7841  13.7419   6.6061
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0052   0.0031   0.0120   6.6368   2.2852   2.4929
***** Episode 18987, Mean R = -31.7  Std R = 7.8  Min R = -48.0
PolicyLoss: -0.00935
Policy_Beta: 0.114
Policy_Entropy: 0.0792
Policy_KL: 0.00118
Policy_SD: 0.629
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 6.44e+06
VF_0_ExplainedVarNew: 0.947
VF_0_ExplainedVarOld: 0.943
VF_0_Loss : 0.0267


ADV1:  -0.00036157722848583477 0.01700125170319171 0.19065167069435124 -0.12084701141708587
ADV2:  0.004091736376220742 0.9201624299856064 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.3903   0.8071   3.6040  17.7841  13.7419   6.6061
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0019   0.0010   0.0043   6.6368   2.2852   2

cs_angles |  0.0004  0.0037 |  0.1090  0.1060 | -0.9978 -0.9909 |  0.9936  0.9991
optical_flow | -0.0001  0.0003 |  0.0285  0.0260 | -1.4908 -1.4281 |  0.9997  1.1740
v_err    | -0.0092 |  0.0591 | -0.4820 |  0.1594
landing_rewards |    6.29 |    4.83 |    0.00 |   10.00
landing_margin |    2.73 |   48.10 |   -0.08 |  848.27
tracking_rewards |  -34.55 |    8.95 |  -92.29 |   -7.30
steps    |     371 |      29 |      10 |     422
***** Episode 19266, Mean R = -38.1  Std R = 16.1  Min R = -92.9
PolicyLoss: 0.00689
Policy_Beta: 0.0759
Policy_Entropy: 0.0814
Policy_KL: 0.000773
Policy_SD: 0.644
Policy_lr_mult: 0.198
Steps: 1.15e+04
TotalSteps: 6.54e+06
VF_0_ExplainedVarNew: 0.948
VF_0_ExplainedVarOld: 0.936
VF_0_Loss : 0.0262


ADV1:  0.0010391807398266058 0.02164382498019698 0.3785216109135512 -0.2538558110825735
ADV2:  0.0012359641197363092 0.8294731770469773 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.9274   0.5713   2.5374  17.7841  13.7419   6.6061
ValFun  Gradients:

w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.08   -0.05   -0.05 |    0.08    0.08    0.08
a_f      |    0.06   -0.27 |    0.67    1.82 |   -1.39   -3.14 |    1.53    3.13
w_f      |    0.00   -0.00   -0.00 |    0.01    0.01    0.01 |   -0.03   -0.04   -0.03 |    0.04    0.04    0.03
w_rewards |   -0.62 |    0.38 |   -2.22 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.36 |    0.29 |    0.00 |    2.63
seeker_angles |   -0.00    0.00 |    0.11    0.10 |   -1.00   -1.00 |    1.00    1.00
cs_angles | -0.0019  0.0003 |  0.1075  0.1011 | -0.9968 -0.9969 |  0.9983  0.9990
optical_flow | -0.0000  0.0002 |  0.0267  0.0260 | -1.0212 -1.0742 |  1.2667  0.9188
v_err    | -0.0090 |  0.0594 | -0.4532 |  0.1536
landing_rewards |    6.77 |    4.67 |    0.00 |   10.00
landing_margin |   -0.01 |    0.03 |   -0.07 |    0.11
tracking_rewards |  -34.40 |    8.05 |  -96.71 |  -21.18
steps    |     374 |  

attitude |    0.02    0.04   -0.12 |    1.20    0.67    1.83 |   -3.14   -1.56   -3.14 |    3.14    1.57    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.11   -0.05   -0.05 |    0.08    0.08    0.08
a_f      |    0.02   -0.04 |    0.69    1.82 |   -1.52   -3.14 |    1.41    3.13
w_f      |    0.00   -0.00   -0.00 |    0.02    0.02    0.01 |   -0.11   -0.04   -0.03 |    0.04    0.05    0.04
w_rewards |   -0.62 |    0.41 |   -2.09 |    0.00
w_penalty |   -0.32 |    5.67 | -100.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.38 |    0.30 |    0.00 |    2.80
seeker_angles |    0.00    0.00 |    0.11    0.11 |   -0.99   -1.00 |    1.00    0.99
cs_angles |  0.0001  0.0048 |  0.1078  0.1100 | -0.9925 -0.9968 |  0.9983  0.9885
optical_flow |  0.0001  0.0002 |  0.0286  0.0266 | -1.1097 -1.2462 |  1.4646  1.0112
v_err    | -0.0087 |  0.0588 | -0.4982 |  0.1583
landing_rewards |    7.48 |    4.34 |    0.00 |   10.00
landing_margin |    2

attitude |    0.00    0.02    0.10 |    1.20    0.63    1.83 |   -3.14   -1.52   -3.14 |    3.14    1.56    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.10   -0.05   -0.05 |    0.07    0.09    0.08
a_f      |    0.02    0.07 |    0.64    1.85 |   -1.47   -3.13 |    1.50    3.12
w_f      |    0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.10   -0.04   -0.03 |    0.04    0.05    0.03
w_rewards |   -0.59 |    0.39 |   -2.16 |    0.00
w_penalty |   -0.32 |    5.67 | -100.00 |    0.00
fov_penalty |   -0.16 |    2.84 |  -50.00 |    0.00
theta_cv |    0.36 |    0.30 |    0.00 |    2.88
seeker_angles |   -0.00    0.01 |    0.11    0.10 |   -0.99   -1.00 |    1.00    0.99
cs_angles | -0.0021  0.0057 |  0.1060  0.1048 | -0.9872 -0.9978 |  0.9975  0.9913
optical_flow |  0.0001  0.0002 |  0.0290  0.0265 | -1.4398 -1.0430 |  1.3445  1.0701
v_err    | -0.0098 |  0.0596 | -0.4779 |  0.4092
landing_rewards |    7.35 |    4.41 |    0.00 |   10.00
landing_margin |    5

attitude |   -0.08    0.06   -0.08 |    1.16    0.66    1.81 |   -3.14   -1.57   -3.14 |    3.14    1.56    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.09   -0.05   -0.05 |    0.07    0.10    0.08
a_f      |    0.05   -0.08 |    0.67    1.82 |   -1.50   -3.14 |    1.46    3.13
w_f      |    0.00   -0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.05   -0.03 |    0.04    0.05    0.04
w_rewards |   -0.61 |    0.42 |   -2.63 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.36 |    0.30 |    0.00 |    2.59
seeker_angles |    0.01    0.00 |    0.10    0.11 |   -1.00   -0.99 |    1.00    1.00
cs_angles |  0.0053  0.0050 |  0.1035  0.1052 | -0.9960 -0.9867 |  0.9986  0.9953
optical_flow | -0.0001  0.0000 |  0.0276  0.0289 | -1.2612 -1.5158 |  1.4336  1.0451
v_err    | -0.0087 |  0.0586 | -0.4998 |  0.1716
landing_rewards |    6.81 |    4.66 |    0.00 |   10.00
landing_margin |   -0

attitude |    0.01   -0.04   -0.08 |    1.22    0.63    1.86 |   -3.14   -1.57   -3.14 |    3.14    1.53    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.10   -0.05   -0.05 |    0.07    0.09    0.08
a_f      |   -0.02   -0.19 |    0.64    1.86 |   -1.57   -3.14 |    1.42    3.14
w_f      |    0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.04   -0.04   -0.03 |    0.04    0.04    0.05
w_rewards |   -0.64 |    0.40 |   -2.21 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.36 |    0.30 |    0.00 |    2.85
seeker_angles |    0.00    0.01 |    0.11    0.10 |   -1.00   -0.98 |    1.00    1.00
cs_angles |  0.0040  0.0071 |  0.1050  0.1043 | -0.9973 -0.9811 |  0.9983  0.9977
optical_flow |  0.0001  0.0003 |  0.0285  0.0285 | -1.0709 -1.2133 |  1.2521  1.1107
v_err    | -0.0088 |  0.0588 | -0.4633 |  0.1630
landing_rewards |    6.90 |    4.62 |    0.00 |   10.00
landing_margin |   -0

w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.09   -0.05   -0.05 |    0.08    0.08    0.09
a_f      |   -0.06   -0.13 |    0.66    1.81 |   -1.51   -3.14 |    1.48    3.12
w_f      |    0.00   -0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.03   -0.03 |    0.03    0.04    0.04
w_rewards |   -0.67 |    0.41 |   -2.08 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.36 |    0.31 |    0.00 |    2.81
seeker_angles |    0.00    0.00 |    0.11    0.10 |   -1.00   -0.99 |    1.00    0.99
cs_angles |  0.0048  0.0036 |  0.1077  0.1042 | -0.9990 -0.9940 |  0.9966  0.9914
optical_flow |  0.0000  0.0002 |  0.0297  0.0274 | -1.0593 -0.9207 |  1.2769  1.4221
v_err    | -0.0087 |  0.0588 | -0.4529 |  0.1880
landing_rewards |    7.10 |    4.54 |    0.00 |   10.00
landing_margin |   -0.01 |    0.03 |   -0.08 |    0.11
tracking_rewards |  -33.62 |    7.76 |  -71.84 |  -20.58
steps    |     374 |  

w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.09   -0.05   -0.05 |    0.08    0.09    0.08
a_f      |   -0.02   -0.11 |    0.69    1.87 |   -1.54   -3.13 |    1.51    3.12
w_f      |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.03   -0.03   -0.03 |    0.03    0.04    0.03
w_rewards |   -0.68 |    0.45 |   -2.86 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.36 |    0.31 |    0.00 |    2.66
seeker_angles |    0.00    0.00 |    0.11    0.11 |   -1.00   -1.00 |    1.00    1.00
cs_angles |  0.0036  0.0044 |  0.1098  0.1065 | -0.9974 -0.9961 |  0.9991  0.9966
optical_flow |  0.0002  0.0002 |  0.0273  0.0284 | -1.1849 -1.2077 |  1.3085  1.2381
v_err    | -0.0088 |  0.0587 | -0.5000 |  0.1711
landing_rewards |    7.45 |    4.36 |    0.00 |   10.00
landing_margin |   -0.01 |    0.03 |   -0.08 |    0.09
tracking_rewards |  -33.78 |    7.82 |  -68.39 |  -20.29
steps    |     372 |  

w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.10   -0.05   -0.05 |    0.08    0.08    0.08
a_f      |    0.01    0.06 |    0.66    1.85 |   -1.48   -3.11 |    1.52    3.12
w_f      |    0.00   -0.00    0.00 |    0.01    0.01    0.01 |   -0.02   -0.04   -0.03 |    0.04    0.03    0.03
w_rewards |   -0.63 |    0.42 |   -2.72 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.36 |    0.30 |    0.00 |    2.70
seeker_angles |    0.01    0.00 |    0.11    0.10 |   -0.98   -1.00 |    1.00    0.99
cs_angles |  0.0068  0.0042 |  0.1097  0.1025 | -0.9839 -0.9996 |  0.9952  0.9852
optical_flow |  0.0002  0.0003 |  0.0291  0.0261 | -1.1059 -1.4317 |  1.2697  1.2218
v_err    | -0.0078 |  0.0583 | -0.4528 |  0.1545
landing_rewards |    7.32 |    4.43 |    0.00 |   10.00
landing_margin |   -0.01 |    0.02 |   -0.08 |    0.06
tracking_rewards |  -33.36 |    8.01 |  -76.11 |  -19.95
steps    |     370 |  

attitude |   -0.03    0.00   -0.10 |    1.25    0.65    1.93 |   -3.14   -1.56   -3.14 |    3.14    1.56    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.09   -0.05   -0.05 |    0.08    0.08    0.09
a_f      |   -0.00   -0.14 |    0.63    1.96 |   -1.55   -3.12 |    1.49    3.11
w_f      |    0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.03   -0.03 |    0.04    0.03    0.03
w_rewards |   -0.67 |    0.44 |   -2.57 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.35 |    0.30 |    0.00 |    2.88
seeker_angles |    0.00    0.01 |    0.11    0.10 |   -1.00   -0.99 |    0.99    1.00
cs_angles |  0.0026  0.0086 |  0.1089  0.1032 | -0.9967 -0.9903 |  0.9929  0.9992
optical_flow | -0.0000  0.0001 |  0.0286  0.0268 | -1.3085 -1.3923 |  1.1130  0.9650
v_err    | -0.0083 |  0.0583 | -0.5001 |  0.1924
landing_rewards |    7.35 |    4.41 |    0.00 |   10.00
landing_margin |   -0

attitude |   -0.04    0.06   -0.10 |    1.18    0.64    1.88 |   -3.14   -1.56   -3.14 |    3.14    1.56    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.10   -0.06   -0.05 |    0.08    0.08    0.08
a_f      |    0.07    0.03 |    0.64    1.90 |   -1.47   -3.14 |    1.48    3.12
w_f      |    0.00   -0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.06   -0.03 |    0.04    0.04    0.03
w_rewards |   -0.63 |    0.39 |   -2.02 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.35 |    0.30 |    0.00 |    2.54
seeker_angles |    0.00    0.00 |    0.11    0.10 |   -0.99   -0.99 |    0.99    1.00
cs_angles |  0.0047  0.0042 |  0.1063  0.1000 | -0.9947 -0.9916 |  0.9924  0.9982
optical_flow |  0.0001  0.0001 |  0.0272  0.0271 | -0.9521 -1.0851 |  1.5713  1.2298
v_err    | -0.0085 |  0.0580 | -0.4789 |  0.1438
landing_rewards |    7.84 |    4.12 |    0.00 |   10.00
landing_margin |   -0

attitude |    0.02    0.05    0.17 |    1.20    0.62    1.91 |   -3.14   -1.57   -3.14 |    3.14    1.56    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.10   -0.05   -0.05 |    0.08    0.08    0.09
a_f      |    0.05    0.17 |    0.62    1.91 |   -1.35   -3.12 |    1.44    3.11
w_f      |    0.00   -0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.04   -0.04 |    0.04    0.04    0.03
w_rewards |   -0.67 |    0.44 |   -3.30 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.35 |    0.30 |    0.00 |    2.83
seeker_angles |    0.01    0.01 |    0.10    0.10 |   -0.96   -1.00 |    0.99    0.99
cs_angles |  0.0052  0.0050 |  0.1036  0.1027 | -0.9630 -0.9964 |  0.9943  0.9912
optical_flow |  0.0000  0.0000 |  0.0294  0.0272 | -1.3124 -1.0506 |  1.3490  1.1458
v_err    | -0.0089 |  0.0581 | -0.4681 |  0.1770
landing_rewards |    7.39 |    4.39 |    0.00 |   10.00
landing_margin |   -0

w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.09   -0.05   -0.05 |    0.08    0.09    0.08
a_f      |   -0.05    0.08 |    0.63    1.84 |   -1.35   -3.12 |    1.37    3.14
w_f      |    0.00   -0.00   -0.00 |    0.01    0.01    0.01 |   -0.04   -0.04   -0.03 |    0.05    0.04    0.03
w_rewards |   -0.64 |    0.40 |   -2.36 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.35 |    0.30 |    0.00 |    2.54
seeker_angles |    0.00    0.01 |    0.10    0.10 |   -0.96   -1.00 |    0.99    1.00
cs_angles |  0.0050  0.0053 |  0.1027  0.1015 | -0.9580 -0.9987 |  0.9946  0.9974
optical_flow | -0.0000  0.0001 |  0.0275  0.0274 | -1.4877 -1.2706 |  1.2520  1.4422
v_err    | -0.0088 |  0.0582 | -0.4578 |  0.1563
landing_rewards |    7.35 |    4.41 |    0.00 |   10.00
landing_margin |   -0.01 |    0.02 |   -0.07 |    0.09
tracking_rewards |  -32.38 |    6.82 |  -56.17 |  -20.40
steps    |     375 |  

attitude |   -0.07   -0.07   -0.20 |    1.26    0.70    1.86 |   -3.14   -1.57   -3.14 |    3.14    1.56    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.10   -0.05   -0.05 |    0.07    0.08    0.08
a_f      |   -0.07   -0.20 |    0.71    1.87 |   -1.46   -3.12 |    1.51    3.13
w_f      |    0.00   -0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.03   -0.03 |    0.04    0.04    0.03
w_rewards |   -0.64 |    0.43 |   -3.10 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.35 |    0.30 |    0.00 |    2.75
seeker_angles |    0.01    0.00 |    0.10    0.10 |   -0.99   -1.00 |    0.99    1.00
cs_angles |  0.0066  0.0039 |  0.1030  0.1018 | -0.9924 -0.9977 |  0.9930  0.9987
optical_flow | -0.0001  0.0003 |  0.0287  0.0292 | -1.8543 -1.4655 |  1.2338  1.4251
v_err    | -0.0086 |  0.0586 | -0.4527 |  0.1552
landing_rewards |    7.16 |    4.51 |    0.00 |   10.00
landing_margin |   -0

attitude |   -0.15    0.02    0.02 |    1.27    0.65    1.93 |   -3.14   -1.56   -3.14 |    3.14    1.56    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.09   -0.05   -0.05 |    0.08    0.08    0.08
a_f      |    0.04    0.07 |    0.66    1.94 |   -1.42   -3.13 |    1.48    3.14
w_f      |    0.00   -0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.04   -0.04 |    0.04    0.03    0.03
w_rewards |   -0.65 |    0.37 |   -2.15 |   -0.02
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.35 |    0.30 |    0.00 |    2.57
seeker_angles |    0.01    0.01 |    0.11    0.10 |   -1.00   -1.00 |    1.00    1.00
cs_angles |  0.0051  0.0051 |  0.1051  0.0992 | -0.9963 -0.9990 |  0.9996  0.9986
optical_flow | -0.0001  0.0004 |  0.0272  0.0270 | -1.2329 -1.0733 |  1.1286  1.0153
v_err    | -0.0083 |  0.0580 | -0.4994 |  0.1495
landing_rewards |    6.90 |    4.62 |    0.00 |   10.00
landing_margin |   -0

attitude |   -0.10    0.06   -0.02 |    1.24    0.64    1.89 |   -3.14   -1.53   -3.14 |    3.14    1.57    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.10   -0.05   -0.05 |    0.09    0.08    0.08
a_f      |    0.07    0.07 |    0.61    1.88 |   -1.39   -3.14 |    1.40    3.13
w_f      |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.03   -0.04   -0.03 |    0.03    0.04    0.04
w_rewards |   -0.65 |    0.41 |   -2.23 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.34 |    0.29 |    0.00 |    2.65
seeker_angles |    0.01    0.00 |    0.10    0.10 |   -1.00   -1.00 |    0.99    1.00
cs_angles |  0.0055  0.0036 |  0.1010  0.1028 | -0.9999 -0.9987 |  0.9935  0.9972
optical_flow | -0.0000  0.0000 |  0.0276  0.0280 | -1.2032 -1.1019 |  1.1875  1.2982
v_err    | -0.0084 |  0.0581 | -0.4978 |  0.1354
landing_rewards |    7.10 |    4.54 |    0.00 |   10.00
landing_margin |   -0

attitude |    0.01   -0.03    0.04 |    1.25    0.67    1.87 |   -3.14   -1.56   -3.14 |    3.14    1.56    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.10   -0.05   -0.05 |    0.08    0.08    0.09
a_f      |   -0.01   -0.03 |    0.66    1.87 |   -1.43   -3.12 |    1.43    3.12
w_f      |    0.00   -0.00   -0.00 |    0.01    0.01    0.01 |   -0.10   -0.04   -0.03 |    0.04    0.05    0.03
w_rewards |   -0.69 |    0.47 |   -3.50 |    0.00
w_penalty |   -0.32 |    5.67 | -100.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.34 |    0.30 |    0.00 |    2.83
seeker_angles |   -0.00    0.01 |    0.10    0.10 |   -0.99   -0.99 |    1.00    0.99
cs_angles | -0.0010  0.0052 |  0.1039  0.1005 | -0.9871 -0.9941 |  0.9960  0.9896
optical_flow | -0.0002  0.0001 |  0.0284  0.0276 | -1.1478 -1.1098 |  1.7097  1.3910
v_err    | -0.0091 |  0.0582 | -0.4531 |  0.1581
landing_rewards |    7.87 |    4.09 |    0.00 |   10.00
landing_margin |    2

attitude |    0.00    0.05    0.01 |    1.11    0.66    1.82 |   -3.14   -1.57   -3.14 |    3.14    1.57    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.09   -0.05   -0.05 |    0.08    0.08    0.08
a_f      |    0.05    0.03 |    0.65    1.83 |   -1.45   -3.14 |    1.38    3.14
w_f      |    0.00   -0.00    0.00 |    0.01    0.01    0.01 |   -0.04   -0.04   -0.03 |    0.04    0.03    0.03
w_rewards |   -0.68 |    0.41 |   -2.49 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.36 |    0.30 |    0.00 |    2.59
seeker_angles |    0.00    0.01 |    0.11    0.10 |   -1.00   -0.99 |    1.00    0.99
cs_angles |  0.0046  0.0065 |  0.1051  0.0996 | -0.9982 -0.9936 |  0.9968  0.9920
optical_flow | -0.0000  0.0003 |  0.0278  0.0264 | -1.0885 -0.9001 |  1.3363  1.3470
v_err    | -0.0093 |  0.0579 | -0.4679 |  0.1661
landing_rewards |    7.65 |    4.24 |    0.00 |   10.00
landing_margin |   -0

w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.10   -0.05   -0.05 |    0.06    0.08    0.09
a_f      |   -0.08    0.10 |    0.69    1.79 |   -1.48   -3.10 |    1.47    3.14
w_f      |    0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.10   -0.04   -0.03 |    0.03    0.04    0.03
w_rewards |   -0.70 |    0.43 |   -2.06 |   -0.00
w_penalty |   -0.32 |    5.67 | -100.00 |    0.00
fov_penalty |   -0.16 |    2.84 |  -50.00 |    0.00
theta_cv |    0.35 |    0.30 |    0.00 |    2.55
seeker_angles |    0.00    0.00 |    0.10    0.11 |   -1.00   -1.00 |    0.99    0.99
cs_angles |  0.0018  0.0044 |  0.1017  0.1067 | -0.9995 -0.9997 |  0.9879  0.9886
optical_flow | -0.0002  0.0001 |  0.0290  0.0273 | -1.3174 -1.2836 |  1.0660  0.9954
v_err    | -0.0091 |  0.0583 | -0.4989 |  0.2017
landing_rewards |    7.74 |    4.18 |    0.00 |   10.00
landing_margin |    3.13 |   54.18 |   -0.08 |  955.37
tracking_rewards |  -32.32 |    8.67 | -104.97 |   -7.68
steps    |     375 |  

attitude |   -0.04    0.00    0.05 |    1.17    0.63    1.87 |   -3.14   -1.56   -3.14 |    3.14    1.55    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.10   -0.05   -0.05 |    0.07    0.08    0.08
a_f      |    0.01   -0.02 |    0.63    1.88 |   -1.48   -3.14 |    1.46    3.13
w_f      |    0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.05   -0.03 |    0.04    0.04    0.03
w_rewards |   -0.69 |    0.40 |   -2.74 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.33 |    0.29 |    0.00 |    2.47
seeker_angles |    0.00    0.00 |    0.10    0.10 |   -0.99   -1.00 |    0.99    0.99
cs_angles |  0.0011  0.0040 |  0.0969  0.1016 | -0.9946 -0.9990 |  0.9851  0.9927
optical_flow | -0.0000  0.0001 |  0.0287  0.0280 | -1.3941 -1.2022 |  1.0389  1.0535
v_err    | -0.0095 |  0.0574 | -0.4539 |  0.1646
landing_rewards |    7.74 |    4.18 |    0.00 |   10.00
landing_margin |   -0

attitude |   -0.01    0.05   -0.08 |    1.20    0.66    1.86 |   -3.14   -1.57   -3.14 |    3.14    1.57    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.10   -0.05   -0.05 |    0.07    0.08    0.08
a_f      |    0.04   -0.05 |    0.66    1.87 |   -1.42   -3.13 |    1.52    3.13
w_f      |    0.00   -0.00   -0.00 |    0.01    0.01    0.01 |   -0.04   -0.04   -0.03 |    0.03    0.04    0.03
w_rewards |   -0.67 |    0.45 |   -3.75 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.34 |    0.30 |    0.00 |    2.79
seeker_angles |    0.00    0.01 |    0.10    0.10 |   -0.99   -1.00 |    1.00    0.98
cs_angles |  0.0029  0.0052 |  0.1013  0.1003 | -0.9913 -0.9981 |  0.9998  0.9798
optical_flow | -0.0001  0.0001 |  0.0273  0.0269 | -0.8299 -1.2473 |  1.0094  1.1471
v_err    | -0.0094 |  0.0577 | -0.4926 |  0.1420
landing_rewards |    7.71 |    4.20 |    0.00 |   10.00
landing_margin |   -0

attitude |   -0.03    0.02   -0.11 |    1.33    0.68    1.96 |   -3.14   -1.56   -3.14 |    3.14    1.57    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.09   -0.05   -0.05 |    0.07    0.08    0.08
a_f      |    0.03   -0.15 |    0.69    1.93 |   -1.44   -3.14 |    1.44    3.12
w_f      |    0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.05   -0.04 |    0.04    0.03    0.02
w_rewards |   -0.62 |    0.37 |   -1.88 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.34 |    0.30 |    0.00 |    2.75
seeker_angles |    0.01    0.00 |    0.10    0.10 |   -1.00   -1.00 |    0.99    0.99
cs_angles |  0.0058  0.0027 |  0.1033  0.0988 | -0.9980 -0.9970 |  0.9941  0.9893
optical_flow | -0.0000  0.0001 |  0.0287  0.0280 | -1.4777 -1.0349 |  1.1504  1.2578
v_err    | -0.0097 |  0.0570 | -0.4534 |  0.1482
landing_rewards |    7.81 |    4.14 |    0.00 |   10.00
landing_margin |   -0

w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.09   -0.05   -0.05 |    0.09    0.08    0.08
a_f      |   -0.02    0.01 |    0.69    1.77 |   -1.45   -3.13 |    1.53    3.07
w_f      |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.03   -0.05   -0.03 |    0.04    0.04    0.03
w_rewards |   -0.61 |    0.40 |   -2.39 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.34 |    0.30 |    0.00 |    2.82
seeker_angles |    0.01    0.00 |    0.10    0.10 |   -0.97   -1.00 |    1.00    1.00
cs_angles |  0.0052  0.0019 |  0.0974  0.0993 | -0.9666 -0.9987 |  0.9993  0.9999
optical_flow | -0.0000  0.0002 |  0.0263  0.0289 | -1.2219 -1.1281 |  1.3723  1.1967
v_err    | -0.0094 |  0.0572 | -0.4999 |  0.1560
landing_rewards |    7.16 |    4.51 |    0.00 |   10.00
landing_margin |   -0.01 |    0.02 |   -0.08 |    0.05
tracking_rewards |  -30.33 |    6.51 |  -58.00 |  -18.42
steps    |     375 |  

attitude |    0.01   -0.01   -0.04 |    1.20    0.66    1.80 |   -3.14   -1.56   -3.14 |    3.14    1.57    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.09   -0.05   -0.05 |    0.07    0.08    0.08
a_f      |   -0.00   -0.10 |    0.66    1.80 |   -1.52   -3.14 |    1.54    3.13
w_f      |    0.00   -0.00   -0.00 |    0.01    0.01    0.01 |   -0.03   -0.05   -0.03 |    0.04    0.04    0.03
w_rewards |   -0.62 |    0.39 |   -2.32 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.34 |    0.30 |    0.00 |    2.52
seeker_angles |    0.00    0.00 |    0.10    0.10 |   -1.00   -0.98 |    0.97    0.99
cs_angles |  0.0018  0.0014 |  0.1014  0.0997 | -1.0000 -0.9831 |  0.9748  0.9923
optical_flow | -0.0001  0.0001 |  0.0283  0.0270 | -1.2135 -1.3800 |  1.0868  1.0873
v_err    | -0.0092 |  0.0575 | -0.5002 |  0.1692
landing_rewards |    7.39 |    4.39 |    0.00 |   10.00
landing_margin |   -0

w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.10   -0.05   -0.05 |    0.09    0.08    0.08
a_f      |   -0.06    0.10 |    0.67    1.90 |   -1.48   -3.10 |    1.43    3.11
w_f      |    0.00   -0.00   -0.00 |    0.01    0.01    0.01 |   -0.10   -0.04   -0.04 |    0.04    0.04    0.03
w_rewards |   -0.59 |    0.39 |   -2.29 |    0.00
w_penalty |   -0.32 |    5.67 | -100.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.33 |    0.30 |    0.00 |    2.65
seeker_angles |    0.00    0.00 |    0.10    0.10 |   -0.99   -0.97 |    0.99    1.00
cs_angles |  0.0033  0.0021 |  0.0999  0.0982 | -0.9945 -0.9711 |  0.9947  0.9970
optical_flow | -0.0000  0.0004 |  0.0271  0.0271 | -1.1123 -1.2987 |  1.0841  1.1776
v_err    | -0.0087 |  0.0576 | -0.4519 |  0.1364
landing_rewards |    7.68 |    4.22 |    0.00 |   10.00
landing_margin |    3.09 |   54.67 |   -0.07 |  964.17
tracking_rewards |  -30.15 |    6.52 |  -54.67 |  -10.38
steps    |     372 |  

attitude |   -0.10    0.12   -0.02 |    1.28    0.65    1.88 |   -3.14   -1.53   -3.14 |    3.14    1.57    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.10   -0.05   -0.05 |    0.07    0.09    0.08
a_f      |    0.12    0.07 |    0.65    1.86 |   -1.47   -3.13 |    1.52    3.13
w_f      |    0.00   -0.00   -0.00 |    0.01    0.01    0.01 |   -0.03   -0.04   -0.02 |    0.04    0.04    0.03
w_rewards |   -0.58 |    0.40 |   -2.21 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.33 |    0.30 |    0.00 |    2.96
seeker_angles |    0.00    0.01 |    0.10    0.09 |   -0.99   -1.00 |    1.00    1.00
cs_angles |  0.0026  0.0060 |  0.1022  0.0946 | -0.9930 -0.9982 |  0.9960  0.9964
optical_flow |  0.0000  0.0001 |  0.0271  0.0273 | -1.2138 -1.7683 |  1.2759  0.8992
v_err    | -0.0082 |  0.0578 | -0.5002 |  0.1472
landing_rewards |    7.55 |    4.30 |    0.00 |   10.00
landing_margin |   -0

w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.09   -0.05   -0.05 |    0.10    0.08    0.08
a_f      |    0.03    0.01 |    0.65    1.88 |   -1.50   -3.13 |    1.54    3.14
w_f      |    0.00   -0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.04   -0.02 |    0.04    0.04    0.04
w_rewards |   -0.59 |    0.44 |   -2.93 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.34 |    0.30 |    0.00 |    2.70
seeker_angles |    0.01    0.01 |    0.10    0.10 |   -0.99   -1.00 |    0.99    0.99
cs_angles |  0.0053  0.0053 |  0.1020  0.1000 | -0.9943 -0.9950 |  0.9865  0.9941
optical_flow |  0.0001  0.0001 |  0.0269  0.0267 | -0.9056 -1.0939 |  1.2304  1.1744
v_err    | -0.0086 |  0.0580 | -0.4522 |  0.1776
landing_rewards |    7.39 |    4.39 |    0.00 |   10.00
landing_margin |   -0.01 |    0.02 |   -0.07 |    0.13
tracking_rewards |  -31.18 |    6.51 |  -58.07 |  -19.04
steps    |     374 |  

attitude |   -0.12    0.01    0.02 |    1.20    0.65    1.88 |   -3.14   -1.57   -3.14 |    3.14    1.57    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.09   -0.05   -0.05 |    0.07    0.08    0.08
a_f      |    0.01   -0.04 |    0.64    1.87 |   -1.53   -3.14 |    1.52    3.11
w_f      |    0.00   -0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.03   -0.03 |    0.03    0.04    0.03
w_rewards |   -0.53 |    0.40 |   -2.83 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.32 |    0.29 |    0.00 |    2.77
seeker_angles |    0.01    0.00 |    0.10    0.10 |   -1.00   -0.99 |    0.99    1.00
cs_angles |  0.0072  0.0007 |  0.0974  0.0976 | -0.9989 -0.9926 |  0.9866  0.9995
optical_flow |  0.0001  0.0002 |  0.0282  0.0282 | -1.2607 -1.3008 |  1.0610  1.3321
v_err    | -0.0084 |  0.0572 | -0.4518 |  0.1402
landing_rewards |    7.65 |    4.24 |    0.00 |   10.00
landing_margin |   -0

w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.10   -0.05   -0.05 |    0.10    0.08    0.08
a_f      |    0.01    0.13 |    0.65    1.83 |   -1.30   -3.13 |    1.49    3.13
w_f      |    0.00   -0.00   -0.00 |    0.02    0.01    0.01 |   -0.03   -0.03   -0.03 |    0.10    0.04    0.04
w_rewards |   -0.54 |    0.39 |   -2.03 |    0.00
w_penalty |   -0.32 |    5.67 | -100.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.31 |    0.29 |    0.00 |    3.01
seeker_angles |    0.00    0.00 |    0.10    0.09 |   -1.00   -0.99 |    1.00    1.00
cs_angles |  0.0048  0.0010 |  0.0959  0.0944 | -0.9994 -0.9941 |  0.9989  0.9983
optical_flow | -0.0001  0.0002 |  0.0289  0.0268 | -1.3013 -1.0409 |  1.1770  1.0821
v_err    | -0.0088 |  0.0569 | -0.4998 |  0.1516
landing_rewards |    7.65 |    4.24 |    0.00 |   10.00
landing_margin |    2.71 |   47.97 |   -0.08 |  846.02
tracking_rewards |  -29.19 |    5.93 |  -50.85 |   -7.86
steps    |     373 |  

attitude |   -0.06    0.01   -0.10 |    1.17    0.67    1.76 |   -3.14   -1.56   -3.14 |    3.14    1.55    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.10   -0.05   -0.05 |    0.10    0.08    0.08
a_f      |    0.02   -0.10 |    0.67    1.75 |   -1.41   -3.11 |    1.50    3.14
w_f      |    0.00   -0.00   -0.00 |    0.01    0.01    0.01 |   -0.04   -0.03   -0.03 |    0.10    0.04    0.03
w_rewards |   -0.62 |    0.45 |   -2.65 |    0.00
w_penalty |   -0.32 |    5.67 | -100.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.33 |    0.30 |    0.00 |    2.56
seeker_angles |    0.01    0.00 |    0.10    0.10 |   -1.00   -1.00 |    0.99    1.00
cs_angles |  0.0050  0.0022 |  0.0972  0.1020 | -0.9961 -0.9997 |  0.9929  0.9974
optical_flow | -0.0002  0.0002 |  0.0278  0.0270 | -1.1231 -1.4820 |  1.2366  1.0734
v_err    | -0.0090 |  0.0573 | -0.4675 |  0.1300
landing_rewards |    7.77 |    4.16 |    0.00 |   10.00
landing_margin |    2

attitude |   -0.04   -0.05   -0.13 |    1.24    0.67    1.88 |   -3.14   -1.56   -3.14 |    3.14    1.56    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.09   -0.05   -0.05 |    0.09    0.08    0.09
a_f      |   -0.06   -0.18 |    0.66    1.88 |   -1.41   -3.13 |    1.49    3.12
w_f      |    0.00   -0.00   -0.00 |    0.01    0.01    0.01 |   -0.04   -0.03   -0.03 |    0.04    0.04    0.03
w_rewards |   -0.61 |    0.43 |   -2.50 |   -0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.33 |    0.30 |    0.00 |    2.76
seeker_angles |    0.01    0.00 |    0.10    0.09 |   -1.00   -1.00 |    0.99    1.00
cs_angles |  0.0053  0.0050 |  0.1020  0.0945 | -0.9976 -0.9991 |  0.9923  0.9973
optical_flow | -0.0000  0.0000 |  0.0278  0.0264 | -0.9730 -1.2520 |  1.3316  0.9173
v_err    | -0.0089 |  0.0574 | -0.4798 |  0.1380
landing_rewards |    8.03 |    3.98 |    0.00 |   10.00
landing_margin |   -0

attitude |    0.07   -0.02   -0.25 |    1.28    0.68    1.96 |   -3.14   -1.56   -3.14 |    3.14    1.57    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.10   -0.05   -0.05 |    0.09    0.08    0.09
a_f      |   -0.01   -0.25 |    0.68    1.96 |   -1.49   -3.14 |    1.48    3.13
w_f      |    0.00    0.00    0.00 |    0.02    0.01    0.01 |   -0.10   -0.04   -0.03 |    0.04    0.04    0.03
w_rewards |   -0.63 |    0.44 |   -2.98 |    0.00
w_penalty |   -0.65 |    8.01 | -100.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.33 |    0.30 |    0.00 |    3.09
seeker_angles |    0.00    0.00 |    0.10    0.10 |   -1.00   -0.99 |    1.00    0.99
cs_angles |  0.0043  0.0021 |  0.1000  0.1000 | -0.9978 -0.9925 |  0.9988  0.9948
optical_flow |  0.0002  0.0000 |  0.0270  0.0285 | -0.9416 -1.3556 |  1.1646  1.5128
v_err    | -0.0090 |  0.0576 | -0.4824 |  0.2182
landing_rewards |    7.48 |    4.34 |    0.00 |   10.00
landing_margin |    6

w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.09   -0.05   -0.05 |    0.09    0.08    0.09
a_f      |   -0.07    0.15 |    0.63    1.79 |   -1.53   -3.13 |    1.41    3.14
w_f      |    0.00   -0.00    0.00 |    0.01    0.01    0.01 |   -0.04   -0.03   -0.02 |    0.04    0.03    0.03
w_rewards |   -0.59 |    0.41 |   -2.98 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.32 |    0.29 |    0.00 |    2.65
seeker_angles |    0.00   -0.00 |    0.10    0.10 |   -0.99   -1.00 |    0.99    1.00
cs_angles |  0.0036 -0.0020 |  0.0956  0.0962 | -0.9861 -0.9956 |  0.9896  0.9971
optical_flow | -0.0001  0.0003 |  0.0276  0.0261 | -1.1283 -1.0516 |  1.5561  1.0397
v_err    | -0.0084 |  0.0566 | -0.4534 |  0.1552
landing_rewards |    7.65 |    4.24 |    0.00 |   10.00
landing_margin |   -0.02 |    0.02 |   -0.06 |    0.05
tracking_rewards |  -29.43 |    6.49 |  -58.90 |  -18.64
steps    |     375 |  

attitude |    0.01   -0.00    0.09 |    1.14    0.67    1.80 |   -3.14   -1.56   -3.14 |    3.14    1.57    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.09   -0.05   -0.05 |    0.09    0.08    0.08
a_f      |    0.00   -0.02 |    0.67    1.81 |   -1.46   -3.14 |    1.53    3.13
w_f      |    0.00   -0.00    0.00 |    0.02    0.01    0.01 |   -0.04   -0.03   -0.03 |    0.04    0.04    0.03
w_rewards |   -0.62 |    0.39 |   -2.15 |   -0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.32 |    0.29 |    0.00 |    2.62
seeker_angles |    0.00    0.00 |    0.10    0.09 |   -0.99   -1.00 |    1.00    0.99
cs_angles |  0.0026  0.0025 |  0.0983  0.0949 | -0.9949 -0.9958 |  0.9982  0.9867
optical_flow | -0.0001  0.0002 |  0.0282  0.0270 | -1.1946 -0.9268 |  1.2621  1.3987
v_err    | -0.0086 |  0.0565 | -0.4526 |  0.1529
landing_rewards |    7.45 |    4.36 |    0.00 |   10.00
landing_margin |   -0

attitude |   -0.03   -0.00   -0.00 |    1.14    0.65    1.75 |   -3.14   -1.57   -3.14 |    3.14    1.57    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.09   -0.05   -0.05 |    0.08    0.08    0.08
a_f      |    0.01    0.07 |    0.66    1.75 |   -1.53   -3.13 |    1.40    3.12
w_f      |    0.00    0.00    0.00 |    0.02    0.01    0.01 |   -0.04   -0.03   -0.03 |    0.05    0.04    0.03
w_rewards |   -0.57 |    0.35 |   -1.60 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.32 |    0.29 |    0.00 |    2.56
seeker_angles |    0.01    0.01 |    0.10    0.09 |   -1.00   -1.00 |    1.00    1.00
cs_angles |  0.0053  0.0051 |  0.1005  0.0929 | -0.9984 -0.9985 |  0.9992  0.9995
optical_flow |  0.0001  0.0002 |  0.0288  0.0274 | -1.4803 -0.9681 |  1.1770  1.1920
v_err    | -0.0089 |  0.0567 | -0.4530 |  0.1530
landing_rewards |    7.81 |    4.14 |    0.00 |   10.00
landing_margin |   -0

attitude |    0.02   -0.01   -0.03 |    1.12    0.65    1.79 |   -3.14   -1.56   -3.14 |    3.14    1.53    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.10   -0.05   -0.05 |    0.10    0.08    0.08
a_f      |   -0.01   -0.01 |    0.66    1.78 |   -1.49   -3.11 |    1.49    3.13
w_f      |    0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.03   -0.03 |    0.04    0.03    0.03
w_rewards |   -0.58 |    0.51 |   -6.01 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.32 |    0.29 |    0.00 |    2.53
seeker_angles |    0.00    0.00 |    0.10    0.10 |   -0.99   -0.99 |    1.00    0.99
cs_angles |  0.0039  0.0013 |  0.0972  0.0984 | -0.9934 -0.9941 |  0.9994  0.9885
optical_flow |  0.0000  0.0002 |  0.0289  0.0284 | -1.1907 -1.3052 |  1.7534  1.7903
v_err    | -0.0092 |  0.0569 | -0.4909 |  0.1516
landing_rewards |    8.03 |    3.98 |    0.00 |   10.00
landing_margin |   -0

w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.09   -0.05   -0.05 |    0.09    0.09    0.08
a_f      |    0.02   -0.28 |    0.69    1.83 |   -1.51   -3.09 |    1.43    3.10
w_f      |    0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.03   -0.03 |    0.05    0.03    0.03
w_rewards |   -0.57 |    0.37 |   -1.75 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.32 |    0.29 |    0.00 |    2.63
seeker_angles |    0.00    0.00 |    0.10    0.10 |   -1.00   -0.99 |    0.99    1.00
cs_angles |  0.0045  0.0043 |  0.0976  0.0963 | -0.9980 -0.9892 |  0.9944  0.9980
optical_flow |  0.0000  0.0001 |  0.0279  0.0273 | -1.2744 -1.1437 |  1.2271  1.0967
v_err    | -0.0089 |  0.0566 | -0.4556 |  0.1439
landing_rewards |    7.90 |    4.07 |    0.00 |   10.00
landing_margin |   -0.02 |    0.02 |   -0.07 |    0.07
tracking_rewards |  -29.20 |    6.39 |  -61.76 |  -18.79
steps    |     376 |  

thrust   |    0.01    0.00    0.00 |    0.71    0.71    0.71 |   -3.44   -3.46   -3.46 |    3.41    3.40    3.46
norm_thrust |    0.98 |    0.75 |    0.00 |    3.46
fuel     |    1.74 |    0.21 |    1.18 |    2.39
rewards  |  -25.86 |    7.68 |  -56.79 |  -12.86
fuel_rewards |   -4.97 |    0.61 |   -6.84 |   -3.40
glideslope_rewards |    0.00 |    0.00 |    0.00 |    0.00
glideslope_penalty |    0.00 |    0.00 |    0.00 |    0.00
glideslope |    2.83 |   12.52 |    0.01 |  452.52
norm_af  |    1.73 |    0.93 |    0.06 |    3.22
norm_wf  |    0.02 |    0.01 |    0.00 |    0.04
rh_penalty |    0.00 |    0.00 |    0.00 |    0.00
att_rewards |    0.00 |    0.00 |    0.00 |    0.00
att_penalty |    0.00 |    0.00 |    0.00 |    0.00
attitude |    0.02   -0.07   -0.20 |    1.21    0.64    1.84 |   -3.14   -1.55   -3.14 |    3.14    1.54    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.10   -0.05   -0.05 |    0.07    0.08    0.08
a_f      |   -0.06   -0.11 |    0.63

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.2705   0.5324   2.4691  17.7841  13.7419   6.6061
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0080   0.0032   0.0168   6.6368   2.2852   2.4929
Update Cnt = 1000    ET =   1069.0   Stats:  Mean, Std, Min, Max
r_f      |    3.30    0.82    8.95 |  186.69  172.46  199.93 | -387.54 -368.44 -397.51 |  378.36  369.51  376.67
v_f      |   -0.00   -0.00   -0.00 |    0.05    0.05    0.05 |   -0.11   -0.14   -0.13 |    0.18    0.11    0.12
r_i      |   -2.87    1.14   29.41 |  694.92  655.67  759.40 |-1255.60-1320.84-1340.62 | 1354.95 1304.00 1316.85
v_i      |    0.00   -0.00   -0.00 |    0.04    0.04    0.05 |   -0.09   -0.09   -0.10 |    0.09    0.09    0.09
norm_rf  |    0.43 |    0.19 |    0.06 |    1.13
norm_vf  |    0.08 |    0.02 |    0.03 |    0.19
gs_f     |    1.49 |    3.53 |    0.01 |   43.40
thrust   |    0.00    0.00   -0.00 |    0.71    0.71    0.71 |   -3.36   -3.45   -3.46 |    3.46    3.41    3.46
norm_thrust |    

ADV1:  -0.0011618636409741932 0.01371816758916072 0.10463070574489941 -0.06575804440290467
ADV2:  0.003516092105915217 0.9439229651428951 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.1011   0.4040   2.3543  17.7841  13.7419   6.6061
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0021   0.0012   0.0038   6.6368   2.2852   2.4929
***** Episode 31325, Mean R = -27.4  Std R = 8.0  Min R = -46.1
PolicyLoss: -0.000693
Policy_Beta: 0.114
Policy_Entropy: 0.11
Policy_KL: 0.00147
Policy_SD: 0.59
Policy_lr_mult: 0.198
Steps: 1.15e+04
TotalSteps: 1.11e+07
VF_0_ExplainedVarNew: 0.967
VF_0_ExplainedVarOld: 0.964
VF_0_Loss : 0.00252


ADV1:  0.0028268432088264807 0.013084156997175203 0.0561747649496232 -0.12339639696075544
ADV2:  0.010032041702545933 0.838219768797841 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.1539   0.6112   3.3507  17.7841  13.7419   6.6061
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0043   0.0023   0.0080   6.6368   2.2852   2.492

ADV1:  0.0011667568985272785 0.01353477314632339 0.17006132523420792 -0.1438284192171041
ADV2:  -0.001815518575475243 0.8736559807446546 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.0317   0.5341   2.8968  17.7841  13.7419   6.6061
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0037   0.0015   0.0077   6.6368   2.2852   2.4929
***** Episode 31604, Mean R = -25.0  Std R = 6.0  Min R = -37.1
PolicyLoss: -0.00789
Policy_Beta: 0.114
Policy_Entropy: 0.109
Policy_KL: 0.00117
Policy_SD: 0.587
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 1.12e+07
VF_0_ExplainedVarNew: 0.966
VF_0_ExplainedVarOld: 0.96
VF_0_Loss : 0.00276


ADV1:  -0.0004226105512539228 0.012411874119148836 0.0858957869311997 -0.09013248000300576
ADV2:  0.0053111699075527215 0.9288440277154058 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.8066   0.3422   1.7293  17.7841  13.7419   6.6061
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0009   0.0005   0.0016   6.6368   2.2852   2.4

ADV1:  -0.00032234609251341993 0.01417436253319601 0.059112539144553944 -0.13253920653295714
ADV2:  0.0179382264726976 0.8824756609381834 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.7878   1.3769   6.0335  17.7841  13.7419   6.6061
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0007   0.0003   0.0013   6.6368   2.2852   2.4929
***** Episode 31883, Mean R = -26.6  Std R = 10.1  Min R = -49.3
PolicyLoss: -0.02
Policy_Beta: 0.0759
Policy_Entropy: 0.106
Policy_KL: 0.000681
Policy_SD: 0.613
Policy_lr_mult: 0.198
Steps: 1.15e+04
TotalSteps: 1.13e+07
VF_0_ExplainedVarNew: 0.969
VF_0_ExplainedVarOld: 0.961
VF_0_Loss : 0.00209


ADV1:  0.0021243190522607985 0.012277725934359156 0.18975419977019786 -0.0650803959758337
ADV2:  -0.012994502206148513 0.8942167665731139 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.3090   0.7093   3.1844  17.7841  13.7419   6.6061
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0029   0.0011   0.0054   6.6368   2.2852   2.

***** Episode 32131, Mean R = -26.5  Std R = 7.3  Min R = -45.7
PolicyLoss: -0.0133
Policy_Beta: 0.0759
Policy_Entropy: 0.108
Policy_KL: 0.000728
Policy_SD: 0.6
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 1.14e+07
VF_0_ExplainedVarNew: 0.966
VF_0_ExplainedVarOld: 0.961
VF_0_Loss : 0.00278


ADV1:  -0.012501860398559432 0.1506077250374024 0.06083459027874044 -4.600410479829857
ADV2:  0.04663383985063129 0.23570883527996558 0.4742989400880976 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.2036   0.0693   0.3422  17.7841  13.7419   6.6061
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0126   0.0079   0.0300   6.6368   2.2852   2.4929
***** Episode 32162, Mean R = -32.3  Std R = 30.8  Min R = -196.1
PolicyLoss: -0.0436
Policy_Beta: 0.114
Policy_Entropy: 0.111
Policy_KL: 0.000461
Policy_SD: 0.6
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 1.14e+07
VF_0_ExplainedVarNew: 0.699
VF_0_ExplainedVarOld: 0.356
VF_0_Loss : 0.0148


ADV1:  0.007689336616721888 0.0195019679

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.4520   0.8896   4.8009  17.7841  13.7419   6.6061
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0014   0.0007   0.0027   6.6368   2.2852   2.4929
***** Episode 32410, Mean R = -29.3  Std R = 12.1  Min R = -70.2
PolicyLoss: -0.0109
Policy_Beta: 0.114
Policy_Entropy: 0.11
Policy_KL: 0.0013
Policy_SD: 0.61
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 1.15e+07
VF_0_ExplainedVarNew: 0.955
VF_0_ExplainedVarOld: 0.949
VF_0_Loss : 0.00249


ADV1:  0.0018669604013417016 0.017950915659984416 0.358315274382836 -0.1392544015682804
ADV2:  -0.030642698353323488 0.6660250577529315 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.8461   0.3353   1.5645  17.7841  13.7419   6.6061
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0034   0.0012   0.0053   6.6368   2.2852   2.4929
***** Episode 32441, Mean R = -25.2  Std R = 7.5  Min R = -45.7
PolicyLoss: 0.023
Policy_Beta: 0.114
Policy_Entropy: 0.109
Policy_KL: 0.0016
Policy

ADV1:  0.0003674289306786243 0.01644004788429798 0.10156322351440128 -0.2594242534832838
ADV2:  0.007263277308027435 0.8429020854826386 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.1886   0.7721   4.1659  17.7841  13.7419   6.6061
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0007   0.0004   0.0021   6.6368   2.2852   2.4929
***** Episode 32689, Mean R = -25.8  Std R = 7.9  Min R = -46.5
PolicyLoss: -0.0129
Policy_Beta: 0.114
Policy_Entropy: 0.112
Policy_KL: 0.00152
Policy_SD: 0.576
Policy_lr_mult: 0.198
Steps: 1.18e+04
TotalSteps: 1.16e+07
VF_0_ExplainedVarNew: 0.961
VF_0_ExplainedVarOld: 0.945
VF_0_Loss : 0.0013


ADV1:  0.0012756037048251552 0.04467815950992 0.8442589518505683 -0.13253740599480024
ADV2:  -0.045120160906235676 0.3863037148969393 3.0 -2.9026630236664217
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.4954   0.2188   1.1777  17.7841  13.7419   6.6061
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0020   0.0021   0.0109   6.6368   2.28

***** Episode 32937, Mean R = -25.2  Std R = 7.5  Min R = -47.8
PolicyLoss: -0.00711
Policy_Beta: 0.114
Policy_Entropy: 0.116
Policy_KL: 0.00165
Policy_SD: 0.575
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 1.17e+07
VF_0_ExplainedVarNew: 0.967
VF_0_ExplainedVarOld: 0.963
VF_0_Loss : 0.00202


ADV1:  -0.0010728932226306946 0.01231638229666083 0.06750746025073939 -0.09985340652444019
ADV2:  0.017510059886665826 0.9061311222959411 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.3183   0.6281   2.8616  17.7841  13.7419   6.6061
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0022   0.0014   0.0049   6.6368   2.2852   2.4929
***** Episode 32968, Mean R = -26.5  Std R = 6.9  Min R = -46.5
PolicyLoss: -0.015
Policy_Beta: 0.114
Policy_Entropy: 0.112
Policy_KL: 0.00159
Policy_SD: 0.596
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 1.17e+07
VF_0_ExplainedVarNew: 0.97
VF_0_ExplainedVarOld: 0.968
VF_0_Loss : 0.00191


ADV1:  0.0026126515818444183 0.011340293633699691 0.

***** Episode 33216, Mean R = -28.2  Std R = 8.5  Min R = -46.9
PolicyLoss: -0.00572
Policy_Beta: 0.114
Policy_Entropy: 0.115
Policy_KL: 0.0013
Policy_SD: 0.592
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 1.18e+07
VF_0_ExplainedVarNew: 0.964
VF_0_ExplainedVarOld: 0.96
VF_0_Loss : 0.00224


ADV1:  0.0014199391133846487 0.01451025832093814 0.0637251123239091 -0.22387051739313657
ADV2:  0.005882151680180729 0.8660991527445592 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.9234   0.9187   5.1316  17.7841  13.7419   6.6061
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0024   0.0012   0.0044   6.6368   2.2852   2.4929
***** Episode 33247, Mean R = -24.7  Std R = 7.0  Min R = -38.9
PolicyLoss: -0.0178
Policy_Beta: 0.114
Policy_Entropy: 0.115
Policy_KL: 0.00133
Policy_SD: 0.578
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 1.18e+07
VF_0_ExplainedVarNew: 0.954
VF_0_ExplainedVarOld: 0.951
VF_0_Loss : 0.00194


ADV1:  0.003101158488011758 0.01263760852106117 0.0857

cs_angles | -0.0031  0.0034 |  0.0957  0.0966 | -0.9850 -0.9997 |  0.9918  0.9896
optical_flow | -0.0001  0.0001 |  0.0282  0.0276 | -1.2928 -1.0451 |  1.4641  1.2737
v_err    | -0.0094 |  0.0565 | -0.4519 |  0.1579
landing_rewards |    8.35 |    3.71 |    0.00 |   10.00
landing_margin |   -0.02 |    0.02 |   -0.07 |    0.06
tracking_rewards |  -28.41 |    6.05 |  -53.87 |  -17.77
steps    |     375 |      20 |     336 |     417
***** Episode 33526, Mean R = -27.1  Std R = 8.6  Min R = -50.2
PolicyLoss: -0.0036
Policy_Beta: 0.114
Policy_Entropy: 0.112
Policy_KL: 0.00149
Policy_SD: 0.594
Policy_lr_mult: 0.198
Steps: 1.18e+04
TotalSteps: 1.19e+07
VF_0_ExplainedVarNew: 0.964
VF_0_ExplainedVarOld: 0.961
VF_0_Loss : 0.00236


ADV1:  -0.0013134302100219607 0.014394015885540509 0.06403764313705579 -0.09699771273591834
ADV2:  0.013295550945736357 0.9299990501370196 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.9326   0.4470   2.1521  17.7841  13.7419   6.6061
ValFun  Gradients:

attitude |    0.00   -0.00   -0.02 |    1.22    0.69    1.80 |   -3.14   -1.56   -3.14 |    3.14    1.57    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.09   -0.05   -0.05 |    0.09    0.07    0.08
a_f      |    0.00   -0.04 |    0.71    1.79 |   -1.48   -3.11 |    1.49    3.12
w_f      |    0.00    0.00    0.00 |    0.02    0.01    0.01 |   -0.03   -0.03   -0.02 |    0.04    0.04    0.03
w_rewards |   -0.53 |    0.40 |   -2.52 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.31 |    0.30 |    0.00 |    2.92
seeker_angles |    0.00    0.01 |    0.10    0.09 |   -1.00   -0.98 |    0.99    0.98
cs_angles |  0.0036  0.0055 |  0.0971  0.0934 | -1.0000 -0.9778 |  0.9880  0.9808
optical_flow |  0.0001  0.0000 |  0.0281  0.0274 | -0.9743 -1.1127 |  1.2820  1.1348
v_err    | -0.0093 |  0.0565 | -0.4528 |  0.1423
landing_rewards |    8.26 |    3.79 |    0.00 |   10.00
landing_margin |   -0

attitude |   -0.04    0.01    0.06 |    1.20    0.66    1.85 |   -3.14   -1.54   -3.14 |    3.14    1.57    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.09   -0.05   -0.05 |    0.08    0.07    0.08
a_f      |    0.01   -0.02 |    0.67    1.83 |   -1.48   -3.13 |    1.57    3.14
w_f      |    0.00    0.00   -0.00 |    0.02    0.01    0.01 |   -0.04   -0.03   -0.03 |    0.04    0.04    0.02
w_rewards |   -0.50 |    0.35 |   -1.92 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.30 |    0.29 |    0.00 |    2.76
seeker_angles |    0.01    0.01 |    0.09    0.09 |   -1.00   -1.00 |    0.99    1.00
cs_angles |  0.0066  0.0085 |  0.0906  0.0944 | -0.9973 -0.9983 |  0.9935  0.9990
optical_flow | -0.0001  0.0001 |  0.0278  0.0282 | -1.1569 -1.4992 |  1.0874  1.0027
v_err    | -0.0096 |  0.0562 | -0.4522 |  0.1582
landing_rewards |    8.19 |    3.85 |    0.00 |   10.00
landing_margin |   -0

attitude |   -0.03   -0.03   -0.03 |    1.16    0.66    1.86 |   -3.14   -1.56   -3.14 |    3.14    1.56    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.09   -0.05   -0.05 |    0.08    0.08    0.08
a_f      |   -0.03    0.01 |    0.66    1.85 |   -1.39   -3.14 |    1.47    3.11
w_f      |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.03   -0.03   -0.04 |    0.04    0.03    0.02
w_rewards |   -0.50 |    0.40 |   -2.34 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.31 |    0.30 |    0.00 |    2.77
seeker_angles |    0.01    0.01 |    0.09    0.10 |   -1.00   -0.99 |    1.00    1.00
cs_angles |  0.0067  0.0093 |  0.0944  0.0951 | -0.9981 -0.9911 |  0.9966  0.9984
optical_flow | -0.0000  0.0000 |  0.0278  0.0275 | -1.2973 -1.2300 |  1.1015  1.1206
v_err    | -0.0099 |  0.0562 | -0.4998 |  0.1326
landing_rewards |    8.52 |    3.55 |    0.00 |   10.00
landing_margin |   -0

w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.10   -0.05   -0.05 |    0.10    0.08    0.08
a_f      |   -0.06   -0.04 |    0.66    1.89 |   -1.47   -3.14 |    1.56    3.14
w_f      |    0.00    0.00    0.00 |    0.02    0.01    0.01 |   -0.10   -0.03   -0.03 |    0.10    0.03    0.04
w_rewards |   -0.53 |    0.43 |   -3.41 |    0.00
w_penalty |   -0.65 |    8.01 | -100.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.31 |    0.30 |    0.00 |    2.94
seeker_angles |    0.00    0.01 |    0.10    0.09 |   -1.00   -1.00 |    0.99    0.98
cs_angles |  0.0046  0.0077 |  0.0951  0.0919 | -0.9967 -0.9997 |  0.9871  0.9817
optical_flow | -0.0001 -0.0001 |  0.0276  0.0274 | -1.2203 -1.1398 |  1.1417  1.2773
v_err    | -0.0099 |  0.0557 | -0.4536 |  0.1351
landing_rewards |    8.45 |    3.62 |    0.00 |   10.00
landing_margin |    6.04 |   75.28 |   -0.08 |  974.91
tracking_rewards |  -27.85 |    5.44 |  -49.07 |   -8.97
steps    |     376 |  

attitude |    0.12   -0.01    0.17 |    1.23    0.62    1.92 |   -3.14   -1.57   -3.14 |    3.14    1.55    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.10   -0.05   -0.05 |    0.08    0.08    0.08
a_f      |    0.00    0.14 |    0.62    1.93 |   -1.55   -3.13 |    1.41    3.13
w_f      |    0.00    0.00    0.00 |    0.02    0.01    0.01 |   -0.10   -0.03   -0.03 |    0.05    0.04    0.03
w_rewards |   -0.52 |    0.39 |   -2.07 |    0.00
w_penalty |   -0.32 |    5.67 | -100.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.31 |    0.30 |    0.00 |    3.01
seeker_angles |    0.00    0.00 |    0.09    0.10 |   -0.99   -1.00 |    0.99    0.98
cs_angles |  0.0009  0.0049 |  0.0941  0.0967 | -0.9911 -0.9960 |  0.9888  0.9806
optical_flow | -0.0000 -0.0001 |  0.0284  0.0274 | -1.2666 -1.2627 |  1.3534  1.0991
v_err    | -0.0096 |  0.0558 | -0.4535 |  0.2026
landing_rewards |    8.81 |    3.24 |    0.00 |   10.00
landing_margin |    2

w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.09   -0.08   -0.07 |    0.10    0.08    0.08
a_f      |   -0.08   -0.22 |    0.68    1.85 |   -1.42   -3.13 |    1.44    3.14
w_f      |    0.00    0.00   -0.00 |    0.02    0.01    0.01 |   -0.04   -0.03   -0.03 |    0.04    0.04    0.03
w_rewards |   -0.54 |    0.88 |  -14.43 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |   -0.16 |    2.84 |  -50.00 |    0.00
theta_cv |    0.31 |    0.31 |    0.00 |    3.05
seeker_angles |    0.01    0.00 |    0.10    0.09 |   -1.00   -1.00 |    1.00    1.00
cs_angles |  0.0053  0.0009 |  0.0958  0.0948 | -0.9960 -0.9967 |  0.9966  0.9996
optical_flow | -0.0001  0.0001 |  0.0278  0.0270 | -1.1811 -1.2034 |  1.4837  1.2009
v_err    | -0.0090 |  0.0569 | -0.4528 |  0.6788
landing_rewards |    8.26 |    3.79 |    0.00 |   10.00
landing_margin |    1.23 |   21.92 |   -0.06 |  386.56
tracking_rewards |  -28.20 |    7.90 | -128.52 |  -17.68
steps    |     375 |  

attitude |   -0.03   -0.03   -0.21 |    1.30    0.63    1.94 |   -3.14   -1.54   -3.14 |    3.14    1.57    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.09   -0.05   -0.05 |    0.09    0.08    0.08
a_f      |   -0.04   -0.18 |    0.63    1.93 |   -1.46   -3.12 |    1.51    3.13
w_f      |    0.00    0.00    0.00 |    0.02    0.01    0.01 |   -0.03   -0.02   -0.03 |    0.04    0.03    0.02
w_rewards |   -0.53 |    0.45 |   -2.69 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.32 |    0.31 |    0.00 |    3.03
seeker_angles |    0.01    0.00 |    0.10    0.09 |   -0.99   -0.99 |    1.00    0.97
cs_angles |  0.0058  0.0013 |  0.0977  0.0948 | -0.9927 -0.9943 |  0.9992  0.9713
optical_flow | -0.0002 -0.0001 |  0.0283  0.0264 | -1.4718 -1.1158 |  1.5592  0.9799
v_err    | -0.0090 |  0.0564 | -0.4987 |  0.2013
landing_rewards |    8.23 |    3.82 |    0.00 |   10.00
landing_margin |   -0

attitude |    0.04    0.03    0.08 |    1.18    0.62    1.79 |   -3.14   -1.54   -3.14 |    3.14    1.53    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.09   -0.05   -0.05 |    0.08    0.08    0.08
a_f      |    0.03    0.13 |    0.62    1.79 |   -1.44   -3.13 |    1.43    3.12
w_f      |    0.00   -0.00    0.00 |    0.02    0.01    0.01 |   -0.04   -0.02   -0.03 |    0.05    0.03    0.03
w_rewards |   -0.59 |    0.41 |   -3.03 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.30 |    0.30 |    0.00 |    2.94
seeker_angles |    0.01    0.00 |    0.09    0.09 |   -1.00   -1.00 |    1.00    1.00
cs_angles |  0.0078  0.0002 |  0.0948  0.0893 | -0.9987 -0.9959 |  0.9968  0.9993
optical_flow | -0.0001  0.0000 |  0.0273  0.0275 | -1.0462 -1.1183 |  0.9473  0.9813
v_err    | -0.0094 |  0.0571 | -0.4853 |  0.1476
landing_rewards |    8.32 |    3.74 |    0.00 |   10.00
landing_margin |   -0

attitude |   -0.04   -0.03    0.06 |    1.18    0.68    1.85 |   -3.14   -1.56   -3.14 |    3.14    1.57    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.10   -0.05   -0.05 |    0.08    0.07    0.08
a_f      |   -0.03   -0.01 |    0.68    1.85 |   -1.52   -3.13 |    1.53    3.10
w_f      |    0.00    0.00   -0.00 |    0.02    0.01    0.01 |   -0.03   -0.03   -0.03 |    0.05    0.04    0.02
w_rewards |   -0.53 |    0.38 |   -2.49 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.31 |    0.30 |    0.00 |    3.04
seeker_angles |    0.01   -0.00 |    0.10    0.09 |   -0.98   -0.99 |    1.00    0.99
cs_angles |  0.0080 -0.0010 |  0.1000  0.0923 | -0.9844 -0.9947 |  0.9977  0.9910
optical_flow | -0.0001  0.0001 |  0.0280  0.0268 | -1.1716 -1.3707 |  1.1892  1.0058
v_err    | -0.0089 |  0.0558 | -0.4530 |  0.1499
landing_rewards |    8.42 |    3.65 |    0.00 |   10.00
landing_margin |   -0

attitude |   -0.13   -0.06    0.02 |    1.31    0.69    1.86 |   -3.14   -1.57   -3.14 |    3.14    1.56    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.10   -0.05   -0.05 |    0.07    0.08    0.08
a_f      |   -0.06    0.10 |    0.68    1.85 |   -1.43   -3.14 |    1.44    3.14
w_f      |    0.00    0.00   -0.00 |    0.02    0.01    0.01 |   -0.10   -0.03   -0.04 |    0.04    0.04    0.02
w_rewards |   -0.54 |    0.42 |   -3.31 |    0.00
w_penalty |   -0.32 |    5.67 | -100.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.30 |    0.29 |    0.00 |    3.03
seeker_angles |    0.00    0.00 |    0.09    0.09 |   -1.00   -0.99 |    1.00    0.98
cs_angles |  0.0026  0.0045 |  0.0926  0.0888 | -0.9951 -0.9944 |  0.9993  0.9772
optical_flow |  0.0000 -0.0001 |  0.0274  0.0274 | -0.9701 -1.0786 |  1.3361  0.9901
v_err    | -0.0094 |  0.0559 | -0.4937 |  0.1783
landing_rewards |    8.45 |    3.62 |    0.00 |   10.00
landing_margin |    3

attitude |    0.01    0.04    0.04 |    1.17    0.65    1.88 |   -3.14   -1.55   -3.14 |    3.14    1.56    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.08   -0.05   -0.05 |    0.08    0.07    0.08
a_f      |    0.07   -0.02 |    0.66    1.87 |   -1.39   -3.14 |    1.52    3.07
w_f      |    0.00    0.00   -0.00 |    0.02    0.01    0.01 |   -0.04   -0.03   -0.02 |    0.04    0.03    0.02
w_rewards |   -0.54 |    0.39 |   -1.72 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.30 |    0.29 |    0.00 |    2.88
seeker_angles |    0.01    0.00 |    0.09    0.09 |   -0.99   -0.99 |    0.99    0.99
cs_angles |  0.0063  0.0027 |  0.0916  0.0908 | -0.9891 -0.9897 |  0.9901  0.9910
optical_flow | -0.0000 -0.0000 |  0.0276  0.0281 | -1.3415 -1.2444 |  1.0330  1.3426
v_err    | -0.0084 |  0.0557 | -0.4531 |  0.1676
landing_rewards |    8.61 |    3.46 |    0.00 |   10.00
landing_margin |   -0

thrust   |   -0.00   -0.00    0.00 |    0.72    0.73    0.73 |   -3.46   -3.43   -3.46 |    3.43    3.46    3.45
norm_thrust |    0.99 |    0.77 |    0.00 |    3.46
fuel     |    1.74 |    0.24 |    1.24 |    2.60
rewards  |  -24.94 |    8.27 |  -84.53 |  -11.45
fuel_rewards |   -4.98 |    0.69 |   -7.45 |   -3.55
glideslope_rewards |    0.00 |    0.00 |    0.00 |    0.00
glideslope_penalty |    0.00 |    0.00 |    0.00 |    0.00
glideslope |    2.90 |   13.37 |    0.01 | 1255.96
norm_af  |    1.80 |    0.91 |    0.07 |    3.29
norm_wf  |    0.02 |    0.01 |    0.00 |    0.05
rh_penalty |    0.00 |    0.00 |    0.00 |    0.00
att_rewards |    0.00 |    0.00 |    0.00 |    0.00
att_penalty |    0.00 |    0.00 |    0.00 |    0.00
attitude |    0.11    0.08    0.05 |    1.26    0.69    1.88 |   -3.14   -1.54   -3.14 |    3.14    1.55    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.10   -0.05   -0.05 |    0.09    0.08    0.08
a_f      |    0.09    0.03 |    0.69

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.1583   0.9558   4.9392  17.7841  13.7419   6.6061
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0049   0.0030   0.0103   6.6368   2.2852   2.4929
Update Cnt = 1210    ET =   1101.3   Stats:  Mean, Std, Min, Max
r_f      |    1.23    4.54  -17.98 |  170.10  166.13  208.70 | -367.88 -384.28 -399.97 |  387.08  366.16  381.55
v_f      |    0.00    0.00    0.01 |    0.05    0.05    0.05 |   -0.13   -0.11   -0.12 |    0.12    0.12    0.12
r_i      |    1.57  -16.22 -104.20 |  657.73  636.51  783.48 |-1300.87-1316.78-1333.16 | 1322.52 1325.02 1345.92
v_i      |    0.00    0.00    0.01 |    0.04    0.04    0.05 |   -0.10   -0.09   -0.09 |    0.09    0.10    0.09
norm_rf  |    0.37 |    0.15 |    0.04 |    0.91
norm_vf  |    0.08 |    0.02 |    0.02 |    0.14
gs_f     |    1.36 |    1.76 |    0.01 |   12.27
thrust   |   -0.00   -0.00   -0.00 |    0.72    0.71    0.72 |   -3.44   -3.44   -3.44 |    3.46    3.45    3.46
norm_thrust |    

ADV1:  -0.0005212865629976987 0.013165616404860796 0.17004932014250157 -0.06802121555993985
ADV2:  -0.0156953799461964 0.7892589756996123 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.0846   0.7029   3.8931  23.6511  13.7419   8.1346
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0016   0.0008   0.0030   6.6368   2.2852   2.4929
***** Episode 37835, Mean R = -23.0  Std R = 6.9  Min R = -41.4
PolicyLoss: 0.018
Policy_Beta: 0.0759
Policy_Entropy: 0.121
Policy_KL: 0.000597
Policy_SD: 0.584
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 1.35e+07
VF_0_ExplainedVarNew: 0.976
VF_0_ExplainedVarOld: 0.964
VF_0_Loss : 0.00331


Dynamics: Max Disturbance (m/s^2):  [0.00126622 0.00130788 0.00159816] 0.002422386686932909
ADV1:  -0.0022794594404117285 0.012283287368141056 0.09234452475125848 -0.09753860201498088
ADV2:  0.021155327433031827 0.9020065690102763 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.0096   1.3263   6.5541  23.6511  13.7419   8.1346
ValFun

***** Episode 38083, Mean R = -24.7  Std R = 7.5  Min R = -46.1
PolicyLoss: -0.00743
Policy_Beta: 0.0759
Policy_Entropy: 0.12
Policy_KL: 0.000696
Policy_SD: 0.576
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 1.36e+07
VF_0_ExplainedVarNew: 0.957
VF_0_ExplainedVarOld: 0.953
VF_0_Loss : 0.00137


Dynamics: Max Disturbance (m/s^2):  [0.00126622 0.00130788 0.00159816] 0.002422386686932909
ADV1:  0.0028918176414860154 0.014975108657567677 0.07234947416202941 -0.2426417888257929
ADV2:  0.0009305356674952684 0.8190030102065468 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.0692   1.4624   7.0482  23.6511  13.7419   8.1346
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0033   0.0017   0.0081   6.6368   2.2852   2.4929
***** Episode 38114, Mean R = -23.8  Std R = 9.1  Min R = -53.9
PolicyLoss: -0.0201
Policy_Beta: 0.0759
Policy_Entropy: 0.122
Policy_KL: 0.00059
Policy_SD: 0.577
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 1.36e+07
VF_0_ExplainedVarNew: 0.963
VF_0_E

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.9446   1.0270   4.9728  23.6511  13.7419   8.1346
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0027   0.0009   0.0050   6.6368   2.2852   2.4929
***** Episode 38362, Mean R = -25.1  Std R = 8.4  Min R = -54.2
PolicyLoss: -0.0106
Policy_Beta: 0.0759
Policy_Entropy: 0.12
Policy_KL: 0.000795
Policy_SD: 0.571
Policy_lr_mult: 0.198
Steps: 1.18e+04
TotalSteps: 1.37e+07
VF_0_ExplainedVarNew: 0.966
VF_0_ExplainedVarOld: 0.962
VF_0_Loss : 0.00227


Dynamics: Max Disturbance (m/s^2):  [0.00126622 0.00130788 0.00159816] 0.002422386686932909
ADV1:  0.0016179043809786261 0.012021313773174053 0.0654042255787175 -0.11352053531791673
ADV2:  0.0013315042249335775 0.9004626489814874 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.3337   0.5943   3.1081  23.6511  13.7419   8.1346
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0025   0.0012   0.0046   6.6368   2.2852   2.4929
***** Episode 38393, Mean R = -23.6  Std R = 7.2  

Dynamics: Max Disturbance (m/s^2):  [0.00126622 0.00130788 0.00159816] 0.002422386686932909
ADV1:  -0.00030563111517626284 0.013012979124088987 0.06036284389312342 -0.09229937124342136
ADV2:  0.00746992768191782 0.935871312466523 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.3944   0.6570   2.7792  23.6511  13.7419   8.1346
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0022   0.0014   0.0049   6.6368   2.2852   2.4929
***** Episode 38641, Mean R = -24.9  Std R = 8.2  Min R = -47.0
PolicyLoss: -0.00824
Policy_Beta: 0.0759
Policy_Entropy: 0.12
Policy_KL: 0.000609
Policy_SD: 0.585
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 1.38e+07
VF_0_ExplainedVarNew: 0.968
VF_0_ExplainedVarOld: 0.965
VF_0_Loss : 0.00322


ADV1:  0.0028362510098046034 0.009614760495991583 0.05719829727224324 -0.05660921510490169
ADV2:  -0.012008053293900775 0.9192537751236112 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.4661   0.8439   4.5053  23.6511  13.7419   8.1346
ValF

***** Episode 38889, Mean R = -22.6  Std R = 7.2  Min R = -42.8
PolicyLoss: -0.0194
Policy_Beta: 0.114
Policy_Entropy: 0.122
Policy_KL: 0.00115
Policy_SD: 0.563
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 1.39e+07
VF_0_ExplainedVarNew: 0.966
VF_0_ExplainedVarOld: 0.964
VF_0_Loss : 0.00192


Dynamics: Max Disturbance (m/s^2):  [0.00126622 0.00130788 0.00159816] 0.002422386686932909
ADV1:  0.005036051211931834 0.01061736727851133 0.0711357962270624 -0.05894132891661097
ADV2:  -0.026052122830147295 0.8933223766249799 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.7366   1.4451   7.0399  23.6511  13.7419   8.1346
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0063   0.0045   0.0135   6.6368   2.2852   2.4929
***** Episode 38920, Mean R = -24.4  Std R = 7.2  Min R = -41.4
PolicyLoss: -0.0161
Policy_Beta: 0.114
Policy_Entropy: 0.12
Policy_KL: 0.00191
Policy_SD: 0.59
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 1.39e+07
VF_0_ExplainedVarNew: 0.982
VF_0_Explaine

ADV1:  0.0039508797638864775 0.012811918201912614 0.06034201805030573 -0.16672229397770588
ADV2:  -0.005315504309356802 0.8590192494035823 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.3433   0.5949   2.7717  23.6511  13.7419   8.1346
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0043   0.0027   0.0103   6.6368   2.2852   2.4929
***** Episode 39168, Mean R = -21.3  Std R = 6.1  Min R = -43.2
PolicyLoss: -0.0221
Policy_Beta: 0.114
Policy_Entropy: 0.123
Policy_KL: 0.00127
Policy_SD: 0.55
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 1.4e+07
VF_0_ExplainedVarNew: 0.966
VF_0_ExplainedVarOld: 0.962
VF_0_Loss : 0.00428


ADV1:  -0.0010371291020614974 0.011606395984749275 0.05898512117654919 -0.10444943052931799
ADV2:  0.019783577015332336 0.8895383212482971 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.8395   0.7446   3.4166  23.6511  13.7419   8.1346
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0023   0.0012   0.0044   6.6368   2.2852   2.4

Dynamics: Max Disturbance (m/s^2):  [0.00126622 0.00130788 0.00159816] 0.002422386686932909
ADV1:  0.0006248631436365111 0.015100131005258147 0.07664127730608677 -0.12778927656115735
ADV2:  0.009770636675874345 0.8983962864014772 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.8725   0.8045   4.6165  23.6511  13.7419   8.1346
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0017   0.0009   0.0032   6.6368   2.2852   2.4929
***** Episode 39447, Mean R = -24.8  Std R = 7.6  Min R = -46.2
PolicyLoss: -0.017
Policy_Beta: 0.114
Policy_Entropy: 0.124
Policy_KL: 0.00161
Policy_SD: 0.566
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 1.41e+07
VF_0_ExplainedVarNew: 0.959
VF_0_ExplainedVarOld: 0.955
VF_0_Loss : 0.00766


ADV1:  0.00026581088598048733 0.013720972975286032 0.0627760257696359 -0.08059570360540695
ADV2:  0.004814678998108389 0.9195269343460352 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.6703   1.3593   6.0360  23.6511  13.7419   8.1346
ValFun  

seeker_angles |    0.01    0.01 |    0.09    0.09 |   -1.00   -0.99 |    1.00    0.99
cs_angles |  0.0054  0.0053 |  0.0946  0.0923 | -0.9955 -0.9876 |  0.9974  0.9913
optical_flow | -0.0001  0.0000 |  0.0287  0.0257 | -1.4336 -1.3345 |  1.2456  1.2133
v_err    | -0.0084 |  0.0558 | -0.4533 |  0.1233
landing_rewards |    8.68 |    3.39 |    0.00 |   10.00
landing_margin |   -0.02 |    0.02 |   -0.06 |    0.06
tracking_rewards |  -26.96 |    6.43 |  -69.13 |  -16.79
steps    |     376 |      20 |     331 |     415
***** Episode 39726, Mean R = -22.9  Std R = 8.6  Min R = -46.0
PolicyLoss: -0.00409
Policy_Beta: 0.114
Policy_Entropy: 0.124
Policy_KL: 0.00111
Policy_SD: 0.572
Policy_lr_mult: 0.198
Steps: 1.18e+04
TotalSteps: 1.42e+07
VF_0_ExplainedVarNew: 0.975
VF_0_ExplainedVarOld: 0.971
VF_0_Loss : 0.00974


ADV1:  -0.0026463907096772273 0.013528734275467594 0.07249962191366899 -0.08033145962943032
ADV2:  0.019611204295763376 0.9348367697331054 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/

seeker_angles |    0.00    0.00 |    0.09    0.09 |   -0.98   -0.99 |    0.99    1.00
cs_angles |  0.0043  0.0048 |  0.0913  0.0892 | -0.9759 -0.9893 |  0.9909  0.9996
optical_flow |  0.0002  0.0001 |  0.0286  0.0276 | -1.1847 -1.6328 |  1.0613  1.2366
v_err    | -0.0086 |  0.0557 | -0.4533 |  0.1785
landing_rewards |    8.68 |    3.39 |    0.00 |   10.00
landing_margin |   -0.02 |    0.02 |   -0.07 |    0.07
tracking_rewards |  -26.58 |    5.47 |  -49.28 |  -16.40
steps    |     376 |      20 |     331 |     422
***** Episode 40036, Mean R = -23.2  Std R = 7.7  Min R = -49.7
PolicyLoss: -0.0334
Policy_Beta: 0.114
Policy_Entropy: 0.124
Policy_KL: 0.00131
Policy_SD: 0.581
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 1.43e+07
VF_0_ExplainedVarNew: 0.947
VF_0_ExplainedVarOld: 0.929
VF_0_Loss : 0.0114


ADV1:  -0.0012544438512493439 0.015102555581877928 0.08905143631553519 -0.2925430018571812
ADV2:  0.024460598057597333 0.8199121982068169 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max

attitude |    0.08   -0.01    0.05 |    1.17    0.66    1.82 |   -3.14   -1.57   -3.14 |    3.14    1.56    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.09   -0.05   -0.05 |    0.10    0.08    0.08
a_f      |   -0.00   -0.03 |    0.66    1.83 |   -1.51   -3.14 |    1.48    3.13
w_f      |    0.00    0.00    0.00 |    0.02    0.01    0.01 |   -0.04   -0.03   -0.03 |    0.05    0.04    0.02
w_rewards |   -0.52 |    0.43 |   -2.76 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.30 |    0.30 |    0.00 |    2.75
seeker_angles |    0.00    0.00 |    0.09    0.09 |   -0.97   -0.99 |    1.00    1.00
cs_angles |  0.0027  0.0037 |  0.0916  0.0932 | -0.9729 -0.9907 |  0.9989  0.9952
optical_flow | -0.0000  0.0000 |  0.0282  0.0258 | -1.2304 -1.2290 |  1.2239  0.9357
v_err    | -0.0089 |  0.0556 | -0.4708 |  0.1352
landing_rewards |    8.52 |    3.55 |    0.00 |   10.00
landing_margin |   -0

attitude |   -0.03   -0.01   -0.00 |    1.27    0.66    1.92 |   -3.14   -1.57   -3.14 |    3.14    1.55    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.08   -0.05   -0.05 |    0.08    0.08    0.08
a_f      |   -0.02   -0.07 |    0.66    1.91 |   -1.51   -3.09 |    1.47    3.14
w_f      |    0.00    0.00   -0.00 |    0.02    0.01    0.01 |   -0.05   -0.03   -0.03 |    0.05    0.03    0.02
w_rewards |   -0.48 |    0.35 |   -1.54 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.31 |    0.30 |    0.00 |    3.07
seeker_angles |    0.00    0.00 |    0.09    0.09 |   -0.99   -0.98 |    1.00    0.99
cs_angles |  0.0018  0.0029 |  0.0905  0.0925 | -0.9856 -0.9837 |  0.9994  0.9916
optical_flow |  0.0002 -0.0001 |  0.0280  0.0265 | -1.3280 -1.4028 |  1.3465  1.1607
v_err    | -0.0090 |  0.0552 | -0.4518 |  0.1419
landing_rewards |    8.48 |    3.59 |    0.00 |   10.00
landing_margin |   -0

w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.10   -0.05   -0.05 |    0.09    0.08    0.08
a_f      |    0.03   -0.03 |    0.61    1.83 |   -1.47   -3.13 |    1.53    3.13
w_f      |    0.00    0.00    0.00 |    0.02    0.01    0.01 |   -0.10   -0.03   -0.03 |    0.04    0.03    0.03
w_rewards |   -0.53 |    0.44 |   -3.01 |    0.00
w_penalty |   -0.32 |    5.67 | -100.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.30 |    0.31 |    0.00 |    3.06
seeker_angles |    0.00    0.00 |    0.09    0.09 |   -1.00   -0.99 |    0.99    0.97
cs_angles |  0.0014  0.0049 |  0.0899  0.0910 | -0.9996 -0.9932 |  0.9941  0.9697
optical_flow |  0.0001  0.0000 |  0.0273  0.0269 | -0.9670 -1.4080 |  1.5913  1.1856
v_err    | -0.0090 |  0.0561 | -0.5223 |  0.1519
landing_rewards |    8.68 |    3.39 |    0.00 |   10.00
landing_margin |    2.98 |   52.76 |   -0.08 |  930.49
tracking_rewards |  -26.51 |    5.77 |  -59.86 |  -11.03
steps    |     375 |  

w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.09   -0.05   -0.05 |    0.09    0.07    0.08
a_f      |    0.03    0.01 |    0.66    1.88 |   -1.33   -3.14 |    1.49    3.14
w_f      |    0.00    0.00   -0.00 |    0.02    0.01    0.01 |   -0.04   -0.04   -0.02 |    0.05    0.03    0.02
w_rewards |   -0.47 |    0.39 |   -2.35 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.29 |    0.30 |    0.00 |    3.10
seeker_angles |    0.01    0.00 |    0.09    0.09 |   -0.99   -0.99 |    0.99    0.98
cs_angles |  0.0059  0.0013 |  0.0947  0.0876 | -0.9949 -0.9950 |  0.9923  0.9781
optical_flow |  0.0001  0.0001 |  0.0284  0.0270 | -1.1384 -1.1194 |  1.2689  1.1329
v_err    | -0.0088 |  0.0553 | -0.4526 |  0.1391
landing_rewards |    8.81 |    3.24 |    0.00 |   10.00
landing_margin |   -0.02 |    0.02 |   -0.06 |    0.07
tracking_rewards |  -26.43 |    5.37 |  -48.64 |  -15.21
steps    |     375 |  

thrust   |   -0.01   -0.00   -0.00 |    0.71    0.71    0.70 |   -3.41   -3.46   -3.45 |    3.46    3.44    3.43
norm_thrust |    0.95 |    0.76 |    0.00 |    3.46
fuel     |    1.68 |    0.22 |    1.25 |    2.83
rewards  |  -23.24 |    7.17 |  -54.30 |  -11.53
fuel_rewards |   -4.80 |    0.63 |   -8.09 |   -3.56
glideslope_rewards |    0.00 |    0.00 |    0.00 |    0.00
glideslope_penalty |    0.00 |    0.00 |    0.00 |    0.00
glideslope |    2.84 |   12.45 |    0.01 |  195.45
norm_af  |    1.79 |    0.92 |    0.09 |    3.37
norm_wf  |    0.02 |    0.01 |    0.00 |    0.05
rh_penalty |    0.00 |    0.00 |    0.00 |    0.00
att_rewards |    0.00 |    0.00 |    0.00 |    0.00
att_penalty |    0.00 |    0.00 |    0.00 |    0.00
attitude |    0.02    0.03    0.04 |    1.27    0.66    1.91 |   -3.14   -1.57   -3.14 |    3.14    1.56    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.08   -0.05   -0.05 |    0.08    0.08    0.08
a_f      |    0.04    0.02 |    0.65

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.0835   1.0624   4.9584  23.6511  13.7419   8.1346
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0013   0.0007   0.0025   6.6368   2.2852   2.4929
Update Cnt = 1350    ET =    991.5   Stats:  Mean, Std, Min, Max
r_f      |   -0.95   -3.38   13.07 |  184.97  172.17  197.97 | -389.40 -384.77 -372.95 |  380.98  396.71  385.44
v_f      |    0.00   -0.00   -0.00 |    0.05    0.04    0.05 |   -0.11   -0.11   -0.12 |    0.14    0.11    0.11
r_i      |   -4.36  -16.51   68.93 |  682.98  649.10  766.23 |-1280.96-1253.15-1298.06 | 1374.01 1252.02 1313.78
v_i      |   -0.00    0.00   -0.01 |    0.04    0.04    0.05 |   -0.09   -0.09   -0.10 |    0.09    0.09    0.10
norm_rf  |    0.32 |    0.12 |    0.05 |    0.69
norm_vf  |    0.08 |    0.02 |    0.04 |    0.15
gs_f     |    1.50 |    2.38 |    0.01 |   19.28
thrust   |    0.00    0.00   -0.01 |    0.70    0.69    0.71 |   -3.46   -3.46   -3.46 |    3.46    3.41    3.46
norm_thrust |    

ADV1:  -0.002419238674141994 0.012339656993150195 0.04788308440240624 -0.09234561628067162
ADV2:  0.02545050976912746 0.9185362193527752 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.2357   1.0235   4.7547  23.6511  13.7419   8.1346
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0032   0.0018   0.0063   6.6368   2.2852   2.4929
***** Episode 42175, Mean R = -23.3  Std R = 6.0  Min R = -41.1
PolicyLoss: -0.0165
Policy_Beta: 0.114
Policy_Entropy: 0.127
Policy_KL: 0.00171
Policy_SD: 0.561
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 1.51e+07
VF_0_ExplainedVarNew: 0.971
VF_0_ExplainedVarOld: 0.968
VF_0_Loss : 0.00651


ADV1:  0.0010188271954454234 0.00981942070199049 0.062255835762682565 -0.08786584131322983
ADV2:  -0.001303987579713842 0.891095983399595 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.9499   0.8800   4.8382  23.6511  13.7419   8.1346
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0009   0.0005   0.0026   6.6368   2.2852   2.49

ADV1:  -0.0026912696293308214 0.012630497771538657 0.05200276811386697 -0.07897370713036483
ADV2:  0.02816686164019957 0.9107031972420997 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.0145   0.4197   2.1988  23.6511  13.7419   8.1346
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0035   0.0021   0.0068   6.6368   2.2852   2.4929
***** Episode 42454, Mean R = -25.6  Std R = 8.3  Min R = -46.8
PolicyLoss: -0.0179
Policy_Beta: 0.114
Policy_Entropy: 0.127
Policy_KL: 0.00146
Policy_SD: 0.581
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 1.52e+07
VF_0_ExplainedVarNew: 0.971
VF_0_ExplainedVarOld: 0.969
VF_0_Loss : 0.00483


ADV1:  0.001937737842041801 0.012105878609069922 0.1566802408543585 -0.17938531521829737
ADV2:  -0.006226971901017768 0.8457015965179135 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.6106   1.0287   5.4906  23.6511  13.7419   8.1346
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0017   0.0013   0.0048   6.6368   2.2852   2.49

ADV1:  0.0013883643204934452 0.010882271752676082 0.08123066386817107 -0.12923769897484888
ADV2:  0.006287736513629191 0.8583642937772333 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.6601   0.9469   4.0669  23.6511  13.7419   8.1346
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0025   0.0013   0.0050   6.6368   2.2852   2.4929
***** Episode 42733, Mean R = -21.8  Std R = 6.0  Min R = -39.9
PolicyLoss: -0.0182
Policy_Beta: 0.114
Policy_Entropy: 0.128
Policy_KL: 0.00171
Policy_SD: 0.56
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 1.53e+07
VF_0_ExplainedVarNew: 0.978
VF_0_ExplainedVarOld: 0.974
VF_0_Loss : 0.00349


ADV1:  -0.0002486022208083073 0.011420867164503974 0.06926702718167899 -0.10261045957191273
ADV2:  0.018951155272363497 0.8724053629691884 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.5021   0.8192   4.1636  23.6511  13.7419   8.1346
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0004   0.0002   0.0008   6.6368   2.2852   2.4

ADV1:  -0.002633371244322233 0.01252112336621293 0.07926213663244841 -0.14754958145761488
ADV2:  0.03145896830278216 0.8648432602374283 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.6673   0.9545   3.8459  23.6511  13.7419   8.1346
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0031   0.0016   0.0067   6.6368   2.2852   2.4929
***** Episode 43012, Mean R = -23.4  Std R = 8.9  Min R = -52.7
PolicyLoss: -0.0195
Policy_Beta: 0.114
Policy_Entropy: 0.129
Policy_KL: 0.00127
Policy_SD: 0.57
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 1.54e+07
VF_0_ExplainedVarNew: 0.971
VF_0_ExplainedVarOld: 0.967
VF_0_Loss : 0.00339


ADV1:  0.00017342620201314605 0.012060238189617049 0.07813622983878865 -0.07680770083110548
ADV2:  0.011405756280030648 0.897830829027846 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.0399   1.0479   4.6632  23.6511  13.7419   8.1346
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0006   0.0003   0.0013   6.6368   2.2852   2.4929

ADV1:  -0.0029509788513391215 0.011394449066059643 0.061158476079430035 -0.10345804208451043
ADV2:  0.036289225971501186 0.8807215031750404 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.5384   0.9560   5.1440  23.6511  13.7419   8.1346
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0038   0.0024   0.0078   6.6368   2.2852   2.4929
***** Episode 43291, Mean R = -22.3  Std R = 6.8  Min R = -37.6
PolicyLoss: -0.0199
Policy_Beta: 0.114
Policy_Entropy: 0.127
Policy_KL: 0.00141
Policy_SD: 0.565
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 1.56e+07
VF_0_ExplainedVarNew: 0.973
VF_0_ExplainedVarOld: 0.97
VF_0_Loss : 0.00475


ADV1:  0.00029421414437143207 0.013160179247843278 0.09604995140543149 -0.08704007440706335
ADV2:  0.00896085827204277 0.894655628453945 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.8875   1.3154   6.4682  23.6511  13.7419   8.1346
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0017   0.0009   0.0041   6.6368   2.2852   2.4

ADV1:  0.0021996394470031417 0.008637388124563071 0.050929984310048346 -0.05798515955289474
ADV2:  -0.00740118795074941 0.9077031286797652 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.6814   0.8023   4.0127  23.6511  13.7419   8.1346
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0031   0.0018   0.0057   6.6368   2.2852   2.4929
***** Episode 43570, Mean R = -22.1  Std R = 5.6  Min R = -34.2
PolicyLoss: -0.0141
Policy_Beta: 0.114
Policy_Entropy: 0.131
Policy_KL: 0.00142
Policy_SD: 0.56
Policy_lr_mult: 0.198
Steps: 1.18e+04
TotalSteps: 1.57e+07
VF_0_ExplainedVarNew: 0.985
VF_0_ExplainedVarOld: 0.984
VF_0_Loss : 0.00524


ADV1:  -0.0006818361608909478 0.011232372626619034 0.048725372842754064 -0.1687986978738545
ADV2:  0.02719556458595178 0.8294900745102393 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.4968   0.7720   3.8867  23.6511  13.7419   8.1346
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0019   0.0007   0.0038   6.6368   2.2852   2.4

ADV1:  0.0007928498295015185 0.012771725056423754 0.1184346458593018 -0.26432152460849456
ADV2:  0.013189624073034263 0.7733624749586818 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.8708   0.4055   2.0731  23.6511  13.7419   8.1346
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0009   0.0006   0.0025   6.6368   2.2852   2.4929
***** Episode 43849, Mean R = -23.1  Std R = 9.4  Min R = -55.6
PolicyLoss: -0.0215
Policy_Beta: 0.114
Policy_Entropy: 0.132
Policy_KL: 0.00142
Policy_SD: 0.553
Policy_lr_mult: 0.198
Steps: 1.18e+04
TotalSteps: 1.58e+07
VF_0_ExplainedVarNew: 0.978
VF_0_ExplainedVarOld: 0.97
VF_0_Loss : 0.00415


ADV1:  0.0022325326551006852 0.009069021561024257 0.05250641747176987 -0.11583598414607765
ADV2:  0.005205278394316874 0.8506366947705598 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.5332   0.7096   3.1548  23.6511  13.7419   8.1346
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0034   0.0014   0.0060   6.6368   2.2852   2.492

ADV1:  0.0014245014090641433 0.011915360683721322 0.06990451894621363 -0.12150785628668825
ADV2:  0.012146668584828234 0.8636274810938596 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.5719   0.8777   5.0302  23.6511  13.7419   8.1346
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0026   0.0012   0.0045   6.6368   2.2852   2.4929
***** Episode 44128, Mean R = -24.0  Std R = 7.8  Min R = -46.0
PolicyLoss: -0.0253
Policy_Beta: 0.114
Policy_Entropy: 0.131
Policy_KL: 0.00172
Policy_SD: 0.563
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 1.59e+07
VF_0_ExplainedVarNew: 0.979
VF_0_ExplainedVarOld: 0.974
VF_0_Loss : 0.00424


ADV1:  0.0006188528183455851 0.01130143781597217 0.07569960866136921 -0.05917257624227382
ADV2:  0.0004085306415932513 0.9021066068433481 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.1873   0.5952   2.7182  23.6511  13.7419   8.1346
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0012   0.0009   0.0030   6.6368   2.2852   2.4

***** Episode 44376, Mean R = -24.5  Std R = 7.7  Min R = -46.2
PolicyLoss: -0.0227
Policy_Beta: 0.114
Policy_Entropy: 0.13
Policy_KL: 0.00113
Policy_SD: 0.569
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 1.6e+07
VF_0_ExplainedVarNew: 0.976
VF_0_ExplainedVarOld: 0.975
VF_0_Loss : 0.00721


ADV1:  0.001555521771901005 0.01006523471589612 0.1679969463976792 -0.08280834769036893
ADV2:  0.0012257170433286418 0.8281615384265743 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.9812   1.3250   6.2997  23.6511  13.7419   8.1346
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0019   0.0009   0.0042   6.6368   2.2852   2.4929
***** Episode 44407, Mean R = -22.1  Std R = 7.8  Min R = -45.6
PolicyLoss: -0.018
Policy_Beta: 0.114
Policy_Entropy: 0.13
Policy_KL: 0.00171
Policy_SD: 0.558
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 1.6e+07
VF_0_ExplainedVarNew: 0.985
VF_0_ExplainedVarOld: 0.981
VF_0_Loss : 0.00531


ADV1:  1.678540645863806e-05 0.01086189016885056 0.0874329

optical_flow | -0.0001  0.0000 |  0.0283  0.0274 | -1.1814 -1.3597 |  1.1488  1.0655
v_err    | -0.0090 |  0.0548 | -0.4518 |  0.1520
landing_rewards |    9.13 |    2.82 |    0.00 |   10.00
landing_margin |   -0.02 |    0.02 |   -0.07 |    0.04
tracking_rewards |  -26.13 |    5.52 |  -48.18 |  -16.30
steps    |     376 |      20 |     334 |     424
***** Episode 44686, Mean R = -22.9  Std R = 6.2  Min R = -42.1
PolicyLoss: -0.0175
Policy_Beta: 0.114
Policy_Entropy: 0.131
Policy_KL: 0.00135
Policy_SD: 0.55
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 1.61e+07
VF_0_ExplainedVarNew: 0.976
VF_0_ExplainedVarOld: 0.974
VF_0_Loss : 0.00383


ADV1:  0.0004007030382116028 0.013456686766735193 0.04891727819676676 -0.25384822780584126
ADV2:  0.016643804145600113 0.8249168383420636 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.4930   1.8167   8.6680  23.6511  13.7419   8.1346
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0012   0.0007   0.0025   6.6368   2.2852   2.4929

attitude |    0.06   -0.03   -0.01 |    1.11    0.66    1.77 |   -3.14   -1.56   -3.14 |    3.14    1.56    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.10   -0.05   -0.05 |    0.08    0.08    0.08
a_f      |   -0.03   -0.04 |    0.66    1.77 |   -1.44   -3.13 |    1.51    3.08
w_f      |    0.00   -0.00   -0.00 |    0.02    0.01    0.01 |   -0.04   -0.02   -0.03 |    0.05    0.04    0.02
w_rewards |   -0.50 |    0.39 |   -2.41 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.29 |    0.30 |    0.00 |    2.93
seeker_angles |    0.00    0.00 |    0.09    0.09 |   -0.99   -0.98 |    1.00    1.00
cs_angles |  0.0012  0.0011 |  0.0947  0.0879 | -0.9934 -0.9778 |  0.9973  0.9962
optical_flow | -0.0000  0.0001 |  0.0269  0.0266 | -1.3265 -1.0585 |  1.1685  1.2025
v_err    | -0.0090 |  0.0552 | -0.4522 |  0.1581
landing_rewards |    9.10 |    2.87 |    0.00 |   10.00
landing_margin |   -0

w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.09   -0.05   -0.05 |    0.08    0.08    0.08
a_f      |    0.01   -0.06 |    0.63    1.84 |   -1.47   -3.14 |    1.43    3.14
w_f      |    0.00    0.00   -0.00 |    0.02    0.01    0.01 |   -0.03   -0.03   -0.02 |    0.04    0.03    0.02
w_rewards |   -0.48 |    0.38 |   -2.97 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.29 |    0.30 |    0.00 |    3.00
seeker_angles |    0.00    0.00 |    0.09    0.09 |   -1.00   -0.99 |    0.99    0.99
cs_angles |  0.0034  0.0034 |  0.0910  0.0856 | -0.9976 -0.9930 |  0.9895  0.9909
optical_flow |  0.0001  0.0001 |  0.0263  0.0257 | -1.2410 -1.0072 |  1.3433  1.1000
v_err    | -0.0090 |  0.0561 | -0.4999 |  0.1330
landing_rewards |    8.87 |    3.16 |    0.00 |   10.00
landing_margin |   -0.02 |    0.02 |   -0.07 |    0.03
tracking_rewards |  -25.86 |    5.34 |  -48.20 |  -16.08
steps    |     377 |  

attitude |    0.04   -0.01    0.09 |    1.19    0.67    1.82 |   -3.14   -1.56   -3.14 |    3.14    1.57    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.08   -0.05   -0.05 |    0.09    0.07    0.08
a_f      |   -0.00    0.09 |    0.65    1.84 |   -1.51   -3.11 |    1.43    3.14
w_f      |    0.00   -0.00    0.00 |    0.02    0.01    0.01 |   -0.03   -0.02   -0.02 |    0.05    0.03    0.02
w_rewards |   -0.49 |    0.35 |   -2.66 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.29 |    0.30 |    0.00 |    2.90
seeker_angles |    0.00    0.01 |    0.09    0.09 |   -0.99   -1.00 |    1.00    1.00
cs_angles |  0.0016  0.0056 |  0.0901  0.0908 | -0.9891 -0.9950 |  0.9960  0.9975
optical_flow | -0.0001  0.0001 |  0.0274  0.0280 | -1.2596 -1.2611 |  1.1051  1.3114
v_err    | -0.0089 |  0.0560 | -0.4529 |  0.1260
landing_rewards |    9.26 |    2.62 |    0.00 |   10.00
landing_margin |   -0

attitude |   -0.00   -0.08    0.12 |    1.20    0.64    1.83 |   -3.14   -1.57   -3.14 |    3.14    1.55    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.08   -0.05   -0.06 |    0.09    0.07    0.08
a_f      |   -0.09    0.08 |    0.63    1.84 |   -1.48   -3.13 |    1.38    3.11
w_f      |    0.00   -0.00    0.00 |    0.02    0.01    0.01 |   -0.03   -0.02   -0.02 |    0.04    0.02    0.02
w_rewards |   -0.47 |    0.34 |   -1.84 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.29 |    0.30 |    0.00 |    3.04
seeker_angles |    0.00    0.00 |    0.09    0.09 |   -1.00   -1.00 |    1.00    1.00
cs_angles |  0.0019  0.0035 |  0.0909  0.0900 | -0.9958 -1.0000 |  0.9959  0.9999
optical_flow | -0.0000  0.0001 |  0.0289  0.0274 | -1.0564 -1.1797 |  1.2382  1.1497
v_err    | -0.0080 |  0.0556 | -0.4685 |  0.1284
landing_rewards |    9.16 |    2.77 |    0.00 |   10.00
landing_margin |   -0

w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.09   -0.07   -0.05 |    0.09    0.08    0.07
a_f      |    0.03   -0.07 |    0.64    1.80 |   -1.48   -3.14 |    1.48    3.11
w_f      |    0.00   -0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.02 |    0.04    0.03    0.02
w_rewards |   -0.45 |    0.37 |   -2.05 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.29 |    0.30 |    0.00 |    3.02
seeker_angles |    0.00    0.00 |    0.09    0.09 |   -1.00   -0.99 |    0.99    0.98
cs_angles |  0.0045  0.0016 |  0.0884  0.0891 | -0.9983 -0.9897 |  0.9885  0.9766
optical_flow | -0.0001  0.0001 |  0.0271  0.0267 | -0.9677 -1.0363 |  1.4137  1.1437
v_err    | -0.0082 |  0.0558 | -0.4535 |  0.1603
landing_rewards |    9.06 |    2.91 |    0.00 |   10.00
landing_margin |   -0.02 |    0.02 |   -0.08 |    0.07
tracking_rewards |  -25.63 |    5.41 |  -54.42 |  -15.84
steps    |     374 |  

attitude |   -0.13   -0.02    0.14 |    1.27    0.64    1.91 |   -3.14   -1.53   -3.14 |    3.14    1.53    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.10   -0.05   -0.05 |    0.08    0.08    0.08
a_f      |   -0.03    0.15 |    0.64    1.94 |   -1.41   -3.14 |    1.32    3.14
w_f      |    0.00    0.00   -0.00 |    0.02    0.01    0.01 |   -0.10   -0.02   -0.04 |    0.04    0.02    0.02
w_rewards |   -0.50 |    0.43 |   -2.85 |    0.00
w_penalty |   -0.32 |    5.67 | -100.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.29 |    0.30 |    0.00 |    2.99
seeker_angles |    0.00    0.00 |    0.09    0.09 |   -1.00   -0.97 |    0.99    1.00
cs_angles |  0.0010  0.0006 |  0.0934  0.0890 | -0.9999 -0.9679 |  0.9942  0.9969
optical_flow |  0.0000  0.0001 |  0.0283  0.0261 | -1.3794 -1.3277 |  1.5507  1.0483
v_err    | -0.0091 |  0.0567 | -0.4701 |  0.1183
landing_rewards |    9.16 |    2.77 |    0.00 |   10.00
landing_margin |    3

attitude |   -0.04   -0.07   -0.03 |    1.30    0.68    1.89 |   -3.14   -1.56   -3.14 |    3.14    1.57    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.09   -0.05   -0.05 |    0.08    0.09    0.08
a_f      |   -0.08   -0.08 |    0.68    1.86 |   -1.50   -3.14 |    1.51    3.11
w_f      |    0.00    0.00   -0.00 |    0.02    0.01    0.01 |   -0.04   -0.02   -0.03 |    0.04    0.02    0.02
w_rewards |   -0.44 |    0.36 |   -2.39 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.29 |    0.30 |    0.00 |    2.96
seeker_angles |    0.00   -0.00 |    0.09    0.09 |   -1.00   -0.99 |    1.00    1.00
cs_angles |  0.0014 -0.0016 |  0.0916  0.0903 | -0.9967 -0.9862 |  0.9969  0.9995
optical_flow | -0.0000  0.0000 |  0.0281  0.0265 | -1.2372 -1.3961 |  1.4268  1.1004
v_err    | -0.0090 |  0.0559 | -0.4550 |  0.1330
landing_rewards |    9.03 |    2.96 |    0.00 |   10.00
landing_margin |   -0

w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.10   -0.05   -0.05 |    0.07    0.08    0.07
a_f      |    0.03   -0.07 |    0.64    1.82 |   -1.40   -3.14 |    1.41    3.13
w_f      |    0.00   -0.00   -0.00 |    0.02    0.01    0.01 |   -0.10   -0.02   -0.02 |    0.05    0.02    0.02
w_rewards |   -0.45 |    0.33 |   -1.82 |    0.00
w_penalty |   -0.32 |    5.67 | -100.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.29 |    0.31 |    0.00 |    2.96
seeker_angles |   -0.00    0.00 |    0.09    0.09 |   -0.99   -1.00 |    0.98    0.99
cs_angles | -0.0006  0.0046 |  0.0922  0.0893 | -0.9869 -0.9998 |  0.9822  0.9937
optical_flow | -0.0000  0.0001 |  0.0273  0.0267 | -1.0782 -1.2399 |  1.1365  0.9884
v_err    | -0.0088 |  0.0551 | -0.4524 |  0.1260
landing_rewards |    9.16 |    2.77 |    0.00 |   10.00
landing_margin |    2.95 |   52.17 |   -0.08 |  920.04
tracking_rewards |  -25.55 |    5.07 |  -50.85 |  -11.40
steps    |     373 |  

attitude |    0.05    0.03    0.05 |    1.18    0.65    1.85 |   -3.14   -1.56   -3.14 |    3.14    1.53    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.09   -0.05   -0.05 |    0.07    0.08    0.08
a_f      |    0.04    0.07 |    0.66    1.84 |   -1.52   -3.14 |    1.47    3.14
w_f      |    0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.03 |    0.04    0.03    0.02
w_rewards |   -0.47 |    0.36 |   -2.66 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.28 |    0.30 |    0.00 |    2.98
seeker_angles |    0.00    0.00 |    0.09    0.09 |   -0.98   -1.00 |    0.99    0.99
cs_angles |  0.0008  0.0029 |  0.0904  0.0876 | -0.9798 -0.9994 |  0.9887  0.9923
optical_flow |  0.0000  0.0001 |  0.0276  0.0269 | -1.3706 -1.1471 |  1.3191  1.1640
v_err    | -0.0088 |  0.0554 | -0.4527 |  0.1621
landing_rewards |    8.94 |    3.08 |    0.00 |   10.00
landing_margin |   -0

attitude |   -0.01   -0.02    0.06 |    1.18    0.63    1.84 |   -3.14   -1.55   -3.14 |    3.14    1.57    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.10   -0.05   -0.06 |    0.07    0.08    0.08
a_f      |   -0.04    0.03 |    0.64    1.83 |   -1.42   -3.14 |    1.51    3.14
w_f      |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.02 |    0.04    0.03    0.02
w_rewards |   -0.46 |    0.35 |   -2.35 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.28 |    0.30 |    0.00 |    3.00
seeker_angles |    0.00    0.00 |    0.09    0.09 |   -0.99   -0.99 |    1.00    0.99
cs_angles |  0.0008  0.0017 |  0.0883  0.0882 | -0.9893 -0.9938 |  0.9982  0.9911
optical_flow | -0.0000 -0.0001 |  0.0283  0.0259 | -1.2202 -1.1944 |  1.1738  1.1250
v_err    | -0.0094 |  0.0552 | -0.4521 |  0.1224
landing_rewards |    8.81 |    3.24 |    0.00 |   10.00
landing_margin |   -0

attitude |    0.02   -0.06    0.10 |    1.36    0.69    1.90 |   -3.14   -1.56   -3.14 |    3.14    1.56    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.09   -0.05   -0.05 |    0.07    0.07    0.08
a_f      |   -0.06    0.13 |    0.68    1.89 |   -1.46   -3.12 |    1.43    3.12
w_f      |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.03   -0.03   -0.02 |    0.05    0.03    0.03
w_rewards |   -0.51 |    0.36 |   -1.69 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.30 |    0.31 |    0.00 |    3.03
seeker_angles |    0.00   -0.00 |    0.10    0.09 |   -0.99   -1.00 |    0.99    0.99
cs_angles |  0.0008 -0.0008 |  0.0968  0.0902 | -0.9924 -0.9956 |  0.9877  0.9861
optical_flow | -0.0000 -0.0000 |  0.0282  0.0269 | -1.3411 -1.1696 |  1.1592  1.1443
v_err    | -0.0094 |  0.0557 | -0.4522 |  0.1257
landing_rewards |    8.94 |    3.08 |    0.00 |   10.00
landing_margin |   -0

norm_thrust |    0.92 |    0.76 |    0.00 |    3.46
fuel     |    1.63 |    0.19 |    1.15 |    2.39
rewards  |  -20.96 |    6.19 |  -47.14 |  -10.45
fuel_rewards |   -4.66 |    0.55 |   -6.84 |   -3.28
glideslope_rewards |    0.00 |    0.00 |    0.00 |    0.00
glideslope_penalty |    0.00 |    0.00 |    0.00 |    0.00
glideslope |    3.03 |   12.97 |    0.01 |  495.98
norm_af  |    1.75 |    0.90 |    0.10 |    3.24
norm_wf  |    0.02 |    0.01 |    0.00 |    0.04
rh_penalty |    0.00 |    0.00 |    0.00 |    0.00
att_rewards |    0.00 |    0.00 |    0.00 |    0.00
att_penalty |    0.00 |    0.00 |    0.00 |    0.00
attitude |   -0.07    0.03    0.04 |    1.21    0.66    1.87 |   -3.14   -1.56   -3.14 |    3.14    1.56    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.08   -0.05   -0.05 |    0.07    0.07    0.08
a_f      |    0.01    0.01 |    0.66    1.85 |   -1.44   -3.14 |    1.53    3.13
w_f      |    0.00    0.00    0.00 |    0.02    0.01    0.01 |   -0.

ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0005   0.0003   0.0010   6.6368   2.2852   2.4929
Update Cnt = 1570    ET =    914.0   Stats:  Mean, Std, Min, Max
r_f      |    1.72    1.20  -10.72 |  199.96  166.61  198.78 | -388.86 -384.80 -391.90 |  384.64  397.92  393.25
v_f      |   -0.00    0.00    0.00 |    0.04    0.04    0.05 |   -0.11   -0.12   -0.10 |    0.10    0.11    0.10
r_i      |   12.01  -23.17  -51.80 |  713.14  648.54  758.80 |-1308.12-1176.55-1299.20 | 1364.11 1337.97 1306.00
v_i      |   -0.00    0.00    0.00 |    0.04    0.04    0.05 |   -0.09   -0.10   -0.09 |    0.10    0.10    0.10
norm_rf  |    0.29 |    0.11 |    0.05 |    0.67
norm_vf  |    0.08 |    0.02 |    0.03 |    0.15
gs_f     |    1.33 |    2.11 |    0.02 |   18.31
thrust   |   -0.01    0.00    0.00 |    0.69    0.70    0.70 |   -3.46   -3.44   -3.45 |    3.46    3.45    3.45
norm_thrust |    0.93 |    0.76 |    0.00 |    3.46
fuel     |    1.63 |    0.22 |    1.19 |    2.55
rewards  |  -21.48 

ADV1:  0.0020578377422329993 0.012363166784836378 0.13060109037738088 -0.10791759133338924
ADV2:  0.0010682485386171617 0.851211956385959 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.2498   1.8013   8.8813  23.6511  13.7419   8.1346
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0032   0.0016   0.0055   6.6368   2.2852   2.4929
***** Episode 48995, Mean R = -20.4  Std R = 7.1  Min R = -37.1
PolicyLoss: -0.0164
Policy_Beta: 0.114
Policy_Entropy: 0.134
Policy_KL: 0.00098
Policy_SD: 0.561
Policy_lr_mult: 0.198
Steps: 1.15e+04
TotalSteps: 1.77e+07
VF_0_ExplainedVarNew: 0.973
VF_0_ExplainedVarOld: 0.967
VF_0_Loss : 0.00785


Dynamics: Max Disturbance (m/s^2):  [0.00126622 0.00130788 0.00159816] 0.002422386686932909
ADV1:  0.0019625493810745917 0.009029635221900714 0.13752622959345118 -0.06546804479624507
ADV2:  -0.01903486257093025 0.8536471118639479 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.2178   0.4711   2.4843  23.6511  13.7419   8.1346
ValFun 

ADV1:  -0.0011750402617706473 0.010667282848506909 0.08364122584110989 -0.07827223021632403
ADV2:  0.027509699666558335 0.8447143437471601 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.9695   1.5562   6.2722  23.6511  13.7419   8.1346
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0023   0.0013   0.0043   6.6368   2.2852   2.4929
***** Episode 49274, Mean R = -21.0  Std R = 5.6  Min R = -38.4
PolicyLoss: -0.0232
Policy_Beta: 0.0759
Policy_Entropy: 0.132
Policy_KL: 0.000991
Policy_SD: 0.569
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 1.78e+07
VF_0_ExplainedVarNew: 0.977
VF_0_ExplainedVarOld: 0.975
VF_0_Loss : 0.0193


Dynamics: Max Disturbance (m/s^2):  [0.00126622 0.00130788 0.00159816] 0.002422386686932909
ADV1:  -0.0026344260084547075 0.011953200932569153 0.049122358597611826 -0.1227489213482107
ADV2:  0.03139249322879615 0.8984784753402643 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   8.6469   3.8626  15.1945  23.6511  13.7419   8.1346
ValFu

***** Episode 49522, Mean R = -21.1  Std R = 6.2  Min R = -35.7
PolicyLoss: -0.0249
Policy_Beta: 0.0759
Policy_Entropy: 0.132
Policy_KL: 0.000727
Policy_SD: 0.568
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 1.79e+07
VF_0_ExplainedVarNew: 0.967
VF_0_ExplainedVarOld: 0.959
VF_0_Loss : 0.00629


Dynamics: Max Disturbance (m/s^2):  [0.00126622 0.00130788 0.00159816] 0.002422386686932909
ADV1:  -0.0034839631927816553 0.01266516544893391 0.0970546673760837 -0.07236391680345274
ADV2:  0.02319327120037596 0.9129126530272037 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.1340   1.7842   6.9157  23.6511  13.7419   8.1346
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0040   0.0027   0.0090   6.6368   2.2852   2.4929
***** Episode 49553, Mean R = -23.8  Std R = 8.2  Min R = -45.7
PolicyLoss: -0.00902
Policy_Beta: 0.0759
Policy_Entropy: 0.131
Policy_KL: 0.000659
Policy_SD: 0.577
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 1.79e+07
VF_0_ExplainedVarNew: 0.974
VF_0_E

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.0102   0.4668   2.2440  23.6511  13.7419   8.1346
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0047   0.0020   0.0084   6.6368   2.2852   2.4929
***** Episode 49801, Mean R = -21.5  Std R = 7.4  Min R = -50.7
PolicyLoss: 0.00341
Policy_Beta: 0.114
Policy_Entropy: 0.13
Policy_KL: 0.00108
Policy_SD: 0.566
Policy_lr_mult: 0.198
Steps: 1.18e+04
TotalSteps: 1.8e+07
VF_0_ExplainedVarNew: 0.981
VF_0_ExplainedVarOld: 0.968
VF_0_Loss : 0.012


Dynamics: Max Disturbance (m/s^2):  [0.00126622 0.00130788 0.00159816] 0.002422386686932909
ADV1:  -0.0001700647253513474 0.012757864465569459 0.07330439482568712 -0.12569634078384267
ADV2:  0.020276604384209657 0.8575328252570884 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.4552   0.9701   4.7315  23.6511  13.7419   8.1346
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0003   0.0002   0.0007   6.6368   2.2852   2.4929
***** Episode 49832, Mean R = -22.7  Std R = 7.2  Min 

Dynamics: Max Disturbance (m/s^2):  [0.00126622 0.00130788 0.00159816] 0.002422386686932909
ADV1:  -0.002572160653587319 0.00876000422204164 0.04096886511693726 -0.07976060096684512
ADV2:  0.0400810456781753 0.88133896233232 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.4301   0.8761   4.5144  23.6511  13.7419   8.1346
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0046   0.0023   0.0081   6.6368   2.2852   2.4929
***** Episode 50080, Mean R = -20.2  Std R = 5.5  Min R = -32.8
PolicyLoss: -0.022
Policy_Beta: 0.0759
Policy_Entropy: 0.133
Policy_KL: 0.000718
Policy_SD: 0.564
Policy_lr_mult: 0.198
Steps: 1.18e+04
TotalSteps: 1.81e+07
VF_0_ExplainedVarNew: 0.983
VF_0_ExplainedVarOld: 0.981
VF_0_Loss : 0.0154


ADV1:  0.000605498828318651 0.00962252704233851 0.14930649557421477 -0.18919299531737765
ADV2:  0.007569851803232566 0.7971493557962258 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.3323   0.7349   3.1900  23.6511  13.7419   8.1346
ValFun  Gradie

***** Episode 50328, Mean R = -19.7  Std R = 5.6  Min R = -31.3
PolicyLoss: -0.0153
Policy_Beta: 0.0759
Policy_Entropy: 0.134
Policy_KL: 0.000647
Policy_SD: 0.563
Policy_lr_mult: 0.198
Steps: 1.15e+04
TotalSteps: 1.82e+07
VF_0_ExplainedVarNew: 0.981
VF_0_ExplainedVarOld: 0.979
VF_0_Loss : 0.0159


Dynamics: Max Disturbance (m/s^2):  [0.00126622 0.00130788 0.00159816] 0.002422386686932909
ADV1:  0.002841765102486615 0.0067548495167238255 0.0631436592457163 -0.040974128348007906
ADV2:  -0.03675751737450566 0.9015112795059392 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   5.6287   4.8024  15.2305  23.6511  13.7419   8.1346
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0038   0.0022   0.0072   6.6368   2.2852   2.4929
***** Episode 50359, Mean R = -19.4  Std R = 6.0  Min R = -39.1
PolicyLoss: 0.00207
Policy_Beta: 0.0759
Policy_Entropy: 0.133
Policy_KL: 0.00115
Policy_SD: 0.574
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 1.82e+07
VF_0_ExplainedVarNew: 0.991
VF_0_Ex

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.0443   1.1552   6.2068  23.6511  13.7419   8.1346
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0019   0.0011   0.0040   6.6368   2.2852   2.4929
***** Episode 50607, Mean R = -21.5  Std R = 7.7  Min R = -40.9
PolicyLoss: -0.0108
Policy_Beta: 0.114
Policy_Entropy: 0.133
Policy_KL: 0.00143
Policy_SD: 0.57
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 1.83e+07
VF_0_ExplainedVarNew: 0.973
VF_0_ExplainedVarOld: 0.964
VF_0_Loss : 0.00319


Dynamics: Max Disturbance (m/s^2):  [0.00126622 0.00130788 0.00159816] 0.002422386686932909
ADV1:  0.0008270833092464217 0.011015850897660223 0.06784433277335977 -0.15619819417813163
ADV2:  0.00825517954384338 0.8297894494361261 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.8235   0.8429   4.2383  23.6511  13.7419   8.1346
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0015   0.0008   0.0031   6.6368   2.2852   2.4929
***** Episode 50638, Mean R = -21.0  Std R = 7.6  Min

cs_angles |  0.0019  0.0055 |  0.0892  0.0859 | -0.9959 -0.9884 |  0.9908  0.9375
optical_flow | -0.0001 -0.0001 |  0.0267  0.0254 | -1.2725 -1.0389 |  1.1993  0.9921
v_err    | -0.0085 |  0.0549 | -0.4587 |  0.1212
landing_rewards |    9.29 |    2.57 |    0.00 |   10.00
landing_margin |   -0.02 |    0.02 |   -0.06 |    0.04
tracking_rewards |  -25.00 |    5.18 |  -45.49 |  -15.11
steps    |     377 |      21 |     333 |     419
***** Episode 50886, Mean R = -19.3  Std R = 5.2  Min R = -36.8
PolicyLoss: -0.0145
Policy_Beta: 0.0759
Policy_Entropy: 0.134
Policy_KL: 0.000592
Policy_SD: 0.553
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 1.84e+07
VF_0_ExplainedVarNew: 0.985
VF_0_ExplainedVarOld: 0.98
VF_0_Loss : 0.0087


ADV1:  -0.002120306994363544 0.012564467372551132 0.3373148408088424 -0.08256178230687243
ADV2:  0.011538916332231298 0.7449227537083376 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.7974   0.9394   3.7968  23.6511  13.7419   8.3767
ValFun  Gradients: u

w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.10   -0.05   -0.05 |    0.09    0.07    0.07
a_f      |    0.01    0.05 |    0.67    1.80 |   -1.42   -3.14 |    1.39    3.14
w_f      |    0.00   -0.00    0.00 |    0.02    0.01    0.01 |   -0.04   -0.03   -0.02 |    0.04    0.02    0.03
w_rewards |   -0.46 |    0.40 |   -3.44 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.29 |    0.31 |    0.00 |    3.00
seeker_angles |    0.00    0.00 |    0.09    0.08 |   -0.98   -0.97 |    0.99    0.97
cs_angles |  0.0037  0.0022 |  0.0885  0.0848 | -0.9805 -0.9670 |  0.9882  0.9684
optical_flow |  0.0000  0.0002 |  0.0261  0.0263 | -1.0185 -0.9558 |  1.1385  1.3568
v_err    | -0.0088 |  0.0547 | -0.4531 |  0.1745
landing_rewards |    9.13 |    2.82 |    0.00 |   10.00
landing_margin |   -0.02 |    0.02 |   -0.07 |    0.02
tracking_rewards |  -24.73 |    5.32 |  -45.09 |  -16.07
steps    |     377 |  

w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.10   -0.05   -0.05 |    0.09    0.07    0.08
a_f      |    0.03    0.09 |    0.70    1.87 |   -1.47   -3.13 |    1.54    3.13
w_f      |    0.00   -0.00   -0.00 |    0.02    0.01    0.01 |   -0.10   -0.02   -0.04 |    0.04    0.02    0.03
w_rewards |   -0.48 |    0.39 |   -2.69 |    0.00
w_penalty |   -0.32 |    5.67 | -100.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.29 |    0.31 |    0.00 |    2.93
seeker_angles |    0.00   -0.00 |    0.09    0.09 |   -0.98   -1.00 |    1.00    0.98
cs_angles |  0.0023 -0.0004 |  0.0904  0.0870 | -0.9809 -0.9971 |  0.9999  0.9844
optical_flow | -0.0000  0.0001 |  0.0266  0.0260 | -1.0467 -1.2459 |  1.0579  1.0062
v_err    | -0.0092 |  0.0552 | -0.4531 |  0.1132
landing_rewards |    9.16 |    2.77 |    0.00 |   10.00
landing_margin |    3.21 |   56.84 |   -0.08 | 1002.35
tracking_rewards |  -25.19 |    5.24 |  -48.65 |   -8.83
steps    |     376 |  

w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.09   -0.05   -0.07 |    0.08    0.08    0.07
a_f      |   -0.00    0.09 |    0.69    1.77 |   -1.37   -3.14 |    1.53    3.14
w_f      |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.02 |    0.04    0.02    0.02
w_rewards |   -0.47 |    0.39 |   -3.38 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.29 |    0.31 |    0.00 |    3.07
seeker_angles |    0.00   -0.00 |    0.09    0.09 |   -1.00   -0.97 |    0.98    0.99
cs_angles |  0.0022 -0.0004 |  0.0898  0.0898 | -0.9985 -0.9664 |  0.9847  0.9863
optical_flow |  0.0001  0.0002 |  0.0271  0.0269 | -1.0153 -1.2299 |  1.2913  1.2901
v_err    | -0.0086 |  0.0555 | -0.4619 |  0.1803
landing_rewards |    9.26 |    2.62 |    0.00 |   10.00
landing_margin |   -0.02 |    0.02 |   -0.07 |    0.05
tracking_rewards |  -25.26 |    5.77 |  -66.05 |  -16.14
steps    |     375 |  

thrust   |   -0.00   -0.01    0.00 |    0.71    0.72    0.72 |   -3.43   -3.46   -3.45 |    3.46    3.44    3.43
norm_thrust |    0.97 |    0.77 |    0.00 |    3.46
fuel     |    1.71 |    0.22 |    1.13 |    2.65
rewards  |  -21.44 |    6.85 |  -58.69 |   -9.30
fuel_rewards |   -4.89 |    0.64 |   -7.59 |   -3.25
glideslope_rewards |    0.00 |    0.00 |    0.00 |    0.00
glideslope_penalty |    0.00 |    0.00 |    0.00 |    0.00
glideslope |    2.91 |   12.39 |    0.01 |  170.60
norm_af  |    1.68 |    0.93 |    0.07 |    3.26
norm_wf  |    0.02 |    0.01 |    0.00 |    0.05
rh_penalty |    0.00 |    0.00 |    0.00 |    0.00
att_rewards |    0.00 |    0.00 |    0.00 |    0.00
att_penalty |    0.00 |    0.00 |    0.00 |    0.00
attitude |    0.06    0.01    0.10 |    1.17    0.63    1.80 |   -3.14   -1.57   -3.14 |    3.14    1.54    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.08   -0.05   -0.06 |    0.08    0.08    0.08
a_f      |    0.02    0.20 |    0.63

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.2340   0.4781   2.3612  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0010   0.0005   0.0026   6.6368   2.2852   2.4929
Update Cnt = 1690    ET =    961.8   Stats:  Mean, Std, Min, Max
r_f      |  -31.35    1.80   20.23 |  186.47  168.75  202.46 | -383.89 -388.46 -392.39 |  393.39  398.66  379.11
v_f      |    0.01    0.00   -0.00 |    0.04    0.04    0.05 |   -0.10   -0.10   -0.11 |    0.11    0.10    0.12
r_i      | -116.55    4.41   56.23 |  697.04  632.04  772.91 |-1357.06-1335.18-1288.13 | 1210.94 1328.66 1334.33
v_i      |    0.01    0.00   -0.00 |    0.04    0.04    0.05 |   -0.10   -0.10   -0.09 |    0.09    0.09    0.09
norm_rf  |    0.27 |    0.11 |    0.02 |    0.64
norm_vf  |    0.08 |    0.02 |    0.03 |    0.13
gs_f     |    1.44 |    2.75 |    0.01 |   37.85
thrust   |    0.00   -0.00    0.00 |    0.70    0.70    0.71 |   -3.45   -3.43   -3.45 |    3.46    3.45    3.46
norm_thrust |    

ADV1:  -0.0008781981246170573 0.017269733147015062 0.07126476683954153 -0.20308813887464222
ADV2:  0.05255924926907336 0.5936216979711673 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.0477   0.4934   2.8479  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0016   0.0009   0.0032   6.6368   2.2852   2.4929
***** Episode 52715, Mean R = -22.3  Std R = 12.0  Min R = -78.7
PolicyLoss: -0.0543
Policy_Beta: 0.114
Policy_Entropy: 0.139
Policy_KL: 0.000472
Policy_SD: 0.567
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 1.91e+07
VF_0_ExplainedVarNew: 0.985
VF_0_ExplainedVarOld: 0.953
VF_0_Loss : 0.00562


Dynamics: Max Disturbance (m/s^2):  [0.00126622 0.00130788 0.00159816] 0.002422386686932909
ADV1:  -0.0019627096657960034 0.008916496658956085 0.06199415414266096 -0.07813546291829021
ADV2:  0.018616108107916633 0.869327720847673 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.5872   0.7644   3.8077  23.6511  13.7419   8.3767
ValFu

***** Episode 52963, Mean R = -20.6  Std R = 5.9  Min R = -35.0
PolicyLoss: -0.00756
Policy_Beta: 0.114
Policy_Entropy: 0.138
Policy_KL: 0.00134
Policy_SD: 0.561
Policy_lr_mult: 0.198
Steps: 1.15e+04
TotalSteps: 1.92e+07
VF_0_ExplainedVarNew: 0.974
VF_0_ExplainedVarOld: 0.969
VF_0_Loss : 0.00558


ADV1:  0.001228226945200655 0.011610365330720716 0.058161704059100816 -0.24807737342220204
ADV2:  0.02179392915855684 0.6887185479267637 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.8884   0.3323   1.7338  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0017   0.0009   0.0039   6.6368   2.2852   2.4929
***** Episode 52994, Mean R = -21.9  Std R = 8.0  Min R = -43.1
PolicyLoss: -0.035
Policy_Beta: 0.114
Policy_Entropy: 0.137
Policy_KL: 0.00157
Policy_SD: 0.57
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 1.92e+07
VF_0_ExplainedVarNew: 0.986
VF_0_ExplainedVarOld: 0.977
VF_0_Loss : 0.00521


Dynamics: Max Disturbance (m/s^2):  [0.00126622 0.001

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.8491   0.7922   3.7363  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0038   0.0022   0.0078   6.6368   2.2852   2.4929
***** Episode 53242, Mean R = -20.6  Std R = 5.2  Min R = -34.4
PolicyLoss: -0.0219
Policy_Beta: 0.114
Policy_Entropy: 0.138
Policy_KL: 0.00149
Policy_SD: 0.572
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 1.93e+07
VF_0_ExplainedVarNew: 0.994
VF_0_ExplainedVarOld: 0.99
VF_0_Loss : 0.00517


ADV1:  -0.005333086887679073 0.011340958104275848 0.06737573289933912 -0.0709989440178912
ADV2:  0.03424880858012863 0.9387316371564185 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.6387   0.6635   3.4927  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0065   0.0038   0.0135   6.6368   2.2852   2.4929
***** Episode 53273, Mean R = -22.0  Std R = 7.8  Min R = -38.2
PolicyLoss: -0.00803
Policy_Beta: 0.114
Policy_Entropy: 0.138
Policy_KL: 0.00161
P

ADV1:  0.0015098691911973599 0.009035770630641173 0.0670480534428397 -0.05778108366815342
ADV2:  0.004121689614282559 0.8817316521008941 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.5310   1.4659   7.4292  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0024   0.0013   0.0044   6.6368   2.2852   2.4929
***** Episode 53521, Mean R = -20.4  Std R = 5.9  Min R = -36.8
PolicyLoss: -0.0207
Policy_Beta: 0.114
Policy_Entropy: 0.138
Policy_KL: 0.00105
Policy_SD: 0.56
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 1.94e+07
VF_0_ExplainedVarNew: 0.985
VF_0_ExplainedVarOld: 0.982
VF_0_Loss : 0.00433


Dynamics: Max Disturbance (m/s^2):  [0.00126622 0.00130788 0.00159816] 0.002422386686932909
ADV1:  -0.0025504926842144266 0.011614733139680856 0.07009525534366112 -0.07508965070982748
ADV2:  0.02479641565453473 0.914700056481605 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.0980   0.9348   4.3537  23.6511  13.7419   8.3767
ValFun  Gr

ADV1:  0.0015720632781724962 0.011915754938309701 0.28194897908587213 -0.08065489273090459
ADV2:  -0.012013037693968838 0.794419607578643 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.2300   0.6131   2.5375  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0015   0.0009   0.0038   6.6368   2.2852   2.4929
***** Episode 53800, Mean R = -21.0  Std R = 4.9  Min R = -32.4
PolicyLoss: 0.00174
Policy_Beta: 0.114
Policy_Entropy: 0.134
Policy_KL: 0.00127
Policy_SD: 0.569
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 1.95e+07
VF_0_ExplainedVarNew: 0.98
VF_0_ExplainedVarOld: 0.969
VF_0_Loss : 0.00411


Dynamics: Max Disturbance (m/s^2):  [0.00126622 0.00130788 0.00159816] 0.002422386686932909
ADV1:  0.0012949947884030937 0.014076315723795115 0.05596354520544816 -0.26042640351198654
ADV2:  0.02926059717018937 0.6257945685756403 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.6452   0.3534   1.7678  23.6511  13.7419   8.3767
ValFun  G

Dynamics: Max Disturbance (m/s^2):  [0.00126622 0.00130788 0.00159816] 0.002422386686932909
ADV1:  -0.0028589206772622103 0.010460171440344394 0.09131615667299442 -0.1300651344830937
ADV2:  0.03473520815604178 0.8604072542741547 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.2655   0.7799   4.1755  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0038   0.0022   0.0081   6.6368   2.2852   2.4929
***** Episode 54079, Mean R = -20.4  Std R = 5.6  Min R = -36.6
PolicyLoss: -0.0207
Policy_Beta: 0.114
Policy_Entropy: 0.139
Policy_KL: 0.00113
Policy_SD: 0.565
Policy_lr_mult: 0.198
Steps: 1.18e+04
TotalSteps: 1.96e+07
VF_0_ExplainedVarNew: 0.979
VF_0_ExplainedVarOld: 0.975
VF_0_Loss : 0.00136


ADV1:  0.003642301068119874 0.008942431349102222 0.045265289814879706 -0.05693234738956465
ADV2:  -0.0034624046957439044 0.8717647251792094 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.9000   1.6259   8.3888  23.6511  13.7419   8.3767
ValFun

Dynamics: Max Disturbance (m/s^2):  [0.00126622 0.00130788 0.00159816] 0.002422386686932909
ADV1:  -1.7541734934078157e-05 0.009483018900302497 0.09476058111260971 -0.08105173149940748
ADV2:  0.01704593704937105 0.859387864927259 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.4537   1.4603   7.6272  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0006   0.0003   0.0014   6.6368   2.2852   2.4929
***** Episode 54358, Mean R = -20.9  Std R = 6.0  Min R = -34.8
PolicyLoss: -0.0217
Policy_Beta: 0.114
Policy_Entropy: 0.137
Policy_KL: 0.00131
Policy_SD: 0.573
Policy_lr_mult: 0.198
Steps: 1.15e+04
TotalSteps: 1.97e+07
VF_0_ExplainedVarNew: 0.985
VF_0_ExplainedVarOld: 0.982
VF_0_Loss : 0.00209


ADV1:  -0.001548005259654691 0.01030222524184586 0.060219497801214494 -0.10312832792599991
ADV2:  0.02283908213024808 0.8946987694350477 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.9851   0.4848   2.5971  23.6511  13.7419   8.3767
ValFun  

***** Episode 54606, Mean R = -20.9  Std R = 7.4  Min R = -41.3
PolicyLoss: -0.00486
Policy_Beta: 0.114
Policy_Entropy: 0.138
Policy_KL: 0.00116
Policy_SD: 0.556
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 1.98e+07
VF_0_ExplainedVarNew: 0.979
VF_0_ExplainedVarOld: 0.973
VF_0_Loss : 0.00386


ADV1:  0.0005868087160448558 0.013166019384332832 0.10872210290285284 -0.15855629005263439
ADV2:  0.02056549761047064 0.7908472318465105 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.6238   0.7170   3.6379  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0011   0.0006   0.0023   6.6368   2.2852   2.4929
***** Episode 54637, Mean R = -19.5  Std R = 6.0  Min R = -34.1
PolicyLoss: -0.0286
Policy_Beta: 0.114
Policy_Entropy: 0.14
Policy_KL: 0.00108
Policy_SD: 0.546
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 1.98e+07
VF_0_ExplainedVarNew: 0.97
VF_0_ExplainedVarOld: 0.961
VF_0_Loss : 0.00398


ADV1:  -0.003703518146233362 0.06808703868946239 0.11

optical_flow | -0.0001  0.0001 |  0.0275  0.0257 | -1.3214 -1.3164 |  1.1549  1.1951
v_err    | -0.0087 |  0.0558 | -0.4549 |  0.4961
landing_rewards |    9.16 |    2.77 |    0.00 |   10.00
landing_margin |    4.54 |   61.33 |   -0.06 | 1000.48
tracking_rewards |  -25.20 |    5.85 |  -54.92 |   -8.79
steps    |     375 |      31 |      12 |     416
***** Episode 54916, Mean R = -20.4  Std R = 5.7  Min R = -33.4
PolicyLoss: -0.0167
Policy_Beta: 0.114
Policy_Entropy: 0.137
Policy_KL: 0.000933
Policy_SD: 0.567
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 1.99e+07
VF_0_ExplainedVarNew: 0.977
VF_0_ExplainedVarOld: 0.967
VF_0_Loss : 0.00357


ADV1:  -0.0011630837146741299 0.013164660479483527 0.13443600918693566 -0.17086959403717605
ADV2:  0.009632498793951748 0.8124045002234018 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.6491   0.9245   4.6626  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0018   0.0010   0.0040   6.6368   2.2852   2.4

attitude |   -0.01   -0.01    0.01 |    1.17    0.64    1.86 |   -3.14   -1.54   -3.14 |    3.14    1.56    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.09   -0.05   -0.05 |    0.09    0.07    0.07
a_f      |   -0.01    0.10 |    0.64    1.85 |   -1.42   -3.13 |    1.47    3.11
w_f      |    0.00   -0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.02 |    0.04    0.03    0.02
w_rewards |   -0.52 |    0.42 |   -3.35 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.29 |    0.31 |    0.00 |    3.07
seeker_angles |   -0.00    0.01 |    0.09    0.09 |   -0.99   -0.99 |    0.98    1.00
cs_angles | -0.0002  0.0056 |  0.0911  0.0875 | -0.9921 -0.9859 |  0.9832  0.9991
optical_flow |  0.0000  0.0000 |  0.0277  0.0264 | -1.2072 -1.0945 |  1.1389  0.9776
v_err    | -0.0087 |  0.0558 | -0.4535 |  0.1209
landing_rewards |    9.19 |    2.72 |    0.00 |   10.00
landing_margin |   -0

w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.08   -0.05   -0.05 |    0.09    0.08    0.07
a_f      |   -0.03   -0.07 |    0.66    1.92 |   -1.50   -3.13 |    1.46    3.12
w_f      |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.02   -0.02   -0.02 |    0.04    0.02    0.02
w_rewards |   -0.47 |    0.34 |   -1.84 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.29 |    0.31 |    0.00 |    3.02
seeker_angles |    0.00    0.00 |    0.09    0.09 |   -1.00   -1.00 |    1.00    0.99
cs_angles |  0.0019  0.0047 |  0.0898  0.0920 | -0.9986 -0.9987 |  0.9953  0.9907
optical_flow | -0.0000  0.0001 |  0.0281  0.0257 | -1.1561 -1.0809 |  1.4308  1.0762
v_err    | -0.0083 |  0.0544 | -0.4529 |  0.1542
landing_rewards |    9.32 |    2.51 |    0.00 |   10.00
landing_margin |   -0.02 |    0.02 |   -0.06 |    0.03
tracking_rewards |  -25.11 |    5.47 |  -53.27 |  -15.14
steps    |     376 |  

att_rewards |    0.00 |    0.00 |    0.00 |    0.00
att_penalty |    0.00 |    0.00 |    0.00 |    0.00
attitude |   -0.03    0.03    0.15 |    1.20    0.67    1.81 |   -3.14   -1.57   -3.14 |    3.14    1.56    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.09   -0.05   -0.05 |    0.07    0.08    0.08
a_f      |    0.03    0.07 |    0.67    1.81 |   -1.49   -3.14 |    1.41    3.14
w_f      |    0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.02   -0.02   -0.03 |    0.05    0.03    0.02
w_rewards |   -0.44 |    0.33 |   -1.88 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.29 |    0.31 |    0.00 |    3.03
seeker_angles |    0.00    0.01 |    0.09    0.09 |   -0.99   -0.95 |    1.00    0.97
cs_angles |  0.0007  0.0061 |  0.0893  0.0918 | -0.9905 -0.9511 |  0.9985  0.9745
optical_flow |  0.0000  0.0001 |  0.0269  0.0262 | -0.9752 -1.3196 |  1.1325  1.2476
v_err    | -0.0086 |  

w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.09   -0.05   -0.05 |    0.07    0.08    0.07
a_f      |   -0.04    0.09 |    0.66    1.86 |   -1.41   -3.14 |    1.50    3.08
w_f      |    0.00   -0.00   -0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.02 |    0.04    0.02    0.02
w_rewards |   -0.48 |    0.37 |   -2.90 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.28 |    0.30 |    0.00 |    3.05
seeker_angles |    0.00    0.00 |    0.09    0.09 |   -0.99   -0.99 |    1.00    0.98
cs_angles |  0.0027  0.0048 |  0.0925  0.0850 | -0.9932 -0.9916 |  0.9991  0.9816
optical_flow | -0.0001  0.0002 |  0.0289  0.0264 | -1.4790 -1.1949 |  1.5245  1.1529
v_err    | -0.0086 |  0.0554 | -0.4534 |  0.1442
landing_rewards |    9.45 |    2.28 |    0.00 |   10.00
landing_margin |   -0.02 |    0.02 |   -0.06 |    0.06
tracking_rewards |  -24.61 |    5.29 |  -51.61 |  -15.77
steps    |     372 |  

attitude |   -0.07   -0.07    0.10 |    1.18    0.66    1.82 |   -3.14   -1.57   -3.14 |    3.14    1.55    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.08   -0.05   -0.06 |    0.09    0.08    0.08
a_f      |   -0.07    0.11 |    0.66    1.83 |   -1.55   -3.11 |    1.44    3.13
w_f      |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.02 |    0.04    0.02    0.02
w_rewards |   -0.48 |    0.36 |   -2.64 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.29 |    0.31 |    0.00 |    2.85
seeker_angles |    0.00    0.01 |    0.09    0.09 |   -0.99   -0.94 |    0.99    1.00
cs_angles |  0.0000  0.0074 |  0.0912  0.0892 | -0.9850 -0.9402 |  0.9905  0.9996
optical_flow |  0.0001 -0.0000 |  0.0266  0.0260 | -1.1153 -1.1618 |  1.0972  1.2088
v_err    | -0.0083 |  0.0551 | -0.4740 |  0.1196
landing_rewards |    9.19 |    2.72 |    0.00 |   10.00
landing_margin |   -0

attitude |    0.06    0.03    0.04 |    1.20    0.65    1.82 |   -3.14   -1.55   -3.14 |    3.14    1.57    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.09   -0.08   -0.05 |    0.07    0.07    0.07
a_f      |    0.03   -0.03 |    0.65    1.82 |   -1.48   -3.13 |    1.39    3.13
w_f      |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.02   -0.02   -0.02 |    0.03    0.02    0.02
w_rewards |   -0.46 |    0.32 |   -1.62 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.28 |    0.30 |    0.00 |    3.12
seeker_angles |   -0.00    0.01 |    0.09    0.08 |   -1.00   -1.00 |    1.00    1.00
cs_angles | -0.0014  0.0083 |  0.0888  0.0831 | -0.9992 -0.9991 |  0.9966  0.9988
optical_flow |  0.0001 -0.0000 |  0.0271  0.0261 | -1.3039 -1.1810 |  1.1551  1.0661
v_err    | -0.0080 |  0.0550 | -0.4501 |  0.1281
landing_rewards |    9.06 |    2.91 |    0.00 |   10.00
landing_margin |   -0

thrust   |   -0.00    0.00   -0.00 |    0.70    0.69    0.70 |   -3.44   -3.45   -3.46 |    3.46    3.45    3.44
norm_thrust |    0.93 |    0.77 |    0.00 |    3.46
fuel     |    1.61 |    0.21 |    1.16 |    2.48
rewards  |  -20.84 |    6.76 |  -49.53 |   -9.14
fuel_rewards |   -4.61 |    0.60 |   -7.09 |   -3.32
glideslope_rewards |    0.00 |    0.00 |    0.00 |    0.00
glideslope_penalty |    0.00 |    0.00 |    0.00 |    0.00
glideslope |    2.85 |   12.32 |    0.01 |  201.56
norm_af  |    1.73 |    0.89 |    0.10 |    3.38
norm_wf  |    0.02 |    0.01 |    0.00 |    0.05
rh_penalty |    0.00 |    0.00 |    0.00 |    0.00
att_rewards |    0.00 |    0.00 |    0.00 |    0.00
att_penalty |    0.00 |    0.00 |    0.00 |    0.00
attitude |    0.08   -0.07   -0.04 |    1.19    0.64    1.85 |   -3.14   -1.56   -3.14 |    3.14    1.54    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.09   -0.05   -0.05 |    0.08    0.07    0.07
a_f      |   -0.07   -0.08 |    0.65

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.0169   0.5472   3.1108  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0044   0.0027   0.0095   6.6368   2.2852   2.4929
Update Cnt = 1850    ET =   1227.0   Stats:  Mean, Std, Min, Max
r_f      |    4.93  -14.42  -16.29 |  194.32  166.32  199.89 | -390.50 -392.64 -380.25 |  391.50  369.93  377.92
v_f      |    0.00   -0.00    0.00 |    0.05    0.04    0.05 |   -0.11   -0.10   -0.10 |    0.11    0.08    0.10
r_i      |    7.11  -43.27  -38.03 |  690.10  644.52  773.28 |-1312.21-1311.32-1310.21 | 1246.94 1331.34 1334.13
v_i      |   -0.00    0.00    0.00 |    0.04    0.04    0.05 |   -0.09   -0.09   -0.09 |    0.10    0.10    0.10
norm_rf  |    0.26 |    0.10 |    0.04 |    0.62
norm_vf  |    0.08 |    0.02 |    0.03 |    0.13
gs_f     |    1.28 |    2.20 |    0.02 |   22.30
thrust   |    0.00    0.01    0.00 |    0.70    0.69    0.69 |   -3.40   -3.46   -3.45 |    3.40    3.46    3.45
norm_thrust |    

ADV1:  0.0027437228997562344 0.008463932549553174 0.04947279230144405 -0.07058264236026535
ADV2:  -0.004418404133528185 0.8736128783808293 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   6.0936   4.5257  16.2392  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0030   0.0019   0.0071   6.6368   2.2852   2.4929
***** Episode 57675, Mean R = -18.4  Std R = 4.6  Min R = -30.8
PolicyLoss: -0.0224
Policy_Beta: 0.0759
Policy_Entropy: 0.14
Policy_KL: 0.00057
Policy_SD: 0.555
Policy_lr_mult: 0.198
Steps: 1.15e+04
TotalSteps: 2.1e+07
VF_0_ExplainedVarNew: 0.985
VF_0_ExplainedVarOld: 0.983
VF_0_Loss : 0.0036


ADV1:  0.00010566447416910204 0.01013561858174085 0.11395113183753808 -0.09054907658559508
ADV2:  0.0222296813844621 0.8354930022754053 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.7470   1.7156   7.8406  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0010   0.0006   0.0023   6.6368   2.2852   2.4929

***** Episode 57923, Mean R = -19.6  Std R = 4.5  Min R = -30.6
PolicyLoss: -0.0341
Policy_Beta: 0.114
Policy_Entropy: 0.142
Policy_KL: 0.00113
Policy_SD: 0.557
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 2.1e+07
VF_0_ExplainedVarNew: 0.986
VF_0_ExplainedVarOld: 0.982
VF_0_Loss : 0.00157


ADV1:  -0.0030501162067332697 0.012194368155629319 0.057281738755776856 -0.20360567204312752
ADV2:  0.04323651601734081 0.7773728131198983 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.4417   0.6357   3.0670  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0038   0.0024   0.0084   6.6368   2.2852   2.4929
***** Episode 57954, Mean R = -21.6  Std R = 7.3  Min R = -44.5
PolicyLoss: -0.0292
Policy_Beta: 0.114
Policy_Entropy: 0.14
Policy_KL: 0.00147
Policy_SD: 0.565
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 2.11e+07
VF_0_ExplainedVarNew: 0.977
VF_0_ExplainedVarOld: 0.972
VF_0_Loss : 0.00232


ADV1:  -0.0008511575343894309 0.020380950094666547 0

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.4281   0.6410   3.1770  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0010   0.0005   0.0021   6.6368   2.2852   2.4929
***** Episode 58202, Mean R = -19.5  Std R = 4.1  Min R = -27.5
PolicyLoss: -0.017
Policy_Beta: 0.114
Policy_Entropy: 0.146
Policy_KL: 0.00137
Policy_SD: 0.547
Policy_lr_mult: 0.198
Steps: 1.18e+04
TotalSteps: 2.12e+07
VF_0_ExplainedVarNew: 0.989
VF_0_ExplainedVarOld: 0.987
VF_0_Loss : 0.00358


ADV1:  -0.00034293931561548275 0.008889426395568993 0.03552656259599904 -0.07082916176023073
ADV2:  0.03307048802272142 0.8201966954440887 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.1518   0.7641   4.1106  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0003   0.0002   0.0008   6.6368   2.2852   2.4929
***** Episode 58233, Mean R = -18.8  Std R = 5.4  Min R = -34.8
PolicyLoss: -0.0351
Policy_Beta: 0.114
Policy_Entropy: 0.146
Policy_KL: 0.00097

ADV1:  0.003125507032857222 0.011260049720118643 0.06882754601707897 -0.20431547363938218
ADV2:  0.00779125981702119 0.7337506102728915 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.3009   0.5625   2.4336  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0037   0.0022   0.0083   6.6368   2.2852   2.4929
***** Episode 58481, Mean R = -21.9  Std R = 7.3  Min R = -42.5
PolicyLoss: -0.032
Policy_Beta: 0.114
Policy_Entropy: 0.145
Policy_KL: 0.00146
Policy_SD: 0.555
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 2.13e+07
VF_0_ExplainedVarNew: 0.987
VF_0_ExplainedVarOld: 0.978
VF_0_Loss : 0.00283


ADV1:  -0.0015456349731415562 0.011111565588251078 0.12841357141266785 -0.12164415310792909
ADV2:  0.012020329222916473 0.8621571242611551 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.6571   0.9618   5.1037  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0016   0.0009   0.0042   6.6368   2.2852   2.492

ADV1:  0.001801253976716971 0.008812316540558788 0.10258061858939518 -0.11068559727535288
ADV2:  0.0034967481882523994 0.8350196089564098 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.5429   0.6610   3.1417  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0022   0.0013   0.0047   6.6368   2.2852   2.4929
***** Episode 58760, Mean R = -19.1  Std R = 5.9  Min R = -35.4
PolicyLoss: -0.0208
Policy_Beta: 0.114
Policy_Entropy: 0.146
Policy_KL: 0.00123
Policy_SD: 0.54
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 2.14e+07
VF_0_ExplainedVarNew: 0.987
VF_0_ExplainedVarOld: 0.983
VF_0_Loss : 0.00166


ADV1:  -0.001674849239668789 0.010362637357766978 0.04681632742804476 -0.1453034131594111
ADV2:  0.02685738571375337 0.8902769921975652 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.0580   1.1238   5.2082  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0021   0.0013   0.0044   6.6368   2.2852   2.4929

ADV1:  -0.00018530198466718857 0.009001221511259238 0.09680054214673578 -0.07288076812358418
ADV2:  0.00046736300350929126 0.8210406414692337 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.5570   0.8104   4.4772  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0009   0.0004   0.0018   6.6368   2.2852   2.4929
***** Episode 59039, Mean R = -19.7  Std R = 6.4  Min R = -38.7
PolicyLoss: -0.00195
Policy_Beta: 0.114
Policy_Entropy: 0.145
Policy_KL: 0.001
Policy_SD: 0.551
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 2.15e+07
VF_0_ExplainedVarNew: 0.989
VF_0_ExplainedVarOld: 0.984
VF_0_Loss : 0.00175


ADV1:  -0.0018047557568250654 0.009221692654448185 0.08200062462187807 -0.08858369049977777
ADV2:  0.03418428742039259 0.8623934516446756 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.2811   0.7795   3.9612  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0023   0.0014   0.0047   6.6368   2.2852   

***** Episode 59287, Mean R = -18.6  Std R = 6.3  Min R = -38.8
PolicyLoss: -0.0259
Policy_Beta: 0.114
Policy_Entropy: 0.142
Policy_KL: 0.00136
Policy_SD: 0.541
Policy_lr_mult: 0.198
Steps: 1.15e+04
TotalSteps: 2.16e+07
VF_0_ExplainedVarNew: 0.989
VF_0_ExplainedVarOld: 0.987
VF_0_Loss : 0.00119


ADV1:  -0.0012303096061673175 0.008894577236423213 0.0433688979332979 -0.07629858177095439
ADV2:  0.02830511844702993 0.8655340470661247 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.1984   0.5734   2.8717  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0015   0.0009   0.0033   6.6368   2.2852   2.4929
***** Episode 59318, Mean R = -20.9  Std R = 6.0  Min R = -40.8
PolicyLoss: -0.0225
Policy_Beta: 0.114
Policy_Entropy: 0.143
Policy_KL: 0.000935
Policy_SD: 0.559
Policy_lr_mult: 0.198
Steps: 1.18e+04
TotalSteps: 2.16e+07
VF_0_ExplainedVarNew: 0.986
VF_0_ExplainedVarOld: 0.984
VF_0_Loss : 0.0013


ADV1:  0.0006908003756160959 0.006475024863717435 0.

***** Episode 59566, Mean R = -20.1  Std R = 5.0  Min R = -32.8
PolicyLoss: -0.0157
Policy_Beta: 0.114
Policy_Entropy: 0.142
Policy_KL: 0.00138
Policy_SD: 0.561
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 2.17e+07
VF_0_ExplainedVarNew: 0.99
VF_0_ExplainedVarOld: 0.987
VF_0_Loss : 0.00189


ADV1:  -0.0035314823747350566 0.009442717175253133 0.05078741870992154 -0.08103856617639038
ADV2:  0.0480304327934145 0.8448208718730044 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.7324   0.8260   3.9510  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0036   0.0023   0.0092   6.6368   2.2852   2.4929
***** Episode 59597, Mean R = -21.5  Std R = 6.7  Min R = -37.3
PolicyLoss: -0.0247
Policy_Beta: 0.114
Policy_Entropy: 0.143
Policy_KL: 0.00115
Policy_SD: 0.565
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 2.17e+07
VF_0_ExplainedVarNew: 0.987
VF_0_ExplainedVarOld: 0.984
VF_0_Loss : 0.00192


ADV1:  -0.0026282391678208385 0.011070973794027683 0.

seeker_angles |    0.00    0.00 |    0.09    0.09 |   -0.99   -0.97 |    0.97    1.00
cs_angles |  0.0014  0.0013 |  0.0891  0.0859 | -0.9893 -0.9749 |  0.9719  0.9955
optical_flow | -0.0001  0.0002 |  0.0262  0.0246 | -1.0674 -1.0736 |  0.9772  1.1926
v_err    | -0.0087 |  0.0547 | -0.4520 |  0.1236
landing_rewards |    8.90 |    3.12 |    0.00 |   10.00
landing_margin |   -0.02 |    0.02 |   -0.07 |    0.05
tracking_rewards |  -24.29 |    5.06 |  -55.26 |  -14.77
steps    |     377 |      20 |     335 |     420
***** Episode 59876, Mean R = -20.4  Std R = 6.1  Min R = -40.0
PolicyLoss: -0.0154
Policy_Beta: 0.114
Policy_Entropy: 0.142
Policy_KL: 0.00149
Policy_SD: 0.563
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 2.18e+07
VF_0_ExplainedVarNew: 0.984
VF_0_ExplainedVarOld: 0.981
VF_0_Loss : 0.00295


ADV1:  -0.002317284629391208 0.01084576802130917 0.045498652966561894 -0.05880303280298782
ADV2:  0.033257072191680025 0.9045992015982507 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Ma

attitude |    0.04   -0.01   -0.11 |    1.18    0.63    1.80 |   -3.14   -1.56   -3.14 |    3.14    1.55    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.08   -0.06   -0.05 |    0.08    0.07    0.08
a_f      |   -0.01   -0.10 |    0.64    1.79 |   -1.52   -3.13 |    1.51    3.14
w_f      |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.03 |    0.04    0.02    0.03
w_rewards |   -0.41 |    0.35 |   -2.91 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.28 |    0.30 |    0.00 |    2.90
seeker_angles |   -0.00    0.00 |    0.09    0.09 |   -0.99   -0.99 |    0.99    0.99
cs_angles | -0.0001  0.0044 |  0.0871  0.0882 | -0.9936 -0.9863 |  0.9923  0.9885
optical_flow | -0.0000  0.0003 |  0.0256  0.0257 | -1.2762 -0.9615 |  1.2009  1.1495
v_err    | -0.0089 |  0.0550 | -0.4551 |  0.1282
landing_rewards |    9.19 |    2.72 |    0.00 |   10.00
landing_margin |   -0

attitude |   -0.02    0.02   -0.08 |    1.19    0.64    1.85 |   -3.14   -1.56   -3.14 |    3.14    1.54    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.10   -0.05   -0.05 |    0.09    0.07    0.07
a_f      |    0.02   -0.13 |    0.64    1.82 |   -1.45   -3.14 |    1.44    3.05
w_f      |    0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.03 |    0.05    0.02    0.02
w_rewards |   -0.43 |    0.40 |   -3.79 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.29 |    0.31 |    0.00 |    2.97
seeker_angles |    0.00    0.00 |    0.09    0.09 |   -1.00   -0.98 |    1.00    1.00
cs_angles |  0.0017  0.0019 |  0.0875  0.0889 | -0.9963 -0.9828 |  0.9989  0.9993
optical_flow | -0.0000  0.0001 |  0.0277  0.0268 | -1.2094 -1.3307 |  1.3110  1.1557
v_err    | -0.0087 |  0.0550 | -0.4577 |  0.1644
landing_rewards |    9.55 |    2.08 |    0.00 |   10.00
landing_margin |   -0

attitude |   -0.01   -0.01    0.03 |    1.26    0.65    1.90 |   -3.14   -1.56   -3.14 |    3.14    1.55    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.09   -0.05   -0.05 |    0.09    0.07    0.07
a_f      |   -0.01    0.13 |    0.67    1.90 |   -1.40   -3.06 |    1.46    3.13
w_f      |    0.00   -0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.02 |    0.03    0.03    0.02
w_rewards |   -0.42 |    0.34 |   -2.04 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.29 |    0.30 |    0.00 |    3.00
seeker_angles |    0.00    0.00 |    0.09    0.09 |   -1.00   -0.93 |    1.00    0.97
cs_angles |  0.0018  0.0035 |  0.0882  0.0886 | -0.9987 -0.9283 |  0.9952  0.9738
optical_flow | -0.0001  0.0001 |  0.0266  0.0256 | -1.0696 -1.1592 |  1.4684  1.1472
v_err    | -0.0089 |  0.0546 | -0.4518 |  0.1090
landing_rewards |    9.26 |    2.62 |    0.00 |   10.00
landing_margin |   -0

attitude |   -0.10   -0.01   -0.08 |    1.14    0.66    1.87 |   -3.14   -1.55   -3.14 |    3.14    1.53    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.08   -0.05   -0.05 |    0.10    0.07    0.08
a_f      |   -0.01   -0.11 |    0.66    1.85 |   -1.49   -3.12 |    1.53    3.14
w_f      |    0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.03   -0.02 |    0.04    0.03    0.02
w_rewards |   -0.43 |    0.36 |   -2.97 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.28 |    0.30 |    0.00 |    2.92
seeker_angles |   -0.00    0.01 |    0.09    0.09 |   -1.00   -0.98 |    0.98    1.00
cs_angles | -0.0019  0.0063 |  0.0856  0.0888 | -0.9992 -0.9762 |  0.9823  0.9962
optical_flow | -0.0001  0.0000 |  0.0242  0.0253 | -1.1046 -1.2463 |  0.9847  1.2102
v_err    | -0.0092 |  0.0545 | -0.4523 |  0.1217
landing_rewards |    9.52 |    2.15 |    0.00 |   10.00
landing_margin |   -0

attitude |   -0.08   -0.02   -0.04 |    1.21    0.68    1.83 |   -3.14   -1.56   -3.14 |    3.14    1.55    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.08   -0.05   -0.05 |    0.09    0.07    0.07
a_f      |   -0.03    0.00 |    0.68    1.84 |   -1.39   -3.12 |    1.41    3.13
w_f      |    0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.03   -0.02 |    0.04    0.03    0.03
w_rewards |   -0.42 |    0.33 |   -2.06 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.28 |    0.30 |    0.00 |    2.94
seeker_angles |    0.00    0.00 |    0.08    0.09 |   -0.99   -0.98 |    0.99    0.99
cs_angles |  0.0012  0.0023 |  0.0835  0.0876 | -0.9895 -0.9771 |  0.9947  0.9927
optical_flow | -0.0000  0.0000 |  0.0264  0.0245 | -1.0891 -1.1179 |  1.1716  0.8830
v_err    | -0.0089 |  0.0543 | -0.4519 |  0.1255
landing_rewards |    9.39 |    2.40 |    0.00 |   10.00
landing_margin |   -0

thrust   |   -0.00   -0.00   -0.00 |    0.68    0.69    0.68 |   -3.44   -3.44   -3.45 |    3.45    3.46    3.43
norm_thrust |    0.91 |    0.76 |    0.00 |    3.46
fuel     |    1.57 |    0.19 |    1.14 |    2.27
rewards  |  -19.46 |    5.44 |  -41.82 |   -9.67
fuel_rewards |   -4.51 |    0.53 |   -6.48 |   -3.26
glideslope_rewards |    0.00 |    0.00 |    0.00 |    0.00
glideslope_penalty |    0.00 |    0.00 |    0.00 |    0.00
glideslope |    2.91 |   12.80 |    0.01 |  304.39
norm_af  |    1.71 |    0.90 |    0.08 |    3.18
norm_wf  |    0.01 |    0.01 |    0.00 |    0.04
rh_penalty |    0.00 |    0.00 |    0.00 |    0.00
att_rewards |    0.00 |    0.00 |    0.00 |    0.00
att_penalty |    0.00 |    0.00 |    0.00 |    0.00
attitude |    0.00    0.03   -0.01 |    1.21    0.67    1.83 |   -3.14   -1.56   -3.14 |    3.14    1.54    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.08   -0.05   -0.05 |    0.09    0.07    0.08
a_f      |    0.03   -0.04 |    0.67

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.4429   0.6563   3.6702  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0007   0.0004   0.0015   6.6368   2.2852   2.4929
Update Cnt = 2000    ET =   1051.4   Stats:  Mean, Std, Min, Max
r_f      |  -12.95  -14.96   17.01 |  179.42  162.19  205.88 | -388.10 -382.03 -382.99 |  374.88  390.57  391.74
v_f      |    0.00    0.00    0.00 |    0.04    0.04    0.05 |   -0.11   -0.12   -0.09 |    0.10    0.10    0.12
r_i      |  -24.61  -36.54   27.58 |  660.97  635.35  792.31 |-1348.27-1264.03-1237.23 | 1263.03 1312.16 1319.29
v_i      |    0.00    0.00   -0.00 |    0.04    0.04    0.05 |   -0.10   -0.09   -0.10 |    0.10    0.09    0.10
norm_rf  |    0.25 |    0.10 |    0.04 |    0.53
norm_vf  |    0.08 |    0.02 |    0.04 |    0.13
gs_f     |    1.35 |    2.18 |    0.01 |   27.96
thrust   |   -0.01   -0.00    0.00 |    0.69    0.68    0.70 |   -3.46   -3.44   -3.46 |    3.46    3.38    3.45
norm_thrust |    

ADV1:  -0.001292770916698019 0.00860854280088914 0.1464524102468152 -0.06361109397258419
ADV2:  0.021423938319638763 0.8294601832161365 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.2805   0.5290   2.2697  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0013   0.0008   0.0035   6.6368   2.2852   2.4929
***** Episode 62325, Mean R = -20.5  Std R = 5.7  Min R = -36.6
PolicyLoss: -0.0137
Policy_Beta: 0.114
Policy_Entropy: 0.146
Policy_KL: 0.00112
Policy_SD: 0.56
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 2.27e+07
VF_0_ExplainedVarNew: 0.99
VF_0_ExplainedVarOld: 0.985
VF_0_Loss : 0.00112


Dynamics: Max Disturbance (m/s^2):  [0.00126622 0.00130788 0.00159816] 0.002422386686932909
ADV1:  -0.0018707418989201083 0.00901017300183939 0.06425159951372189 -0.06844263169033035
ADV2:  0.04058300778789778 0.8049389596068007 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.3986   1.3043   6.5455  23.6511  13.7419   8.3767
ValFun  Grad

Dynamics: Max Disturbance (m/s^2):  [0.00126622 0.00130788 0.00159816] 0.002422386686932909
ADV1:  -0.0014217609098011107 0.010513656253203413 0.061218277395798826 -0.060605909327558355
ADV2:  0.016107661216384517 0.9323015431770546 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.0392   0.4529   2.6804  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0016   0.0009   0.0036   6.6368   2.2852   2.4929
***** Episode 62604, Mean R = -18.4  Std R = 5.7  Min R = -33.2
PolicyLoss: -0.0114
Policy_Beta: 0.114
Policy_Entropy: 0.147
Policy_KL: 0.00101
Policy_SD: 0.541
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 2.28e+07
VF_0_ExplainedVarNew: 0.976
VF_0_ExplainedVarOld: 0.974
VF_0_Loss : 0.00102


ADV1:  0.0008881913510231475 0.00797603800933202 0.057839989897996436 -0.06767439416109561
ADV2:  0.006260236449450666 0.8584699878309238 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.9229   1.4324   7.4547  23.6511  13.7419   8.3767
ValF

***** Episode 62852, Mean R = -19.1  Std R = 4.4  Min R = -30.2
PolicyLoss: -0.0304
Policy_Beta: 0.114
Policy_Entropy: 0.145
Policy_KL: 0.00109
Policy_SD: 0.553
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 2.29e+07
VF_0_ExplainedVarNew: 0.978
VF_0_ExplainedVarOld: 0.973
VF_0_Loss : 0.00175


Dynamics: Max Disturbance (m/s^2):  [0.00126622 0.00130788 0.00159816] 0.002422386686932909
ADV1:  0.0026739989194155813 0.009816869381418993 0.05426913226498209 -0.22261805550954983
ADV2:  -0.0025009988517185424 0.7807251959786777 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   3.3061   2.1198  10.9627  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0032   0.0019   0.0071   6.6368   2.2852   2.4929
***** Episode 62883, Mean R = -18.9  Std R = 5.2  Min R = -33.1
PolicyLoss: -0.0238
Policy_Beta: 0.0759
Policy_Entropy: 0.144
Policy_KL: 0.00216
Policy_SD: 0.553
Policy_lr_mult: 0.198
Steps: 1.18e+04
TotalSteps: 2.29e+07
VF_0_ExplainedVarNew: 0.985
VF_0_E

ADV1:  0.002637462092079342 0.010416155838385644 0.19583950514031206 -0.07677773219531962
ADV2:  0.007656388381603616 0.8227070001891941 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.7138   0.9513   4.7529  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0031   0.0020   0.0071   6.6368   2.2852   2.4929
***** Episode 63131, Mean R = -20.6  Std R = 5.7  Min R = -35.3
PolicyLoss: -0.0268
Policy_Beta: 0.114
Policy_Entropy: 0.145
Policy_KL: 0.00164
Policy_SD: 0.552
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 2.3e+07
VF_0_ExplainedVarNew: 0.982
VF_0_ExplainedVarOld: 0.979
VF_0_Loss : 0.00101


ADV1:  -0.0029688141480917487 0.0085515047508597 0.0557755721347557 -0.07881783912508064
ADV2:  0.04040812946576631 0.8355973834207467 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.7100   0.9491   5.1374  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0031   0.0020   0.0076   6.6368   2.2852   2.4929
*

Dynamics: Max Disturbance (m/s^2):  [0.00126622 0.00130788 0.00159816] 0.002422386686932909
ADV1:  -0.00010851179674615782 0.010583847551441051 0.05749055157597521 -0.3346628247798986
ADV2:  0.020029933229384053 0.7732551753476047 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.1653   0.6474   2.7295  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0014   0.0008   0.0033   6.6368   2.2852   2.4929
***** Episode 63410, Mean R = -20.8  Std R = 9.6  Min R = -60.4
PolicyLoss: -0.0237
Policy_Beta: 0.114
Policy_Entropy: 0.145
Policy_KL: 0.00117
Policy_SD: 0.561
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 2.31e+07
VF_0_ExplainedVarNew: 0.987
VF_0_ExplainedVarOld: 0.981
VF_0_Loss : 0.00255


ADV1:  -8.692213596907147e-05 0.009773070746947467 0.2904622070889696 -0.06036649452868209
ADV2:  -0.005274008277856299 0.7832312631192829 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.1734   1.6131   7.7320  23.6511  13.7419   8.3767
ValFu

***** Episode 63658, Mean R = -18.6  Std R = 5.9  Min R = -33.9
PolicyLoss: -0.0277
Policy_Beta: 0.114
Policy_Entropy: 0.145
Policy_KL: 0.00122
Policy_SD: 0.55
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 2.32e+07
VF_0_ExplainedVarNew: 0.985
VF_0_ExplainedVarOld: 0.984
VF_0_Loss : 0.00108


ADV1:  -0.0006449165296035774 0.009668482518920466 0.14429013108711153 -0.15626953639264496
ADV2:  0.01635250084798112 0.7959924857427358 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.6429   0.6347   3.5384  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0012   0.0006   0.0026   6.6368   2.2852   2.4929
***** Episode 63689, Mean R = -19.9  Std R = 6.9  Min R = -42.9
PolicyLoss: -0.0156
Policy_Beta: 0.114
Policy_Entropy: 0.147
Policy_KL: 0.00139
Policy_SD: 0.553
Policy_lr_mult: 0.198
Steps: 1.19e+04
TotalSteps: 2.32e+07
VF_0_ExplainedVarNew: 0.986
VF_0_ExplainedVarOld: 0.981
VF_0_Loss : 0.00171


ADV1:  0.0021031433760182283 0.012708144505950843 0.

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.9408   0.9280   3.9467  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0010   0.0004   0.0016   6.6368   2.2852   2.4929
***** Episode 63937, Mean R = -20.7  Std R = 7.9  Min R = -39.5
PolicyLoss: 0.0163
Policy_Beta: 0.114
Policy_Entropy: 0.147
Policy_KL: 0.00127
Policy_SD: 0.544
Policy_lr_mult: 0.198
Steps: 1.18e+04
TotalSteps: 2.33e+07
VF_0_ExplainedVarNew: 0.986
VF_0_ExplainedVarOld: 0.974
VF_0_Loss : 0.00136


ADV1:  0.0008256830177167538 0.00850885146663313 0.06281722858756533 -0.06618298742263251
ADV2:  0.01185665012416001 0.8235130257197808 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.0945   1.4039   7.1760  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0012   0.0007   0.0025   6.6368   2.2852   2.4929
***** Episode 63968, Mean R = -19.9  Std R = 5.5  Min R = -32.8
PolicyLoss: -0.024
Policy_Beta: 0.114
Policy_Entropy: 0.147
Policy_KL: 0.00134
Pol

optical_flow |  0.0000 -0.0000 |  0.0256  0.0244 | -0.9227 -1.2812 |  1.2460  1.0447
v_err    | -0.0091 |  0.0554 | -0.4519 |  0.1257
landing_rewards |    9.32 |    2.51 |    0.00 |   10.00
landing_margin |   -0.02 |    0.01 |   -0.05 |    0.04
tracking_rewards |  -24.63 |    5.20 |  -47.13 |  -15.33
steps    |     379 |      20 |     333 |     418
***** Episode 64216, Mean R = -20.5  Std R = 6.5  Min R = -44.1
PolicyLoss: -0.00936
Policy_Beta: 0.114
Policy_Entropy: 0.147
Policy_KL: 0.00164
Policy_SD: 0.554
Policy_lr_mult: 0.198
Steps: 1.18e+04
TotalSteps: 2.34e+07
VF_0_ExplainedVarNew: 0.986
VF_0_ExplainedVarOld: 0.982
VF_0_Loss : 0.002


ADV1:  -0.0029683973788678544 0.011254065304939418 0.06571039684013491 -0.07085194311315196
ADV2:  0.029940677629261798 0.9199862756753533 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.9367   1.1579   5.6104  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0038   0.0022   0.0077   6.6368   2.2852   2.492

attitude |    0.02    0.05    0.04 |    1.18    0.67    1.88 |   -3.14   -1.54   -3.14 |    3.14    1.55    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.09   -0.05   -0.05 |    0.07    0.08    0.07
a_f      |    0.06    0.04 |    0.68    1.89 |   -1.51   -3.12 |    1.49    3.12
w_f      |    0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.02 |    0.04    0.03    0.02
w_rewards |   -0.42 |    0.36 |   -3.19 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.27 |    0.31 |    0.00 |    3.09
seeker_angles |    0.00   -0.00 |    0.08    0.09 |   -0.98   -1.00 |    0.96    0.99
cs_angles |  0.0004 -0.0015 |  0.0840  0.0874 | -0.9752 -0.9969 |  0.9593  0.9913
optical_flow |  0.0001  0.0001 |  0.0249  0.0254 | -1.0170 -0.9835 |  1.2021  1.2125
v_err    | -0.0091 |  0.0553 | -0.4773 |  0.2136
landing_rewards |    9.58 |    2.00 |    0.00 |   10.00
landing_margin |   -0

attitude |    0.13    0.03    0.07 |    1.21    0.66    1.85 |   -3.14   -1.56   -3.14 |    3.14    1.56    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.09   -0.06   -0.05 |    0.08    0.08    0.07
a_f      |    0.04    0.07 |    0.65    1.84 |   -1.42   -3.13 |    1.51    3.13
w_f      |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.03   -0.03   -0.03 |    0.04    0.03    0.02
w_rewards |   -0.43 |    0.35 |   -2.82 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.28 |    0.31 |    0.00 |    3.04
seeker_angles |   -0.00    0.00 |    0.09    0.09 |   -0.99   -0.99 |    0.98    0.99
cs_angles | -0.0006  0.0027 |  0.0859  0.0873 | -0.9865 -0.9863 |  0.9848  0.9932
optical_flow | -0.0001  0.0000 |  0.0250  0.0251 | -1.3359 -1.0654 |  0.8383  1.2841
v_err    | -0.0091 |  0.0550 | -0.4529 |  0.1128
landing_rewards |    9.61 |    1.93 |    0.00 |   10.00
landing_margin |   -0

thrust   |    0.00    0.00   -0.00 |    0.68    0.68    0.68 |   -3.44   -3.46   -3.46 |    3.43    3.44    3.46
norm_thrust |    0.90 |    0.76 |    0.00 |    3.46
fuel     |    1.55 |    0.19 |    1.11 |    2.09
rewards  |  -19.21 |    6.05 |  -45.43 |   -9.17
fuel_rewards |   -4.43 |    0.53 |   -5.97 |   -3.17
glideslope_rewards |    0.00 |    0.00 |    0.00 |    0.00
glideslope_penalty |    0.00 |    0.00 |    0.00 |    0.00
glideslope |    3.21 |   13.06 |    0.01 |  578.09
norm_af  |    1.83 |    0.94 |    0.09 |    3.26
norm_wf  |    0.01 |    0.01 |    0.00 |    0.05
rh_penalty |    0.00 |    0.00 |    0.00 |    0.00
att_rewards |    0.00 |    0.00 |    0.00 |    0.00
att_penalty |    0.00 |    0.00 |    0.00 |    0.00
attitude |   -0.09    0.01    0.08 |    1.26    0.65    1.94 |   -3.14   -1.56   -3.14 |    3.14    1.56    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.09   -0.05   -0.05 |    0.10    0.08    0.08
a_f      |    0.02    0.04 |    0.65

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.3549   1.4100   6.2067  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0027   0.0016   0.0056   6.6368   2.2852   2.4929
Update Cnt = 2110    ET =   1111.8   Stats:  Mean, Std, Min, Max
r_f      |  -11.98   13.05    2.67 |  192.12  176.16  196.14 | -386.37 -367.79 -363.49 |  390.70  389.89  397.76
v_f      |    0.00    0.00   -0.00 |    0.05    0.04    0.05 |   -0.11   -0.12   -0.10 |    0.10    0.12    0.12
r_i      |  -30.83   20.89  -28.19 |  701.51  665.65  748.41 |-1385.46-1329.74-1372.40 | 1272.69 1347.73 1266.21
v_i      |    0.00   -0.00    0.00 |    0.04    0.04    0.05 |   -0.09   -0.09   -0.10 |    0.10    0.09    0.10
norm_rf  |    0.24 |    0.10 |    0.02 |    0.53
norm_vf  |    0.08 |    0.02 |    0.04 |    0.13
gs_f     |    1.05 |    1.19 |    0.01 |   10.96
thrust   |    0.00    0.00    0.00 |    0.68    0.68    0.69 |   -3.46   -3.39   -3.45 |    3.45    3.45    3.46
norm_thrust |    

ADV1:  -0.0016054355917986358 0.009134437216989024 0.05421653541877364 -0.06941902098290509
ADV2:  0.03029906678030576 0.8615632460795412 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   5.9235   6.1059  15.7228  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0016   0.0010   0.0041   6.6368   2.2852   2.4929
***** Episode 65735, Mean R = -17.7  Std R = 5.2  Min R = -33.8
PolicyLoss: -0.0218
Policy_Beta: 0.114
Policy_Entropy: 0.151
Policy_KL: 0.000454
Policy_SD: 0.528
Policy_lr_mult: 0.198
Steps: 1.15e+04
TotalSteps: 2.4e+07
VF_0_ExplainedVarNew: 0.983
VF_0_ExplainedVarOld: 0.98
VF_0_Loss : 0.00138


ADV1:  -0.0015598521277507052 0.006991501283941613 0.06390419335820635 -0.05162422103702228
ADV2:  0.0333905547665995 0.8321719742974912 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.5874   1.8759   9.9133  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0023   0.0013   0.0049   6.6368   2.2852   2.492

ADV1:  0.001396880338915708 0.008270046070085144 0.046551754258174205 -0.1027462299678219
ADV2:  0.011387983943548579 0.8371083930834051 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.0876   1.2562   6.2509  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0017   0.0011   0.0037   6.6368   2.2852   2.4929
***** Episode 66014, Mean R = -20.6  Std R = 6.1  Min R = -39.9
PolicyLoss: -0.0283
Policy_Beta: 0.114
Policy_Entropy: 0.148
Policy_KL: 0.00146
Policy_SD: 0.557
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 2.41e+07
VF_0_ExplainedVarNew: 0.99
VF_0_ExplainedVarOld: 0.988
VF_0_Loss : 0.000903


ADV1:  -0.0002727569205314501 0.006691353748526156 0.0802057691469878 -0.08469095797491172
ADV2:  0.015620417437301356 0.8149602773695998 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.2233   0.7854   3.7353  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0006   0.0004   0.0013   6.6368   2.2852   2.49

***** Episode 66262, Mean R = -19.2  Std R = 5.2  Min R = -31.6
PolicyLoss: 0.0271
Policy_Beta: 0.114
Policy_Entropy: 0.149
Policy_KL: 0.00144
Policy_SD: 0.547
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 2.42e+07
VF_0_ExplainedVarNew: 0.965
VF_0_ExplainedVarOld: 0.865
VF_0_Loss : 0.000334


ADV1:  0.006878703814615344 0.01227238910380538 0.2652572804516945 -0.08929335338481209
ADV2:  -0.03319155629563023 0.8674286416242702 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.2592   1.1873   5.2259  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0085   0.0051   0.0177   6.6368   2.2852   2.4929
***** Episode 66293, Mean R = -19.1  Std R = 5.1  Min R = -38.6
PolicyLoss: -0.00759
Policy_Beta: 0.114
Policy_Entropy: 0.149
Policy_KL: 0.00156
Policy_SD: 0.548
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 2.42e+07
VF_0_ExplainedVarNew: 0.978
VF_0_ExplainedVarOld: 0.968
VF_0_Loss : 0.000137


Dynamics: Max Disturbance (m/s^2):  [0.00126622 0.00

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.8989   1.2009   5.6775  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0005   0.0003   0.0011   6.6368   2.2852   2.4929
***** Episode 66541, Mean R = -20.0  Std R = 6.5  Min R = -35.6
PolicyLoss: -0.0268
Policy_Beta: 0.114
Policy_Entropy: 0.15
Policy_KL: 0.00126
Policy_SD: 0.544
Policy_lr_mult: 0.198
Steps: 1.19e+04
TotalSteps: 2.43e+07
VF_0_ExplainedVarNew: 0.983
VF_0_ExplainedVarOld: 0.977
VF_0_Loss : 0.000866


ADV1:  0.00130213195973474 0.008113347091190163 0.07925642663296656 -0.06131039079785483
ADV2:  0.003760154013037467 0.8159988111384973 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.1784   0.8902   4.9457  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0017   0.0010   0.0036   6.6368   2.2852   2.4929
***** Episode 66572, Mean R = -17.9  Std R = 5.0  Min R = -30.9
PolicyLoss: -0.0181
Policy_Beta: 0.114
Policy_Entropy: 0.15
Policy_KL: 0.00148
Po

ADV1:  0.001142181228795493 0.009293600702737766 0.11308584226216978 -0.08437338600298327
ADV2:  0.02022117128375976 0.7853905706716531 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.0988   1.0078   5.1892  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0014   0.0007   0.0029   6.6368   2.2852   2.4929
***** Episode 66820, Mean R = -21.3  Std R = 6.1  Min R = -40.9
PolicyLoss: -0.0328
Policy_Beta: 0.114
Policy_Entropy: 0.15
Policy_KL: 0.00146
Policy_SD: 0.551
Policy_lr_mult: 0.198
Steps: 1.2e+04
TotalSteps: 2.44e+07
VF_0_ExplainedVarNew: 0.986
VF_0_ExplainedVarOld: 0.985
VF_0_Loss : 0.000422


Dynamics: Max Disturbance (m/s^2):  [0.00126622 0.00130788 0.00159816] 0.002422386686932909
ADV1:  -0.0017233867544353529 0.007462047866010579 0.05126312848787934 -0.16406412194751585
ADV2:  0.027212795569959876 0.7926584564523625 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.2936   0.8095   3.6688  23.6511  13.7419   8.3767
ValFun  G

ADV1:  -0.0005921742542586741 0.010618291294488281 0.13135904594550601 -0.09007313922718463
ADV2:  0.01716150262548848 0.8616579559718546 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.3164   1.5436   6.9267  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0010   0.0005   0.0020   6.6368   2.2852   2.4929
***** Episode 67099, Mean R = -19.3  Std R = 5.1  Min R = -33.4
PolicyLoss: -0.0168
Policy_Beta: 0.114
Policy_Entropy: 0.148
Policy_KL: 0.000977
Policy_SD: 0.551
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 2.45e+07
VF_0_ExplainedVarNew: 0.978
VF_0_ExplainedVarOld: 0.975
VF_0_Loss : 0.002


Dynamics: Max Disturbance (m/s^2):  [0.00126622 0.00130788 0.00159816] 0.002422386686932909
ADV1:  0.001023266896479559 0.007741825830989257 0.08769523608559288 -0.09757505906923392
ADV2:  0.005767887279221426 0.8501597878595238 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.4807   0.6343   3.5963  23.6511  13.7419   8.3767
ValFun  G

Dynamics: Max Disturbance (m/s^2):  [0.00126622 0.00130788 0.00159816] 0.002422386686932909
ADV1:  0.0009189080771273083 0.0078819060026436 0.03543302668388365 -0.10753368001071523
ADV2:  0.013768037887955387 0.8536134538176914 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.8482   0.7414   3.6595  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0011   0.0006   0.0025   6.6368   2.2852   2.4929
***** Episode 67378, Mean R = -18.4  Std R = 6.4  Min R = -32.1
PolicyLoss: -0.026
Policy_Beta: 0.114
Policy_Entropy: 0.152
Policy_KL: 0.00146
Policy_SD: 0.53
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 2.46e+07
VF_0_ExplainedVarNew: 0.989
VF_0_ExplainedVarOld: 0.987
VF_0_Loss : 0.000755


ADV1:  -0.001439922415483605 0.008696299548691298 0.05913289631171009 -0.054786128511644994
ADV2:  0.02766829265373705 0.8655403679807326 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   3.3801   1.9803  10.2434  23.6511  13.7419   8.3767
ValFun  Gr

Dynamics: Max Disturbance (m/s^2):  [0.00126622 0.00130788 0.00159816] 0.002422386686932909
ADV1:  0.002001404584690233 0.009953810044580454 0.06750064475917306 -0.15529716310782193
ADV2:  0.008669330890118386 0.8044139103055135 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.0300   1.2195   5.9238  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0022   0.0012   0.0051   6.6368   2.2852   2.4929
***** Episode 67657, Mean R = -19.7  Std R = 4.8  Min R = -30.6
PolicyLoss: -0.027
Policy_Beta: 0.114
Policy_Entropy: 0.152
Policy_KL: 0.0012
Policy_SD: 0.538
Policy_lr_mult: 0.198
Steps: 1.15e+04
TotalSteps: 2.47e+07
VF_0_ExplainedVarNew: 0.984
VF_0_ExplainedVarOld: 0.981
VF_0_Loss : 0.00369


ADV1:  -0.00042400106243450523 0.010935489693280929 0.07676745444414634 -0.16901937604668837
ADV2:  0.01974979956581119 0.8560104651557207 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.0242   1.5178   7.8226  23.6511  13.7419   8.3767
ValFun  G

cs_angles |  0.0043  0.0021 |  0.0840  0.0865 | -0.9930 -0.9842 |  0.9966  0.9847
optical_flow | -0.0001  0.0000 |  0.0268  0.0258 | -1.3275 -1.1998 |  1.4783  1.2309
v_err    | -0.0088 |  0.0547 | -0.4524 |  0.1051
landing_rewards |    9.45 |    2.28 |    0.00 |   10.00
landing_margin |   -0.02 |    0.01 |   -0.06 |    0.02
tracking_rewards |  -23.45 |    4.77 |  -49.60 |  -15.58
steps    |     378 |      21 |     335 |     419
***** Episode 67936, Mean R = -19.4  Std R = 5.9  Min R = -33.1
PolicyLoss: -0.0245
Policy_Beta: 0.114
Policy_Entropy: 0.153
Policy_KL: 0.00185
Policy_SD: 0.542
Policy_lr_mult: 0.198
Steps: 1.18e+04
TotalSteps: 2.48e+07
VF_0_ExplainedVarNew: 0.986
VF_0_ExplainedVarOld: 0.982
VF_0_Loss : 0.00176


ADV1:  0.0014815657050761958 0.008544527607357005 0.1315227282921695 -0.08697188712411513
ADV2:  0.0017689713340187025 0.7946593799022114 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.8339   0.8537   4.0652  23.6511  13.7419   8.3767
ValFun  Gradients: 

w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.09   -0.05   -0.05 |    0.10    0.08    0.07
a_f      |    0.01   -0.20 |    0.68    1.91 |   -1.51   -3.13 |    1.42    3.08
w_f      |    0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.02 |    0.10    0.02    0.02
w_rewards |   -0.41 |    0.37 |   -3.76 |    0.00
w_penalty |   -0.32 |    5.67 | -100.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.27 |    0.30 |    0.00 |    2.91
seeker_angles |   -0.00   -0.00 |    0.09    0.09 |   -1.00   -1.00 |    1.00    0.99
cs_angles | -0.0014 -0.0025 |  0.0863  0.0853 | -0.9992 -0.9991 |  0.9987  0.9914
optical_flow | -0.0001  0.0001 |  0.0251  0.0265 | -0.8812 -1.0340 |  1.0784  1.1663
v_err    | -0.0091 |  0.0554 | -0.4645 |  0.1205
landing_rewards |    9.68 |    1.77 |    0.00 |   10.00
landing_margin |    3.15 |   55.82 |   -0.06 |  984.43
tracking_rewards |  -23.60 |    4.56 |  -38.35 |  -12.86
steps    |     375 |  

attitude |   -0.07   -0.05    0.07 |    1.23    0.65    1.88 |   -3.14   -1.56   -3.14 |    3.14    1.55    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.08   -0.05   -0.05 |    0.09    0.07    0.07
a_f      |   -0.04   -0.01 |    0.66    1.87 |   -1.42   -3.12 |    1.44    3.14
w_f      |    0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.02 |    0.04    0.03    0.02
w_rewards |   -0.41 |    0.31 |   -2.03 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.26 |    0.29 |    0.00 |    3.02
seeker_angles |   -0.00    0.00 |    0.09    0.08 |   -0.99   -0.99 |    0.98    1.00
cs_angles | -0.0006  0.0011 |  0.0851  0.0830 | -0.9916 -0.9940 |  0.9846  0.9980
optical_flow | -0.0001  0.0001 |  0.0247  0.0258 | -0.8146 -0.9004 |  1.3811  1.2860
v_err    | -0.0094 |  0.0559 | -0.7018 |  0.1203
landing_rewards |    9.48 |    2.21 |    0.00 |   10.00
landing_margin |   -0

attitude |   -0.14   -0.02    0.04 |    1.26    0.70    1.90 |   -3.14   -1.57   -3.14 |    3.14    1.56    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.07   -0.05   -0.05 |    0.08    0.07    0.08
a_f      |   -0.02    0.12 |    0.71    1.90 |   -1.56   -3.11 |    1.48    3.14
w_f      |    0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.02   -0.02   -0.02 |    0.04    0.02    0.02
w_rewards |   -0.39 |    0.29 |   -1.32 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.26 |    0.29 |    0.00 |    3.04
seeker_angles |    0.00    0.00 |    0.08    0.09 |   -1.00   -0.98 |    0.98    1.00
cs_angles |  0.0021  0.0025 |  0.0843  0.0855 | -0.9966 -0.9827 |  0.9789  0.9977
optical_flow | -0.0001  0.0001 |  0.0250  0.0261 | -1.3521 -0.9979 |  1.1052  1.0704
v_err    | -0.0093 |  0.0541 | -0.4655 |  0.1144
landing_rewards |    9.42 |    2.34 |    0.00 |   10.00
landing_margin |   -0

attitude |   -0.04   -0.02   -0.05 |    1.17    0.68    1.85 |   -3.14   -1.57   -3.14 |    3.14    1.54    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.09   -0.05   -0.05 |    0.07    0.08    0.07
a_f      |   -0.01   -0.09 |    0.67    1.84 |   -1.54   -3.10 |    1.54    3.12
w_f      |    0.00   -0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.02 |    0.04    0.02    0.02
w_rewards |   -0.41 |    0.33 |   -2.69 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.26 |    0.30 |    0.00 |    3.04
seeker_angles |    0.00   -0.00 |    0.08    0.09 |   -0.99   -1.00 |    0.96    0.99
cs_angles |  0.0033 -0.0009 |  0.0812  0.0872 | -0.9893 -0.9955 |  0.9595  0.9910
optical_flow | -0.0002  0.0000 |  0.0245  0.0261 | -1.0939 -1.0395 |  1.0635  1.2628
v_err    | -0.0096 |  0.0552 | -0.4534 |  0.1036
landing_rewards |    9.58 |    2.00 |    0.00 |   10.00
landing_margin |   -0

attitude |   -0.04   -0.05   -0.20 |    1.13    0.66    1.77 |   -3.14   -1.57   -3.14 |    3.14    1.57    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.08   -0.05   -0.05 |    0.09    0.07    0.07
a_f      |   -0.06   -0.25 |    0.67    1.76 |   -1.50   -3.14 |    1.46    3.12
w_f      |    0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.02   -0.02   -0.02 |    0.03    0.03    0.02
w_rewards |   -0.40 |    0.34 |   -2.15 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.27 |    0.30 |    0.00 |    3.03
seeker_angles |    0.00   -0.00 |    0.09    0.09 |   -0.98   -0.99 |    1.00    0.99
cs_angles |  0.0029 -0.0005 |  0.0863  0.0864 | -0.9806 -0.9916 |  0.9963  0.9938
optical_flow | -0.0000  0.0000 |  0.0259  0.0261 | -1.0475 -1.2147 |  0.9973  1.1183
v_err    | -0.0093 |  0.0543 | -0.4536 |  0.1254
landing_rewards |    9.58 |    2.00 |    0.00 |   10.00
landing_margin |   -0

attitude |   -0.00    0.06    0.08 |    1.26    0.65    1.88 |   -3.14   -1.55   -3.14 |    3.14    1.57    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.07   -0.05   -0.05 |    0.09    0.08    0.07
a_f      |    0.05    0.10 |    0.66    1.87 |   -1.46   -3.14 |    1.40    3.11
w_f      |    0.00   -0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.03   -0.03 |    0.03    0.03    0.02
w_rewards |   -0.41 |    0.33 |   -2.24 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.26 |    0.30 |    0.00 |    3.09
seeker_angles |    0.00    0.00 |    0.09    0.08 |   -1.00   -0.99 |    1.00    0.99
cs_angles |  0.0001  0.0014 |  0.0873  0.0830 | -0.9990 -0.9924 |  0.9970  0.9896
optical_flow | -0.0001  0.0001 |  0.0254  0.0269 | -1.5291 -1.3478 |  1.0312  1.3231
v_err    | -0.0094 |  0.0547 | -0.4526 |  0.1213
landing_rewards |    9.26 |    2.62 |    0.00 |   10.00
landing_margin |   -0

attitude |   -0.02    0.03    0.13 |    1.16    0.68    1.77 |   -3.14   -1.56   -3.14 |    3.14    1.57    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.08   -0.05   -0.05 |    0.08    0.07    0.07
a_f      |    0.03    0.20 |    0.69    1.78 |   -1.50   -3.11 |    1.53    3.14
w_f      |    0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.03   -0.02 |    0.03    0.03    0.02
w_rewards |   -0.39 |    0.31 |   -1.71 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.26 |    0.29 |    0.00 |    3.13
seeker_angles |   -0.00   -0.00 |    0.09    0.08 |   -0.99   -1.00 |    1.00    0.99
cs_angles | -0.0013 -0.0020 |  0.0864  0.0834 | -0.9851 -0.9983 |  0.9981  0.9928
optical_flow |  0.0001 -0.0001 |  0.0261  0.0254 | -1.0175 -1.2258 |  1.1136  0.9728
v_err    | -0.0096 |  0.0547 | -0.4526 |  0.1103
landing_rewards |    9.65 |    1.85 |    0.00 |   10.00
landing_margin |   -0

thrust   |   -0.00    0.00   -0.00 |    0.68    0.68    0.68 |   -3.44   -3.45   -3.45 |    3.46    3.45    3.46
norm_thrust |    0.90 |    0.77 |    0.00 |    3.46
fuel     |    1.55 |    0.18 |    1.14 |    2.17
rewards  |  -19.05 |    6.43 |  -52.55 |   -7.98
fuel_rewards |   -4.43 |    0.52 |   -6.22 |   -3.25
glideslope_rewards |    0.00 |    0.00 |    0.00 |    0.00
glideslope_penalty |    0.00 |    0.00 |    0.00 |    0.00
glideslope |    2.79 |   12.46 |    0.01 |  201.44
norm_af  |    1.71 |    0.91 |    0.04 |    3.26
norm_wf  |    0.01 |    0.01 |    0.00 |    0.03
rh_penalty |    0.00 |    0.00 |    0.00 |    0.00
att_rewards |    0.00 |    0.00 |    0.00 |    0.00
att_penalty |    0.00 |    0.00 |    0.00 |    0.00
attitude |   -0.03   -0.02    0.12 |    1.23    0.65    1.83 |   -3.14   -1.57   -3.14 |    3.14    1.57    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.08   -0.05   -0.05 |    0.09    0.08    0.07
a_f      |   -0.02    0.05 |    0.65

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.0640   0.5458   2.8732  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0016   0.0009   0.0034   6.6368   2.2852   2.4929
Update Cnt = 2280    ET =   1055.1   Stats:  Mean, Std, Min, Max
r_f      |    2.76    7.75   -6.64 |  202.33  167.07  190.04 | -395.64 -363.23 -380.83 |  387.23  392.87  389.00
v_f      |    0.00   -0.00    0.00 |    0.04    0.04    0.05 |   -0.09   -0.09   -0.10 |    0.09    0.10    0.12
r_i      |  -11.52   40.85  -18.72 |  744.72  639.26  732.21 |-1340.54-1283.13-1317.30 | 1277.98 1326.95 1288.42
v_i      |    0.00   -0.00    0.00 |    0.05    0.04    0.05 |   -0.10   -0.09   -0.10 |    0.09    0.10    0.09
norm_rf  |    0.24 |    0.10 |    0.06 |    0.56
norm_vf  |    0.08 |    0.02 |    0.04 |    0.12
gs_f     |    1.10 |    1.52 |    0.01 |   12.19
thrust   |   -0.00    0.00    0.01 |    0.69    0.67    0.68 |   -3.46   -3.45   -3.46 |    3.45    3.44    3.42
norm_thrust |    

ADV1:  0.0019006577627952788 0.009678855329191839 0.05614757623072397 -0.08527563366533393
ADV2:  0.015472764701238104 0.8193528980667398 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.9751   0.9067   4.5157  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0023   0.0014   0.0049   6.6368   2.2852   2.4929
***** Episode 71005, Mean R = -17.8  Std R = 5.6  Min R = -32.5
PolicyLoss: -0.0329
Policy_Beta: 0.0759
Policy_Entropy: 0.157
Policy_KL: 0.000707
Policy_SD: 0.529
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 2.6e+07
VF_0_ExplainedVarNew: 0.981
VF_0_ExplainedVarOld: 0.979
VF_0_Loss : 0.00166


ADV1:  -0.002839992980985054 0.011286684653246358 0.12899861566810844 -0.2119419235849297
ADV2:  0.036146593536945486 0.8211861848530048 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.8081   0.9108   4.6951  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0030   0.0019   0.0074   6.6368   2.2852   2.4

***** Episode 71253, Mean R = -18.4  Std R = 6.7  Min R = -36.0
PolicyLoss: -0.0252
Policy_Beta: 0.0759
Policy_Entropy: 0.155
Policy_KL: 0.00057
Policy_SD: 0.531
Policy_lr_mult: 0.198
Steps: 1.18e+04
TotalSteps: 2.61e+07
VF_0_ExplainedVarNew: 0.991
VF_0_ExplainedVarOld: 0.984
VF_0_Loss : 0.00317


ADV1:  -0.003130915023132039 0.008693267149740273 0.14564979007230916 -0.05464832952959686
ADV2:  0.013255920120931474 0.7822698385571896 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.5925   1.0069   5.0887  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0032   0.0019   0.0083   6.6368   2.2852   2.4929
***** Episode 71284, Mean R = -19.2  Std R = 5.5  Min R = -35.2
PolicyLoss: 0.0122
Policy_Beta: 0.0759
Policy_Entropy: 0.156
Policy_KL: 0.000583
Policy_SD: 0.541
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 2.61e+07
VF_0_ExplainedVarNew: 0.99
VF_0_ExplainedVarOld: 0.984
VF_0_Loss : 0.00192


ADV1:  -0.0007396852848926225 0.009919606126923178

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.7956   1.4768   6.4638  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0014   0.0009   0.0033   6.6368   2.2852   2.4929
***** Episode 71532, Mean R = -16.4  Std R = 4.7  Min R = -27.4
PolicyLoss: -0.011
Policy_Beta: 0.114
Policy_Entropy: 0.156
Policy_KL: 0.00131
Policy_SD: 0.534
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 2.62e+07
VF_0_ExplainedVarNew: 0.992
VF_0_ExplainedVarOld: 0.99
VF_0_Loss : 0.00256


ADV1:  -0.0016511338920777855 0.007813799240779478 0.05165890028659326 -0.07352442523896649
ADV2:  0.030386509819436015 0.8574700752836872 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   3.3510   1.8009   9.3973  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0018   0.0011   0.0043   6.6368   2.2852   2.4929
***** Episode 71563, Mean R = -19.2  Std R = 6.2  Min R = -38.2
PolicyLoss: -0.0185
Policy_Beta: 0.114
Policy_Entropy: 0.154
Policy_KL: 0.00159


ADV1:  0.0002394190609728062 0.008355544555313578 0.05746926498346022 -0.08491070971967206
ADV2:  0.02632395803462917 0.7996421718469924 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.0853   1.1405   5.1025  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0011   0.0006   0.0024   6.6368   2.2852   2.4929
***** Episode 71811, Mean R = -18.0  Std R = 4.9  Min R = -29.6
PolicyLoss: -0.033
Policy_Beta: 0.114
Policy_Entropy: 0.155
Policy_KL: 0.00107
Policy_SD: 0.54
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 2.63e+07
VF_0_ExplainedVarNew: 0.987
VF_0_ExplainedVarOld: 0.985
VF_0_Loss : 0.00208


ADV1:  -0.0007794555219615197 0.008818604436709813 0.08811576632156004 -0.0792946677488631
ADV2:  0.02336634540716187 0.8397039761245029 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.3075   0.6248   3.3341  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0008   0.0005   0.0021   6.6368   2.2852   2.4929


***** Episode 72059, Mean R = -19.4  Std R = 5.7  Min R = -33.9
PolicyLoss: -0.0242
Policy_Beta: 0.114
Policy_Entropy: 0.155
Policy_KL: 0.00128
Policy_SD: 0.55
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 2.64e+07
VF_0_ExplainedVarNew: 0.991
VF_0_ExplainedVarOld: 0.99
VF_0_Loss : 0.00204


ADV1:  0.0003109569008534315 0.008068684834224774 0.08488079405304139 -0.059513099960830346
ADV2:  0.012408767932737728 0.8725902274120618 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.2349   1.4325   7.8353  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0010   0.0006   0.0020   6.6368   2.2852   2.4929
***** Episode 72090, Mean R = -18.5  Std R = 4.8  Min R = -30.2
PolicyLoss: -0.0195
Policy_Beta: 0.114
Policy_Entropy: 0.154
Policy_KL: 0.00147
Policy_SD: 0.553
Policy_lr_mult: 0.198
Steps: 1.15e+04
TotalSteps: 2.64e+07
VF_0_ExplainedVarNew: 0.986
VF_0_ExplainedVarOld: 0.985
VF_0_Loss : 0.00164


ADV1:  -0.0006961533574970844 0.005770368845478539 0

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.8303   0.8539   4.1211  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0034   0.0019   0.0073   6.6368   2.2852   2.4929
***** Episode 72338, Mean R = -17.2  Std R = 4.5  Min R = -29.5
PolicyLoss: -0.028
Policy_Beta: 0.114
Policy_Entropy: 0.158
Policy_KL: 0.00136
Policy_SD: 0.527
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 2.65e+07
VF_0_ExplainedVarNew: 0.986
VF_0_ExplainedVarOld: 0.979
VF_0_Loss : 0.000702


ADV1:  -0.00136882222107114 0.016574105540871006 0.4382892830803758 -0.06715768604449263
ADV2:  -0.02313198711016868 0.6273442466627949 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.1537   0.4066   2.3553  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0014   0.0010   0.0044   6.6368   2.2852   2.4929
***** Episode 72369, Mean R = -18.3  Std R = 5.4  Min R = -34.1
PolicyLoss: 0.0279
Policy_Beta: 0.114
Policy_Entropy: 0.155
Policy_KL: 0.00155
Po

ADV1:  0.0022132776490426734 0.010821161036856724 0.14735140335465435 -0.17533295097404789
ADV2:  0.009066000572669649 0.7952133345310427 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.7307   0.8679   4.3830  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0024   0.0014   0.0057   6.6368   2.2852   2.4929
***** Episode 72617, Mean R = -19.5  Std R = 6.4  Min R = -35.4
PolicyLoss: -0.0249
Policy_Beta: 0.114
Policy_Entropy: 0.155
Policy_KL: 0.0011
Policy_SD: 0.542
Policy_lr_mult: 0.198
Steps: 1.15e+04
TotalSteps: 2.66e+07
VF_0_ExplainedVarNew: 0.98
VF_0_ExplainedVarOld: 0.977
VF_0_Loss : 0.00238


ADV1:  -3.0228294045032835e-05 0.008195882774930694 0.05957321640242691 -0.07720869488177245
ADV2:  0.02110431439881493 0.8551347377126564 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.3768   1.3193   7.0137  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0009   0.0006   0.0022   6.6368   2.2852   2.49

cs_angles |  0.0029  0.0028 |  0.0896  0.0870 | -0.9946 -0.9818 |  0.9792  0.9849
optical_flow | -0.0001  0.0001 |  0.0239  0.0262 | -1.0675 -1.1273 |  1.1298  1.3031
v_err    | -0.0087 |  0.0547 | -0.4522 |  0.1035
landing_rewards |    9.32 |    2.51 |    0.00 |   10.00
landing_margin |   -0.02 |    0.02 |   -0.06 |    0.02
tracking_rewards |  -23.74 |    5.23 |  -49.20 |  -13.68
steps    |     375 |      20 |     332 |     415
***** Episode 72896, Mean R = -17.8  Std R = 4.8  Min R = -31.6
PolicyLoss: -0.019
Policy_Beta: 0.114
Policy_Entropy: 0.157
Policy_KL: 0.00109
Policy_SD: 0.54
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 2.67e+07
VF_0_ExplainedVarNew: 0.988
VF_0_ExplainedVarOld: 0.987
VF_0_Loss : 0.00191


ADV1:  0.00036494151383373785 0.008059578825948144 0.04215889362670515 -0.1427347330467026
ADV2:  0.017699162128798615 0.8263730736342134 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.2164   0.4566   2.1645  23.6511  13.7419   8.3767
ValFun  Gradients: u/

attitude |   -0.08    0.01    0.09 |    1.14    0.66    1.81 |   -3.14   -1.55   -3.14 |    3.14    1.57    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.08   -0.05   -0.05 |    0.09    0.07    0.07
a_f      |    0.01    0.06 |    0.66    1.80 |   -1.43   -3.14 |    1.56    3.14
w_f      |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.02 |    0.03    0.03    0.02
w_rewards |   -0.34 |    0.29 |   -1.80 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.27 |    0.30 |    0.00 |    3.09
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -0.98   -1.00 |    1.00    1.00
cs_angles |  0.0027  0.0008 |  0.0831  0.0846 | -0.9813 -0.9998 |  0.9983  0.9979
optical_flow |  0.0000  0.0002 |  0.0257  0.0251 | -0.9842 -1.0895 |  0.9364  1.0477
v_err    | -0.0090 |  0.0548 | -0.4525 |  0.1113
landing_rewards |    9.39 |    2.40 |    0.00 |   10.00
landing_margin |   -0

attitude |   -0.01    0.00   -0.05 |    1.24    0.64    1.88 |   -3.14   -1.54   -3.14 |    3.14    1.55    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.09   -0.05   -0.05 |    0.07    0.08    0.08
a_f      |   -0.00   -0.10 |    0.63    1.87 |   -1.47   -3.12 |    1.46    3.14
w_f      |    0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.02 |    0.03    0.02    0.03
w_rewards |   -0.33 |    0.29 |   -2.12 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.27 |    0.30 |    0.00 |    3.07
seeker_angles |    0.00   -0.00 |    0.08    0.09 |   -0.94   -1.00 |    1.00    1.00
cs_angles |  0.0038 -0.0005 |  0.0845  0.0878 | -0.9410 -0.9990 |  0.9969  0.9989
optical_flow | -0.0001  0.0001 |  0.0244  0.0250 | -0.9772 -1.1570 |  1.1005  1.2175
v_err    | -0.0088 |  0.0541 | -0.4524 |  0.1170
landing_rewards |    9.23 |    2.67 |    0.00 |   10.00
landing_margin |   -0

attitude |   -0.05   -0.07   -0.06 |    1.19    0.65    1.85 |   -3.14   -1.56   -3.14 |    3.14    1.56    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.09   -0.05   -0.05 |    0.10    0.07    0.08
a_f      |   -0.08   -0.20 |    0.65    1.82 |   -1.47   -3.12 |    1.49    3.11
w_f      |    0.00   -0.00    0.00 |    0.01    0.01    0.01 |   -0.02   -0.02   -0.02 |    0.10    0.02    0.03
w_rewards |   -0.37 |    0.38 |   -2.36 |    0.00
w_penalty |   -0.32 |    5.67 | -100.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.27 |    0.30 |    0.00 |    3.09
seeker_angles |    0.00   -0.00 |    0.08    0.08 |   -1.00   -0.96 |    0.99    1.00
cs_angles |  0.0007 -0.0006 |  0.0836  0.0845 | -0.9984 -0.9581 |  0.9942  0.9962
optical_flow | -0.0000  0.0002 |  0.0250  0.0261 | -1.0819 -0.8152 |  0.9273  1.2817
v_err    | -0.0090 |  0.0551 | -0.4524 |  0.1155
landing_rewards |    9.45 |    2.28 |    0.00 |   10.00
landing_margin |    3

w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.09   -0.05   -0.05 |    0.09    0.08    0.07
a_f      |    0.01    0.04 |    0.64    1.83 |   -1.49   -3.12 |    1.51    3.13
w_f      |    0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.02 |    0.04    0.03    0.02
w_rewards |   -0.42 |    0.42 |   -3.20 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.27 |    0.31 |    0.00 |    3.04
seeker_angles |    0.00    0.00 |    0.09    0.09 |   -0.98   -0.93 |    0.98    1.00
cs_angles |  0.0023  0.0030 |  0.0889  0.0887 | -0.9790 -0.9263 |  0.9839  0.9989
optical_flow | -0.0001  0.0002 |  0.0243  0.0256 | -1.0449 -0.8686 |  0.9066  1.2036
v_err    | -0.0088 |  0.0553 | -0.4639 |  0.1181
landing_rewards |    9.29 |    2.57 |    0.00 |   10.00
landing_margin |   -0.02 |    0.01 |   -0.06 |    0.02
tracking_rewards |  -23.99 |    5.62 |  -49.65 |  -14.56
steps    |     376 |  

norm_thrust |    0.89 |    0.76 |    0.00 |    3.46
fuel     |    1.51 |    0.17 |    1.11 |    1.96
rewards  |  -18.22 |    5.07 |  -33.33 |   -9.40
fuel_rewards |   -4.32 |    0.49 |   -5.63 |   -3.17
glideslope_rewards |    0.00 |    0.00 |    0.00 |    0.00
glideslope_penalty |    0.00 |    0.00 |    0.00 |    0.00
glideslope |    3.02 |   12.58 |    0.01 |  433.50
norm_af  |    1.80 |    0.92 |    0.12 |    3.43
norm_wf  |    0.01 |    0.01 |    0.00 |    0.04
rh_penalty |    0.00 |    0.00 |    0.00 |    0.00
att_rewards |    0.00 |    0.00 |    0.00 |    0.00
att_penalty |    0.00 |    0.00 |    0.00 |    0.00
attitude |   -0.02   -0.02   -0.17 |    1.26    0.59    1.92 |   -3.14   -1.56   -3.14 |    3.14    1.57    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.10   -0.05   -0.05 |    0.08    0.07    0.07
a_f      |   -0.04   -0.17 |    0.61    1.92 |   -1.44   -3.13 |    1.43    3.12
w_f      |    0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.

ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0011   0.0007   0.0025   6.6368   2.2852   2.4929
Update Cnt = 2410    ET =    962.2   Stats:  Mean, Std, Min, Max
r_f      |    5.06   -9.63   -3.70 |  187.20  172.04  211.58 | -390.18 -363.58-1281.69 |  398.18  370.27  373.53
v_f      |    0.00    0.00    0.00 |    0.05    0.04    0.05 |   -0.10   -0.09   -0.09 |    0.10    0.10    0.30
r_i      |   18.74  -35.45   -9.79 |  701.50  655.50  759.33 |-1298.83-1327.12-1365.80 | 1326.95 1290.36 1284.20
v_i      |   -0.00    0.00    0.00 |    0.04    0.04    0.05 |   -0.09   -0.09   -0.10 |    0.10    0.09    0.09
norm_rf  |    3.20 |   52.52 |    0.02 |  926.44
norm_vf  |    0.08 |    0.02 |    0.04 |    0.32
gs_f     |    1.32 |    2.24 |    0.01 |   25.39
thrust   |   -0.00    0.00    0.00 |    0.67    0.68    0.68 |   -3.40   -3.46   -3.46 |    3.46    3.46    3.46
norm_thrust |    0.88 |    0.76 |    0.00 |    3.46
fuel     |    1.53 |    0.20 |    0.19 |    2.08
rewards  |  -18.95 

ADV1:  -0.0001685125752497815 0.011286197300954037 0.14550901454450316 -0.23183758699081736
ADV2:  0.015316812567720316 0.7837521509994423 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.8181   0.9822   5.5945  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0002   0.0001   0.0006   6.6368   2.2852   2.4929
***** Episode 75035, Mean R = -19.3  Std R = 6.2  Min R = -37.0
PolicyLoss: -0.0189
Policy_Beta: 0.114
Policy_Entropy: 0.157
Policy_KL: 0.00171
Policy_SD: 0.535
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 2.75e+07
VF_0_ExplainedVarNew: 0.98
VF_0_ExplainedVarOld: 0.976
VF_0_Loss : 0.000127


ADV1:  0.0010954366692550637 0.0073165321575947555 0.09164035549077187 -0.08628777554416323
ADV2:  -0.01859022240991533 0.8039639716482317 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.5655   1.7860   8.7800  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0014   0.0008   0.0028   6.6368   2.2852   2

***** Episode 75283, Mean R = -19.2  Std R = 6.6  Min R = -35.3
PolicyLoss: -0.0204
Policy_Beta: 0.114
Policy_Entropy: 0.158
Policy_KL: 0.00127
Policy_SD: 0.541
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 2.76e+07
VF_0_ExplainedVarNew: 0.985
VF_0_ExplainedVarOld: 0.974
VF_0_Loss : 0.00018


ADV1:  0.0008614109956586645 0.008533034254823523 0.08625715611036477 -0.06671405193393287
ADV2:  0.0028240787935780356 0.824079143501308 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.4070   0.7813   4.5657  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0017   0.0010   0.0036   6.6368   2.2852   2.4929
***** Episode 75314, Mean R = -18.2  Std R = 5.2  Min R = -29.2
PolicyLoss: -0.0143
Policy_Beta: 0.114
Policy_Entropy: 0.155
Policy_KL: 0.0013
Policy_SD: 0.552
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 2.76e+07
VF_0_ExplainedVarNew: 0.986
VF_0_ExplainedVarOld: 0.984
VF_0_Loss : 7.13e-05


ADV1:  -0.00023603368956385615 0.008062227290136968

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.0064   1.0136   5.6264  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0037   0.0020   0.0075   6.6368   2.2852   2.4929
***** Episode 75562, Mean R = -17.8  Std R = 3.8  Min R = -24.9
PolicyLoss: -0.00155
Policy_Beta: 0.114
Policy_Entropy: 0.154
Policy_KL: 0.00115
Policy_SD: 0.543
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 2.77e+07
VF_0_ExplainedVarNew: 0.99
VF_0_ExplainedVarOld: 0.984
VF_0_Loss : 4.79e-05


ADV1:  0.0006487810958577439 0.010125147037062862 0.05147615003715017 -0.0742369853528535
ADV2:  0.021615330987718437 0.834566742019817 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.9351   1.3952   6.1098  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0008   0.0005   0.0018   6.6368   2.2852   2.4929
***** Episode 75593, Mean R = -19.3  Std R = 5.4  Min R = -32.1
PolicyLoss: -0.0319
Policy_Beta: 0.114
Policy_Entropy: 0.153
Policy_KL: 0.00113


ADV1:  -0.00356066739731477 0.011576796777241629 0.05920220442239005 -0.06609881999650317
ADV2:  0.032797510265335075 0.91168177571182 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.1169   1.3053   6.2000  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0042   0.0026   0.0093   6.6368   2.2852   2.4929
***** Episode 75841, Mean R = -18.4  Std R = 6.7  Min R = -37.0
PolicyLoss: -0.0153
Policy_Beta: 0.114
Policy_Entropy: 0.155
Policy_KL: 0.00159
Policy_SD: 0.536
Policy_lr_mult: 0.198
Steps: 1.19e+04
TotalSteps: 2.78e+07
VF_0_ExplainedVarNew: 0.972
VF_0_ExplainedVarOld: 0.969
VF_0_Loss : 0.000208


ADV1:  -0.0011131216169547571 0.02104326167501289 0.0468361078172837 -0.508306931523963
ADV2:  0.035688038344055116 0.5059680136854727 2.2096768504056423 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.6278   0.2850   1.3878  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0015   0.0007   0.0030   6.6368   2.

***** Episode 76089, Mean R = -19.5  Std R = 5.0  Min R = -29.4
PolicyLoss: -0.0165
Policy_Beta: 0.114
Policy_Entropy: 0.153
Policy_KL: 0.000978
Policy_SD: 0.55
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 2.79e+07
VF_0_ExplainedVarNew: 0.98
VF_0_ExplainedVarOld: 0.977
VF_0_Loss : 9.97e-05


ADV1:  0.0012660994036190023 0.007935786707888186 0.08280726618118195 -0.17415582387606454
ADV2:  0.007950575774741078 0.7565942820000752 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.1369   1.0034   5.8045  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0014   0.0008   0.0033   6.6368   2.2852   2.4929
***** Episode 76120, Mean R = -18.2  Std R = 5.4  Min R = -32.0
PolicyLoss: -0.0209
Policy_Beta: 0.114
Policy_Entropy: 0.155
Policy_KL: 0.00156
Policy_SD: 0.539
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 2.79e+07
VF_0_ExplainedVarNew: 0.99
VF_0_ExplainedVarOld: 0.988
VF_0_Loss : 5.18e-05


Dynamics: Max Disturbance (m/s^2):  [0.00126622 0.0

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.5868   0.5900   3.1973  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0004   0.0002   0.0008   6.6368   2.2852   2.4929
***** Episode 76368, Mean R = -18.3  Std R = 5.0  Min R = -30.9
PolicyLoss: -0.0256
Policy_Beta: 0.114
Policy_Entropy: 0.154
Policy_KL: 0.00116
Policy_SD: 0.541
Policy_lr_mult: 0.198
Steps: 1.15e+04
TotalSteps: 2.8e+07
VF_0_ExplainedVarNew: 0.987
VF_0_ExplainedVarOld: 0.985
VF_0_Loss : 9.2e-05


ADV1:  -0.0015228263473767987 0.011351169122633724 0.07785632638858475 -0.23809165241926256
ADV2:  0.02868187521658693 0.7562981461067823 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.9141   0.9411   4.9714  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0022   0.0012   0.0048   6.6368   2.2852   2.4929
***** Episode 76399, Mean R = -18.0  Std R = 4.2  Min R = -29.1
PolicyLoss: -0.022
Policy_Beta: 0.114
Policy_Entropy: 0.158
Policy_KL: 0.00159
P

ADV1:  -0.0026055773968419577 0.011541264548598927 0.06219655245049566 -0.31287028424784735
ADV2:  0.03142479376108746 0.774186505181993 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.3233   0.7073   3.4500  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0029   0.0017   0.0068   6.6368   2.2852   2.4929
***** Episode 76647, Mean R = -18.5  Std R = 4.9  Min R = -34.8
PolicyLoss: -0.02
Policy_Beta: 0.114
Policy_Entropy: 0.156
Policy_KL: 0.0012
Policy_SD: 0.533
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 2.81e+07
VF_0_ExplainedVarNew: 0.978
VF_0_ExplainedVarOld: 0.973
VF_0_Loss : 0.000158


ADV1:  0.00013321734091043853 0.010383273186909675 0.32389692472854026 -0.0940701936923008
ADV2:  -0.0018772485698339237 0.7951390391121118 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.3243   0.6941   3.7418  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0011   0.0006   0.0026   6.6368   2.2852   2.49

theta_cv |    0.27 |    0.30 |    0.00 |    3.01
seeker_angles |   -0.00   -0.00 |    0.08    0.09 |   -0.99   -1.00 |    0.99    0.98
cs_angles | -0.0003 -0.0002 |  0.0842  0.0866 | -0.9870 -0.9983 |  0.9906  0.9817
optical_flow |  0.0001  0.0001 |  0.0244  0.0246 | -1.0019 -0.9697 |  1.1111  1.1068
v_err    | -0.0089 |  0.0555 | -0.4915 |  0.1184
landing_rewards |    9.35 |    2.46 |    0.00 |   10.00
landing_margin |   -0.02 |    0.01 |   -0.06 |    0.03
tracking_rewards |  -23.25 |    4.34 |  -41.90 |  -14.35
steps    |     376 |      21 |     334 |     418
***** Episode 76926, Mean R = -17.7  Std R = 5.3  Min R = -31.4
PolicyLoss: -0.0219
Policy_Beta: 0.114
Policy_Entropy: 0.157
Policy_KL: 0.00145
Policy_SD: 0.54
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 2.82e+07
VF_0_ExplainedVarNew: 0.989
VF_0_ExplainedVarOld: 0.988
VF_0_Loss : 5.38e-05


Dynamics: Max Disturbance (m/s^2):  [0.00126622 0.00130788 0.00159816] 0.002422386686932909
ADV1:  -0.005999366125338468 0.11791048296

w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.10   -0.05   -0.05 |    0.08    0.07    0.07
a_f      |    0.03    0.03 |    0.63    1.85 |   -1.49   -3.13 |    1.48    3.12
w_f      |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.10   -0.02   -0.05 |    0.04    0.03    0.01
w_rewards |   -0.36 |    0.34 |   -2.91 |    0.00
w_penalty |   -0.32 |    5.67 | -100.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.27 |    0.30 |    0.00 |    3.12
seeker_angles |    0.00    0.00 |    0.09    0.08 |   -0.99   -0.99 |    1.00    1.00
cs_angles |  0.0029  0.0025 |  0.0878  0.0835 | -0.9949 -0.9852 |  0.9969  0.9998
optical_flow |  0.0001  0.0000 |  0.0251  0.0253 | -1.1365 -1.0209 |  1.1564  1.2920
v_err    | -0.0091 |  0.0550 | -0.4532 |  0.1085
landing_rewards |    9.39 |    2.40 |    0.00 |   10.00
landing_margin |    2.74 |   48.56 |   -0.06 |  856.34
tracking_rewards |  -23.17 |    4.54 |  -39.76 |  -10.90
steps    |     375 |  

thrust   |   -0.00   -0.00   -0.00 |    0.69    0.68    0.71 |   -3.42   -3.43   -3.43 |    3.45    3.46    3.45
norm_thrust |    0.92 |    0.77 |    0.00 |    3.46
fuel     |    1.56 |    0.20 |    1.11 |    2.26
rewards  |  -18.46 |    5.36 |  -36.21 |   -8.97
fuel_rewards |   -4.48 |    0.56 |   -6.47 |   -3.19
glideslope_rewards |    0.00 |    0.00 |    0.00 |    0.00
glideslope_penalty |    0.00 |    0.00 |    0.00 |    0.00
glideslope |    2.86 |   13.11 |    0.01 |  772.71
norm_af  |    1.76 |    0.88 |    0.07 |    3.27
norm_wf  |    0.01 |    0.01 |    0.00 |    0.04
rh_penalty |    0.00 |    0.00 |    0.00 |    0.00
att_rewards |    0.00 |    0.00 |    0.00 |    0.00
att_penalty |    0.00 |    0.00 |    0.00 |    0.00
attitude |   -0.07   -0.02   -0.16 |    1.15    0.66    1.84 |   -3.14   -1.56   -3.14 |    3.14    1.57    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.08   -0.05   -0.05 |    0.10    0.07    0.07
a_f      |   -0.03   -0.21 |    0.67

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   3.2654   1.6668   8.9986  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0031   0.0019   0.0082   6.6368   2.2852   2.4929
Update Cnt = 2510    ET =   1066.1   Stats:  Mean, Std, Min, Max
r_f      |   -2.01   19.96  -12.90 |  177.79  168.34  204.89 | -397.99 -387.87 -393.88 |  382.57  374.84  387.14
v_f      |    0.00   -0.00    0.00 |    0.04    0.04    0.05 |   -0.11   -0.11   -0.12 |    0.10    0.10    0.10
r_i      |    1.85   44.96  -37.94 |  678.28  639.34  785.29 |-1290.04-1266.70-1326.54 | 1313.19 1274.80 1344.50
v_i      |   -0.00   -0.00    0.00 |    0.04    0.04    0.05 |   -0.09   -0.09   -0.10 |    0.10    0.09    0.10
norm_rf  |    0.23 |    0.09 |    0.02 |    0.46
norm_vf  |    0.08 |    0.01 |    0.04 |    0.13
gs_f     |    1.30 |    1.75 |    0.02 |   19.27
thrust   |   -0.00   -0.00    0.00 |    0.69    0.69    0.70 |   -3.45   -3.42   -3.46 |    3.45    3.44    3.43
norm_thrust |    

ADV1:  0.0016839206217697422 0.008052399110720995 0.05643846354482379 -0.09204224536079797
ADV2:  0.0073238462072183095 0.8265495838169872 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   6.8184   2.7026  11.8509  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0027   0.0016   0.0055   6.6368   2.2852   2.4929
***** Episode 78135, Mean R = -17.7  Std R = 5.2  Min R = -30.5
PolicyLoss: -0.0267
Policy_Beta: 0.0759
Policy_Entropy: 0.16
Policy_KL: 0.000852
Policy_SD: 0.538
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 2.87e+07
VF_0_ExplainedVarNew: 0.988
VF_0_ExplainedVarOld: 0.986
VF_0_Loss : 0.000207


ADV1:  -0.0014338238935860538 0.00871093390779336 0.04863404696251855 -0.0835477877311803
ADV2:  0.03499006338998129 0.8473298595095752 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   5.3170   3.2721  11.4732  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0015   0.0009   0.0037   6.6368   2.2852   2.

***** Episode 78383, Mean R = -18.5  Std R = 5.8  Min R = -37.7
PolicyLoss: -0.0249
Policy_Beta: 0.114
Policy_Entropy: 0.156
Policy_KL: 0.00158
Policy_SD: 0.549
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 2.87e+07
VF_0_ExplainedVarNew: 0.984
VF_0_ExplainedVarOld: 0.981
VF_0_Loss : 0.000293


ADV1:  0.0022869960845805595 0.0068192630288511115 0.09661579097783801 -0.05467811613430307
ADV2:  -0.030182008141348336 0.8778922526756132 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.3062   1.4722   8.0796  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0029   0.0017   0.0062   6.6368   2.2852   2.4929
***** Episode 78414, Mean R = -18.6  Std R = 6.5  Min R = -35.1
PolicyLoss: -0.00304
Policy_Beta: 0.114
Policy_Entropy: 0.156
Policy_KL: 0.00153
Policy_SD: 0.552
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 2.88e+07
VF_0_ExplainedVarNew: 0.993
VF_0_ExplainedVarOld: 0.991
VF_0_Loss : 0.000185


ADV1:  -0.003048223357193954 0.010037006620270

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.4659   0.6971   4.1814  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0026   0.0016   0.0058   6.6368   2.2852   2.4929
***** Episode 78662, Mean R = -18.1  Std R = 5.3  Min R = -33.3
PolicyLoss: -0.0172
Policy_Beta: 0.114
Policy_Entropy: 0.157
Policy_KL: 0.00186
Policy_SD: 0.54
Policy_lr_mult: 0.198
Steps: 1.15e+04
TotalSteps: 2.88e+07
VF_0_ExplainedVarNew: 0.99
VF_0_ExplainedVarOld: 0.988
VF_0_Loss : 0.000128


ADV1:  -0.0009518692946867751 0.009904485012515491 0.05515015958571645 -0.08726728769417433
ADV2:  0.03212625376324256 0.8237666011945569 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.7873   1.0477   4.3424  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0011   0.0006   0.0025   6.6368   2.2852   2.4929
***** Episode 78693, Mean R = -17.2  Std R = 5.5  Min R = -34.6
PolicyLoss: -0.0299
Policy_Beta: 0.114
Policy_Entropy: 0.157
Policy_KL: 0.00128


ADV1:  -0.0004370000348144643 0.009154856005583184 0.042536727097631954 -0.07689849530895998
ADV2:  0.02411874421656673 0.8648081595711954 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.8931   0.8215   4.4031  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0010   0.0005   0.0020   6.6368   2.2852   2.4929
***** Episode 78941, Mean R = -17.4  Std R = 5.6  Min R = -32.6
PolicyLoss: -0.0257
Policy_Beta: 0.114
Policy_Entropy: 0.158
Policy_KL: 0.00153
Policy_SD: 0.531
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 2.9e+07
VF_0_ExplainedVarNew: 0.983
VF_0_ExplainedVarOld: 0.98
VF_0_Loss : 0.000478


ADV1:  -0.002780536362277795 0.011037985279101574 0.18673019449425543 -0.08151668493801323
ADV2:  0.03057708914866955 0.8543216397906153 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.9877   0.7831   4.1643  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0034   0.0020   0.0072   6.6368   2.2852   2.49

ADV1:  0.0004311420652335599 0.00871048723688017 0.053109475847335996 -0.05424942645114669
ADV2:  0.016443563740887002 0.8448483935787066 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.8692   1.0647   5.1603  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0007   0.0004   0.0015   6.6368   2.2852   2.4929
***** Episode 79220, Mean R = -19.1  Std R = 4.8  Min R = -33.6
PolicyLoss: -0.0241
Policy_Beta: 0.114
Policy_Entropy: 0.158
Policy_KL: 0.00121
Policy_SD: 0.552
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 2.91e+07
VF_0_ExplainedVarNew: 0.986
VF_0_ExplainedVarOld: 0.985
VF_0_Loss : 0.000724


ADV1:  0.0008541193196647804 0.007602277419283022 0.06056169781588161 -0.06512157535518823
ADV2:  0.015144956621512782 0.8505767764632582 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.2849   1.0607   5.5169  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0010   0.0006   0.0022   6.6368   2.2852   2.

***** Episode 79468, Mean R = -17.6  Std R = 4.3  Min R = -31.9
PolicyLoss: -0.0261
Policy_Beta: 0.114
Policy_Entropy: 0.158
Policy_KL: 0.00157
Policy_SD: 0.537
Policy_lr_mult: 0.198
Steps: 1.15e+04
TotalSteps: 2.92e+07
VF_0_ExplainedVarNew: 0.987
VF_0_ExplainedVarOld: 0.986
VF_0_Loss : 0.000812


ADV1:  -0.002409028866281267 0.007842343949381436 0.06382470564372844 -0.07172870707218715
ADV2:  0.025971392446782388 0.864499435859303 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.2804   0.6090   2.8247  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0032   0.0019   0.0064   6.6368   2.2852   2.4929
***** Episode 79499, Mean R = -18.3  Std R = 5.1  Min R = -33.3
PolicyLoss: -0.00903
Policy_Beta: 0.114
Policy_Entropy: 0.158
Policy_KL: 0.00115
Policy_SD: 0.541
Policy_lr_mult: 0.198
Steps: 1.18e+04
TotalSteps: 2.92e+07
VF_0_ExplainedVarNew: 0.989
VF_0_ExplainedVarOld: 0.987
VF_0_Loss : 0.00067


ADV1:  0.0029128915699328504 0.006432153811852276 

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.0360   1.3391   6.8704  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0033   0.0020   0.0072   6.6368   2.2852   2.4929
***** Episode 79747, Mean R = -17.6  Std R = 5.0  Min R = -35.2
PolicyLoss: -0.00784
Policy_Beta: 0.114
Policy_Entropy: 0.159
Policy_KL: 0.000815
Policy_SD: 0.521
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 2.93e+07
VF_0_ExplainedVarNew: 0.985
VF_0_ExplainedVarOld: 0.981
VF_0_Loss : 0.000557


ADV1:  0.004741178350889729 0.006364925846278035 0.07895126228851895 -0.04820516450808143
ADV2:  -0.059704495015187625 0.913156714187075 3.0 -3.0
 *** BROKE ***   18 0.00427712919190526
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   7.4880   5.3037  17.1474  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0053   0.0032   0.0124   6.6368   2.2852   2.4929
***** Episode 79778, Mean R = -17.4  Std R = 4.9  Min R = -28.7
PolicyLoss: -0.000785
Policy_Beta: 0.

optical_flow |  0.0000  0.0001 |  0.0244  0.0243 | -1.2857 -1.1525 |  1.1807  0.8357
v_err    | -0.0089 |  0.0548 | -0.4534 |  0.1122
landing_rewards |    9.55 |    2.08 |    0.00 |   10.00
landing_margin |   -0.02 |    0.01 |   -0.07 |    0.03
tracking_rewards |  -22.44 |    4.55 |  -36.80 |  -14.54
steps    |     376 |      19 |     332 |     418
***** Episode 80026, Mean R = -17.0  Std R = 4.6  Min R = -29.9
PolicyLoss: -0.00692
Policy_Beta: 0.0759
Policy_Entropy: 0.162
Policy_KL: 0.000891
Policy_SD: 0.531
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 2.94e+07
VF_0_ExplainedVarNew: 0.992
VF_0_ExplainedVarOld: 0.99
VF_0_Loss : 0.000781


ADV1:  -0.0009343749751217961 0.012123907255683467 0.2251636051622482 -0.203847085245339
ADV2:  0.018899192118968684 0.7384591335149737 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.9395   0.6978   3.7076  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0011   0.0006   0.0024   6.6368   2.2852   2.49

attitude |    0.02   -0.01   -0.07 |    1.24    0.64    1.88 |   -3.14   -1.55   -3.14 |    3.14    1.55    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.09   -0.05   -0.07 |    0.09    0.07    0.07
a_f      |   -0.01   -0.07 |    0.65    1.87 |   -1.49   -3.14 |    1.42    3.12
w_f      |    0.00   -0.00   -0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.02 |    0.04    0.02    0.02
w_rewards |   -0.34 |    0.32 |   -2.37 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.27 |    0.31 |    0.00 |    3.04
seeker_angles |    0.00    0.00 |    0.08    0.09 |   -1.00   -0.98 |    0.99    0.99
cs_angles |  0.0002  0.0025 |  0.0839  0.0870 | -0.9956 -0.9841 |  0.9888  0.9907
optical_flow |  0.0002  0.0001 |  0.0244  0.0242 | -1.1127 -1.0360 |  1.0325  1.2429
v_err    | -0.0092 |  0.0550 | -0.4524 |  0.1138
landing_rewards |    9.32 |    2.51 |    0.00 |   10.00
landing_margin |   -0

attitude |   -0.05    0.02    0.00 |    1.24    0.69    1.84 |   -3.14   -1.56   -3.14 |    3.14    1.55    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.09   -0.05   -0.05 |    0.08    0.07    0.07
a_f      |    0.02   -0.07 |    0.68    1.85 |   -1.51   -3.14 |    1.51    3.14
w_f      |    0.00   -0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.02 |    0.04    0.02    0.02
w_rewards |   -0.36 |    0.30 |   -1.96 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.26 |    0.30 |    0.00 |    2.91
seeker_angles |    0.00    0.00 |    0.09    0.08 |   -1.00   -1.00 |    0.99    0.99
cs_angles |  0.0002  0.0021 |  0.0867  0.0833 | -0.9992 -0.9984 |  0.9897  0.9855
optical_flow | -0.0001  0.0001 |  0.0254  0.0255 | -1.1891 -1.1088 |  1.2799  1.2047
v_err    | -0.0090 |  0.0548 | -0.4543 |  0.1120
landing_rewards |    9.32 |    2.51 |    0.00 |   10.00
landing_margin |   -0

thrust   |   -0.00   -0.00    0.00 |    0.67    0.68    0.69 |   -3.44   -3.46   -3.43 |    3.45    3.32    3.46
norm_thrust |    0.90 |    0.77 |    0.00 |    3.46
fuel     |    1.54 |    0.19 |    1.13 |    2.39
rewards  |  -17.95 |    5.42 |  -37.21 |   -8.38
fuel_rewards |   -4.41 |    0.54 |   -6.86 |   -3.24
glideslope_rewards |    0.00 |    0.00 |    0.00 |    0.00
glideslope_penalty |    0.00 |    0.00 |    0.00 |    0.00
glideslope |    2.83 |   12.65 |    0.01 |  256.70
norm_af  |    1.83 |    0.88 |    0.03 |    3.29
norm_wf  |    0.02 |    0.01 |    0.00 |    0.04
rh_penalty |    0.00 |    0.00 |    0.00 |    0.00
att_rewards |    0.00 |    0.00 |    0.00 |    0.00
att_penalty |    0.00 |    0.00 |    0.00 |    0.00
attitude |    0.01   -0.01   -0.16 |    1.25    0.68    1.91 |   -3.14   -1.57   -3.14 |    3.14    1.56    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.08   -0.05   -0.05 |    0.07    0.08    0.07
a_f      |   -0.02   -0.16 |    0.69

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.7050   0.7155   3.3808  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0012   0.0007   0.0028   6.6368   2.2852   2.4929
Update Cnt = 2620    ET =   1105.7   Stats:  Mean, Std, Min, Max
r_f      |    1.53    6.54   12.58 |  177.27  168.35  213.27 | -507.05 -379.51 -394.06 |  366.98  735.61  913.32
v_f      |   -0.00    0.00    0.00 |    0.04    0.05    0.06 |   -0.10   -0.11   -0.10 |    0.13    0.30    0.65
r_i      |   10.25    0.68   16.78 |  666.12  658.06  771.48 |-1262.32-1335.87-1327.85 | 1270.09 1224.12 1311.77
v_i      |   -0.00    0.00   -0.00 |    0.04    0.04    0.05 |   -0.08   -0.09   -0.10 |    0.09    0.09    0.09
norm_rf  |    3.46 |   57.18 |    0.03 | 1008.52
norm_vf  |    0.08 |    0.04 |    0.04 |    0.73
gs_f     |    1.37 |    2.44 |    0.01 |   31.10
thrust   |   -0.00   -0.00   -0.00 |    0.68    0.69    0.68 |   -3.34   -3.45   -3.46 |    3.45    3.45    3.46
norm_thrust |    

ADV1:  0.002495702857525445 0.009809002460166569 0.16241128716674025 -0.07046682570131353
ADV2:  -0.014147524917282267 0.8327250542185216 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.4677   0.8907   4.7214  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0028   0.0017   0.0064   6.6368   2.2852   2.4929
***** Episode 81545, Mean R = -19.1  Std R = 5.5  Min R = -33.3
PolicyLoss: -0.0058
Policy_Beta: 0.114
Policy_Entropy: 0.159
Policy_KL: 0.00137
Policy_SD: 0.543
Policy_lr_mult: 0.198
Steps: 1.19e+04
TotalSteps: 2.99e+07
VF_0_ExplainedVarNew: 0.985
VF_0_ExplainedVarOld: 0.98
VF_0_Loss : 0.000408


ADV1:  -0.0015342845966837524 0.010160961159215293 0.0561504242930998 -0.1232853465275443
ADV2:  0.04086847690011339 0.8125270975608737 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.8842   0.8778   3.8432  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0021   0.0012   0.0048   6.6368   2.2852   2.492

ADV1:  -0.0025481935348618343 0.012625927074041582 0.08982450044078855 -0.09471452982575634
ADV2:  0.02039699938954202 0.9183402032134648 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.4220   1.0827   4.8280  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0029   0.0018   0.0067   6.6368   2.2852   2.4929
***** Episode 81824, Mean R = -22.1  Std R = 7.7  Min R = -40.4
PolicyLoss: -0.00906
Policy_Beta: 0.114
Policy_Entropy: 0.157
Policy_KL: 0.00171
Policy_SD: 0.563
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 3e+07
VF_0_ExplainedVarNew: 0.975
VF_0_ExplainedVarOld: 0.973
VF_0_Loss : 0.000212


ADV1:  0.005557284495289801 0.008914362109498612 0.06112119330180782 -0.06975594283330999
ADV2:  -0.0320263530886862 0.9108862794806848 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   5.2518   3.7494  13.7314  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0064   0.0038   0.0144   6.6368   2.2852   2.4929

***** Episode 82072, Mean R = -19.0  Std R = 6.7  Min R = -38.4
PolicyLoss: -0.00939
Policy_Beta: 0.0759
Policy_Entropy: 0.159
Policy_KL: 0.000587
Policy_SD: 0.547
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 3.01e+07
VF_0_ExplainedVarNew: 0.983
VF_0_ExplainedVarOld: 0.975
VF_0_Loss : 0.00015


ADV1:  -0.001352199518638656 0.011364425679731014 0.08530881524972062 -0.07499316107884796
ADV2:  0.014852363430362819 0.9300949756546151 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   4.1963   1.4809   7.9156  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0019   0.0011   0.0043   6.6368   2.2852   2.4929
***** Episode 82103, Mean R = -18.8  Std R = 5.6  Min R = -32.1
PolicyLoss: -0.0103
Policy_Beta: 0.0759
Policy_Entropy: 0.159
Policy_KL: 0.000642
Policy_SD: 0.544
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 3.01e+07
VF_0_ExplainedVarNew: 0.97
VF_0_ExplainedVarOld: 0.97
VF_0_Loss : 0.000264


ADV1:  0.004391047377348218 0.00912266661787429

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.2944   0.9884   4.5121  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0008   0.0005   0.0019   6.6368   2.2852   2.4929
***** Episode 82351, Mean R = -17.3  Std R = 4.4  Min R = -27.3
PolicyLoss: -0.0151
Policy_Beta: 0.114
Policy_Entropy: 0.159
Policy_KL: 0.000482
Policy_SD: 0.54
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 3.02e+07
VF_0_ExplainedVarNew: 0.991
VF_0_ExplainedVarOld: 0.99
VF_0_Loss : 8.13e-05


ADV1:  -0.0021111970543546466 0.010048518254417172 0.11107128427504898 -0.09821646465257977
ADV2:  0.04009504993826927 0.8275392451882767 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.9116   0.9033   4.4402  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0026   0.0016   0.0056   6.6368   2.2852   2.4929
***** Episode 82382, Mean R = -20.0  Std R = 5.4  Min R = -33.3
PolicyLoss: -0.0281
Policy_Beta: 0.114
Policy_Entropy: 0.157
Policy_KL: 0.00123

ADV1:  -0.0021211294928873696 0.01092850623215869 0.04260719665957097 -0.12790525742506997
ADV2:  0.03716496850509553 0.8480065061077361 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.1131   1.2241   5.6702  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0031   0.0018   0.0071   6.6368   2.2852   2.4929
***** Episode 82630, Mean R = -17.6  Std R = 4.9  Min R = -31.5
PolicyLoss: -0.0274
Policy_Beta: 0.114
Policy_Entropy: 0.16
Policy_KL: 0.00128
Policy_SD: 0.54
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 3.03e+07
VF_0_ExplainedVarNew: 0.974
VF_0_ExplainedVarOld: 0.972
VF_0_Loss : 0.000163


ADV1:  0.0001370668358439061 0.010850325654153614 0.063099037007732 -0.15622147033982337
ADV2:  0.02493095876676009 0.7897697364600837 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.2870   0.4951   2.5146  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0013   0.0007   0.0027   6.6368   2.2852   2.4929
*

***** Episode 82878, Mean R = -18.7  Std R = 6.2  Min R = -39.6
PolicyLoss: -0.0189
Policy_Beta: 0.114
Policy_Entropy: 0.16
Policy_KL: 0.00135
Policy_SD: 0.544
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 3.04e+07
VF_0_ExplainedVarNew: 0.983
VF_0_ExplainedVarOld: 0.978
VF_0_Loss : 9.11e-05


ADV1:  0.0011645216875001909 0.008131211941627196 0.03674796334856578 -0.10962831442972198
ADV2:  0.013193676258620581 0.8445603574104218 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.0047   1.1469   5.8681  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0012   0.0008   0.0031   6.6368   2.2852   2.4929
***** Episode 82909, Mean R = -17.2  Std R = 4.1  Min R = -31.5
PolicyLoss: -0.028
Policy_Beta: 0.114
Policy_Entropy: 0.159
Policy_KL: 0.00119
Policy_SD: 0.534
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 3.04e+07
VF_0_ExplainedVarNew: 0.986
VF_0_ExplainedVarOld: 0.984
VF_0_Loss : 6.07e-05


ADV1:  0.0020782414818559937 0.010164397371259857 0

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.5650   0.6711   3.2343  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0030   0.0018   0.0074   6.6368   2.2852   2.4929
***** Episode 83157, Mean R = -18.3  Std R = 5.3  Min R = -31.4
PolicyLoss: -0.0229
Policy_Beta: 0.114
Policy_Entropy: 0.16
Policy_KL: 0.001
Policy_SD: 0.543
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 3.05e+07
VF_0_ExplainedVarNew: 0.98
VF_0_ExplainedVarOld: 0.976
VF_0_Loss : 0.000103


ADV1:  -0.0015135886522188895 0.008568697866199083 0.0780768124486837 -0.11519413813076917
ADV2:  0.03751218808585128 0.7944794869417761 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.5578   0.8991   3.8274  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0015   0.0009   0.0039   6.6368   2.2852   2.4929
***** Episode 83188, Mean R = -17.7  Std R = 4.6  Min R = -34.3
PolicyLoss: -0.0302
Policy_Beta: 0.114
Policy_Entropy: 0.159
Policy_KL: 0.00133
Pol

cs_angles |  0.0007  0.0025 |  0.0856  0.0861 | -0.9773 -0.9899 |  0.9879  0.9932
optical_flow |  0.0000  0.0001 |  0.0238  0.0240 | -1.0623 -0.9665 |  1.1096  1.0729
v_err    | -0.0094 |  0.0551 | -0.4527 |  0.1108
landing_rewards |    9.65 |    1.85 |    0.00 |   10.00
landing_margin |   -0.02 |    0.01 |   -0.07 |    0.02
tracking_rewards |  -23.28 |    4.98 |  -50.48 |  -15.21
steps    |     379 |      20 |     335 |     426
***** Episode 83436, Mean R = -18.6  Std R = 5.4  Min R = -30.7
PolicyLoss: -0.0262
Policy_Beta: 0.0759
Policy_Entropy: 0.162
Policy_KL: 0.000873
Policy_SD: 0.535
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 3.06e+07
VF_0_ExplainedVarNew: 0.99
VF_0_ExplainedVarOld: 0.989
VF_0_Loss : 5.82e-05


ADV1:  -0.002985509456718842 0.009050726394388196 0.04815757857745134 -0.08277835356001673
ADV2:  0.04605843104058593 0.8361370566119506 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.5414   0.7926   4.1832  23.6511  13.7419   8.3767
ValFun  Gradients:

attitude |    0.01   -0.01    0.02 |    1.21    0.66    1.85 |   -3.14   -1.57   -3.14 |    3.14    1.55    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.09   -0.05   -0.05 |    0.08    0.08    0.07
a_f      |   -0.02   -0.06 |    0.66    1.86 |   -1.50   -3.13 |    1.40    3.14
w_f      |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.02   -0.03   -0.02 |    0.03    0.02    0.02
w_rewards |   -0.32 |    0.30 |   -2.05 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.26 |    0.31 |    0.00 |    2.99
seeker_angles |    0.00   -0.00 |    0.08    0.09 |   -0.99   -1.00 |    0.95    0.99
cs_angles |  0.0004 -0.0004 |  0.0826  0.0861 | -0.9870 -0.9979 |  0.9516  0.9852
optical_flow | -0.0001  0.0001 |  0.0235  0.0250 | -1.1738 -1.2564 |  1.1218  1.0805
v_err    | -0.0094 |  0.0551 | -0.4527 |  0.1444
landing_rewards |    9.45 |    2.28 |    0.00 |   10.00
landing_margin |   -0

attitude |    0.02   -0.03    0.09 |    1.13    0.62    1.82 |   -3.14   -1.56   -3.14 |    3.14    1.57    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.09   -0.05   -0.05 |    0.08    0.08    0.07
a_f      |   -0.03    0.09 |    0.62    1.83 |   -1.44   -3.14 |    1.40    3.13
w_f      |    0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.02 |    0.03    0.03    0.01
w_rewards |   -0.33 |    0.26 |   -1.68 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.27 |    0.31 |    0.00 |    3.03
seeker_angles |    0.00    0.00 |    0.08    0.09 |   -1.00   -0.99 |    0.92    0.99
cs_angles |  0.0005  0.0006 |  0.0850  0.0884 | -0.9997 -0.9926 |  0.9242  0.9946
optical_flow | -0.0000 -0.0001 |  0.0249  0.0253 | -1.0805 -1.1891 |  0.9699  1.2939
v_err    | -0.0089 |  0.0548 | -0.4528 |  0.1521
landing_rewards |    9.58 |    2.00 |    0.00 |   10.00
landing_margin |   -0

attitude |    0.05   -0.00   -0.03 |    1.17    0.65    1.83 |   -3.14   -1.57   -3.14 |    3.14    1.54    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.08   -0.05   -0.05 |    0.10    0.07    0.07
a_f      |   -0.01   -0.02 |    0.66    1.84 |   -1.57   -3.12 |    1.45    3.13
w_f      |    0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.02 |    0.03    0.02    0.02
w_rewards |   -0.35 |    0.32 |   -3.13 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.27 |    0.32 |    0.00 |    2.94
seeker_angles |    0.00    0.00 |    0.09    0.09 |   -1.00   -0.99 |    1.00    0.99
cs_angles |  0.0015  0.0039 |  0.0858  0.0857 | -0.9990 -0.9910 |  0.9982  0.9863
optical_flow | -0.0001  0.0001 |  0.0246  0.0258 | -1.2266 -1.1296 |  1.0081  1.0459
v_err    | -0.0086 |  0.0548 | -0.4535 |  0.1138
landing_rewards |    9.42 |    2.34 |    0.00 |   10.00
landing_margin |   -0

thrust   |   -0.00   -0.01    0.00 |    0.68    0.68    0.68 |   -3.46   -3.46   -3.46 |    3.46    3.45    3.46
norm_thrust |    0.89 |    0.77 |    0.00 |    3.46
fuel     |    1.53 |    0.19 |    1.04 |    2.10
rewards  |  -18.26 |    5.80 |  -39.66 |   -7.58
fuel_rewards |   -4.37 |    0.54 |   -6.01 |   -2.98
glideslope_rewards |    0.00 |    0.00 |    0.00 |    0.00
glideslope_penalty |    0.00 |    0.00 |    0.00 |    0.00
glideslope |    2.89 |   12.58 |    0.01 |  579.59
norm_af  |    1.78 |    0.89 |    0.07 |    3.30
norm_wf  |    0.01 |    0.01 |    0.00 |    0.03
rh_penalty |    0.00 |    0.00 |    0.00 |    0.00
att_rewards |    0.00 |    0.00 |    0.00 |    0.00
att_penalty |    0.00 |    0.00 |    0.00 |    0.00
attitude |    0.01    0.01    0.02 |    1.18    0.66    1.88 |   -3.14   -1.54   -3.14 |    3.14    1.55    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.09   -0.05   -0.05 |    0.08    0.07    0.07
a_f      |    0.00    0.01 |    0.66

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.2248   1.2867   5.3139  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0031   0.0019   0.0080   6.6368   2.2852   2.4929
Update Cnt = 2740    ET =   1140.0   Stats:  Mean, Std, Min, Max
r_f      |    5.37    3.79   14.28 |  194.61  161.32  200.68 | -394.04 -346.06 -398.99 |  387.40  390.86  395.17
v_f      |   -0.00   -0.00   -0.00 |    0.05    0.04    0.05 |   -0.10   -0.10   -0.09 |    0.10    0.10    0.10
r_i      |   14.77   10.91   69.15 |  723.99  639.96  741.87 |-1291.33-1258.22-1340.17 | 1365.81 1320.87 1325.13
v_i      |   -0.00   -0.00   -0.00 |    0.05    0.04    0.05 |   -0.10   -0.09   -0.09 |    0.09    0.09    0.09
norm_rf  |    0.21 |    0.09 |    0.04 |    0.48
norm_vf  |    0.08 |    0.01 |    0.05 |    0.12
gs_f     |    1.12 |    1.42 |    0.02 |    9.54
thrust   |   -0.00    0.00   -0.00 |    0.68    0.68    0.68 |   -3.45   -3.40   -3.46 |    3.43    3.44    3.45
norm_thrust |    

ADV1:  -0.000709858817230475 0.007762341909840394 0.05277314768081931 -0.14234372287660957
ADV2:  0.030388101152999697 0.7441836956516457 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.9153   1.0644   5.3465  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0012   0.0006   0.0024   6.6368   2.2852   2.4929
***** Episode 85265, Mean R = -20.3  Std R = 5.9  Min R = -32.7
PolicyLoss: -0.0297
Policy_Beta: 0.114
Policy_Entropy: 0.165
Policy_KL: 0.00117
Policy_SD: 0.535
Policy_lr_mult: 0.198
Steps: 1.18e+04
TotalSteps: 3.13e+07
VF_0_ExplainedVarNew: 0.993
VF_0_ExplainedVarOld: 0.99
VF_0_Loss : 4.51e-05


ADV1:  -0.004229085294039428 0.013221742394455286 0.0921637418496617 -0.17788748684560235
ADV2:  0.046732316373601875 0.8180621411654136 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.0842   0.5364   3.0548  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0053   0.0031   0.0110   6.6368   2.2852   2.49

***** Episode 85513, Mean R = -17.6  Std R = 4.0  Min R = -27.2
PolicyLoss: -0.0274
Policy_Beta: 0.114
Policy_Entropy: 0.161
Policy_KL: 0.00179
Policy_SD: 0.534
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 3.14e+07
VF_0_ExplainedVarNew: 0.987
VF_0_ExplainedVarOld: 0.984
VF_0_Loss : 6.05e-05


ADV1:  -0.00014549478169321892 0.00601213700442068 0.07383371598250926 -0.035785877269071904
ADV2:  -0.012484128950634455 0.8503694673086856 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.9999   1.3555   6.7306  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0003   0.0002   0.0006   6.6368   2.2852   2.4929
***** Episode 85544, Mean R = -17.7  Std R = 4.2  Min R = -29.0
PolicyLoss: 0.0114
Policy_Beta: 0.114
Policy_Entropy: 0.161
Policy_KL: 0.0014
Policy_SD: 0.535
Policy_lr_mult: 0.198
Steps: 1.18e+04
TotalSteps: 3.14e+07
VF_0_ExplainedVarNew: 0.994
VF_0_ExplainedVarOld: 0.992
VF_0_Loss : 2.79e-05


ADV1:  -0.00035684160863229863 0.008628669711538

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.7315   1.0941   5.0807  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0011   0.0007   0.0026   6.6368   2.2852   2.4929
***** Episode 85792, Mean R = -17.7  Std R = 5.9  Min R = -29.6
PolicyLoss: -0.00199
Policy_Beta: 0.114
Policy_Entropy: 0.161
Policy_KL: 0.00142
Policy_SD: 0.539
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 3.15e+07
VF_0_ExplainedVarNew: 0.994
VF_0_ExplainedVarOld: 0.991
VF_0_Loss : 5.35e-05


ADV1:  -0.003528007656059784 0.008461952325318135 0.03393265388905198 -0.07452403348901127
ADV2:  0.06483957960808213 0.8247897950523039 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.0362   0.9804   5.1387  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0043   0.0027   0.0093   6.6368   2.2852   2.4929
***** Episode 85823, Mean R = -17.5  Std R = 4.6  Min R = -28.8
PolicyLoss: -0.0336
Policy_Beta: 0.114
Policy_Entropy: 0.162
Policy_KL: 0.0014

ADV1:  -0.0001612986232277944 0.009266800375605018 0.06458854998281471 -0.1197683367901815
ADV2:  0.019998546442229332 0.8481155972817493 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   3.9305   2.6479  12.1866  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0002   0.0001   0.0004   6.6368   2.2852   2.4929
***** Episode 86071, Mean R = -19.0  Std R = 6.5  Min R = -38.7
PolicyLoss: -0.0238
Policy_Beta: 0.114
Policy_Entropy: 0.162
Policy_KL: 0.00174
Policy_SD: 0.544
Policy_lr_mult: 0.198
Steps: 1.18e+04
TotalSteps: 3.16e+07
VF_0_ExplainedVarNew: 0.987
VF_0_ExplainedVarOld: 0.984
VF_0_Loss : 7.2e-05


ADV1:  0.0013537869346769709 0.0070177611153269285 0.06855050904345455 -0.04536381778186038
ADV2:  -0.031232485231744662 0.8497885027851916 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.7680   0.8957   4.6863  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0018   0.0010   0.0038   6.6368   2.2852   2

***** Episode 86319, Mean R = -16.4  Std R = 6.2  Min R = -37.3
PolicyLoss: -0.0292
Policy_Beta: 0.114
Policy_Entropy: 0.164
Policy_KL: 0.00133
Policy_SD: 0.528
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 3.17e+07
VF_0_ExplainedVarNew: 0.984
VF_0_ExplainedVarOld: 0.981
VF_0_Loss : 9.62e-05


ADV1:  0.0010159842148130315 0.006574126790856888 0.07241160022982007 -0.07052717020205934
ADV2:  0.003907906750645578 0.8332480788327783 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   3.4966   1.7454   7.8833  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0012   0.0007   0.0027   6.6368   2.2852   2.4929
***** Episode 86350, Mean R = -17.0  Std R = 3.6  Min R = -25.5
PolicyLoss: -0.019
Policy_Beta: 0.114
Policy_Entropy: 0.163
Policy_KL: 0.00143
Policy_SD: 0.53
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 3.17e+07
VF_0_ExplainedVarNew: 0.994
VF_0_ExplainedVarOld: 0.991
VF_0_Loss : 3.61e-05


ADV1:  -0.0019298527471982966 0.008267099063153522 

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.1141   0.8459   4.6683  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0034   0.0021   0.0079   6.6368   2.2852   2.4929
***** Episode 86598, Mean R = -18.1  Std R = 5.9  Min R = -33.2
PolicyLoss: -0.0219
Policy_Beta: 0.114
Policy_Entropy: 0.163
Policy_KL: 0.000976
Policy_SD: 0.532
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 3.18e+07
VF_0_ExplainedVarNew: 0.982
VF_0_ExplainedVarOld: 0.979
VF_0_Loss : 8.65e-05


ADV1:  0.004137585816863763 0.007684132715597431 0.08029968307998048 -0.07101828792928755
ADV2:  -0.04008200857236818 0.9088868456757272 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.0957   0.8737   3.9502  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0045   0.0027   0.0108   6.6368   2.2852   2.4929
***** Episode 86629, Mean R = -18.3  Std R = 4.5  Min R = -27.7
PolicyLoss: -0.004
Policy_Beta: 0.114
Policy_Entropy: 0.164
Policy_KL: 0.00157

ADV1:  0.0004356052101962094 0.007943697272758002 0.05212263869910155 -0.05826078470472516
ADV2:  0.021528069277904457 0.8147021831716156 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.4193   1.5133   7.7068  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0006   0.0003   0.0014   6.6368   2.2852   2.4929
***** Episode 86877, Mean R = -17.0  Std R = 4.7  Min R = -26.5
PolicyLoss: -0.0305
Policy_Beta: 0.114
Policy_Entropy: 0.161
Policy_KL: 0.00106
Policy_SD: 0.541
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 3.19e+07
VF_0_ExplainedVarNew: 0.988
VF_0_ExplainedVarOld: 0.986
VF_0_Loss : 0.000111


ADV1:  -0.0005116716142556027 0.006642332484492174 0.06430839668922883 -0.09062377417685297
ADV2:  0.020504218765122265 0.8129817031855553 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.9288   0.9601   5.4426  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0005   0.0003   0.0013   6.6368   2.2852   2

seeker_angles |    0.00    0.00 |    0.08    0.08 |   -0.99   -0.98 |    1.00    1.00
cs_angles |  0.0024  0.0025 |  0.0820  0.0813 | -0.9935 -0.9846 |  0.9953  0.9974
optical_flow | -0.0001  0.0000 |  0.0241  0.0254 | -1.0664 -1.2416 |  1.2011  1.1327
v_err    | -0.0089 |  0.0542 | -0.4525 |  0.1440
landing_rewards |    9.55 |    2.08 |    0.00 |   10.00
landing_margin |   -0.02 |    0.01 |   -0.06 |    0.04
tracking_rewards |  -22.04 |    4.51 |  -42.02 |  -14.04
steps    |     377 |      20 |     333 |     415
***** Episode 87156, Mean R = -17.7  Std R = 5.0  Min R = -27.3
PolicyLoss: -0.0263
Policy_Beta: 0.114
Policy_Entropy: 0.162
Policy_KL: 0.00131
Policy_SD: 0.543
Policy_lr_mult: 0.198
Steps: 1.18e+04
TotalSteps: 3.2e+07
VF_0_ExplainedVarNew: 0.99
VF_0_ExplainedVarOld: 0.988
VF_0_Loss : 5.6e-05


ADV1:  -0.0012910126588389556 0.011015702563231393 0.0364079092331972 -0.07567793877971052
ADV2:  0.024687089648578995 0.9012852406576392 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max 

w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.08   -0.05   -0.05 |    0.09    0.07    0.08
a_f      |   -0.05   -0.08 |    0.69    1.89 |   -1.46   -3.13 |    1.39    3.09
w_f      |    0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.02   -0.02   -0.03 |    0.03    0.02    0.02
w_rewards |   -0.38 |    0.34 |   -2.92 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.26 |    0.31 |    0.00 |    2.97
seeker_angles |   -0.00    0.00 |    0.09    0.08 |   -0.97   -1.00 |    0.99    0.99
cs_angles | -0.0003  0.0001 |  0.0857  0.0815 | -0.9735 -0.9985 |  0.9903  0.9933
optical_flow | -0.0001  0.0000 |  0.0249  0.0240 | -1.0790 -1.3423 |  1.0923  1.2035
v_err    | -0.0093 |  0.0553 | -0.4606 |  0.1206
landing_rewards |    9.26 |    2.62 |    0.00 |   10.00
landing_margin |   -0.02 |    0.01 |   -0.06 |    0.02
tracking_rewards |  -22.67 |    4.56 |  -42.65 |  -14.23
steps    |     377 |  

thrust   |   -0.00   -0.00    0.00 |    0.69    0.69    0.68 |   -3.46   -3.40   -3.45 |    3.43    3.43    3.45
norm_thrust |    0.90 |    0.77 |    0.00 |    3.46
fuel     |    1.53 |    0.18 |    1.03 |    2.05
rewards  |  -17.61 |    5.48 |  -35.55 |   -7.50
fuel_rewards |   -4.38 |    0.52 |   -5.87 |   -2.96
glideslope_rewards |    0.00 |    0.00 |    0.00 |    0.00
glideslope_penalty |    0.00 |    0.00 |    0.00 |    0.00
glideslope |    2.84 |   12.52 |    0.01 |  200.63
norm_af  |    1.81 |    0.90 |    0.11 |    3.34
norm_wf  |    0.01 |    0.01 |    0.00 |    0.04
rh_penalty |    0.00 |    0.00 |    0.00 |    0.00
att_rewards |    0.00 |    0.00 |    0.00 |    0.00
att_penalty |    0.00 |    0.00 |    0.00 |    0.00
attitude |   -0.03   -0.04   -0.06 |    1.28    0.67    1.92 |   -3.14   -1.57   -3.14 |    3.14    1.57    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.07   -0.05   -0.05 |    0.09    0.07    0.07
a_f      |   -0.02   -0.05 |    0.67

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.7273   0.8947   4.6944  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0012   0.0007   0.0025   6.6368   2.2852   2.4929
Update Cnt = 2840    ET =   1138.7   Stats:  Mean, Std, Min, Max
r_f      |   -9.02   -1.04  -15.84 |  184.22  172.83  194.36 | -399.26 -357.51 -385.52 |  390.84  388.31  377.84
v_f      |   -0.00    0.00    0.01 |    0.04    0.04    0.05 |   -0.09   -0.09   -0.10 |    0.10    0.11    0.10
r_i      |   -5.64  -20.90  -60.67 |  695.01  636.12  768.37 |-1319.31-1254.37-1347.52 | 1285.67 1312.68 1296.41
v_i      |   -0.00   -0.00    0.00 |    0.04    0.04    0.05 |   -0.09   -0.09   -0.09 |    0.10    0.09    0.10
norm_rf  |    0.21 |    0.08 |    0.03 |    0.42
norm_vf  |    0.08 |    0.01 |    0.04 |    0.12
gs_f     |    1.33 |    2.04 |    0.01 |   18.96
thrust   |   -0.00    0.00   -0.01 |    0.68    0.70    0.69 |   -3.45   -3.44   -3.46 |    3.44    3.43    3.44
norm_thrust |    

ADV1:  -0.0003911283281099777 0.009969937273681216 0.05263284549430425 -0.0650575119915684
ADV2:  0.01909053253803439 0.8923322100961716 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   9.4620   4.6198  16.5439  23.6511  13.7419   8.3767
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0008   0.0004   0.0015   6.6368   2.2852   2.4929
***** Episode 88365, Mean R = -19.4  Std R = 7.5  Min R = -48.1
PolicyLoss: -0.0184
Policy_Beta: 0.0759
Policy_Entropy: 0.161
Policy_KL: 0.00126
Policy_SD: 0.556
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 3.25e+07
VF_0_ExplainedVarNew: 0.984
VF_0_ExplainedVarOld: 0.98
VF_0_Loss : 0.00018


Dynamics: Max Disturbance (m/s^2):  [0.00127313 0.00130788 0.00159816] 0.0024260046138067644
ADV1:  -0.0012363385372424851 0.008852407790039412 0.04307394314294566 -0.06806284112707595
ADV2:  0.03175251623369751 0.8635837578211316 3.0 -3.0
 *** BROKE ***   3 0.0047349464148283005
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :  12.0733   9.6844  2

***** Episode 88613, Mean R = -17.9  Std R = 5.2  Min R = -30.7
PolicyLoss: -0.025
Policy_Beta: 0.114
Policy_Entropy: 0.161
Policy_KL: 0.00118
Policy_SD: 0.543
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 3.26e+07
VF_0_ExplainedVarNew: 0.984
VF_0_ExplainedVarOld: 0.981
VF_0_Loss : 0.000142


Dynamics: Max Disturbance (m/s^2):  [0.00127313 0.00130788 0.00159816] 0.0024260046138067644
ADV1:  0.0032945250271643103 0.006782573941533813 0.04515891007834616 -0.06892162324639922
ADV2:  -0.015919307371160082 0.8403811068311883 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.7100   1.2033   5.7770  23.6511  13.7419   9.6844
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0039   0.0025   0.0086   6.6368   2.2852   2.4929
***** Episode 88644, Mean R = -17.3  Std R = 4.9  Min R = -30.0
PolicyLoss: -0.0253
Policy_Beta: 0.114
Policy_Entropy: 0.162
Policy_KL: 0.00138
Policy_SD: 0.547
Policy_lr_mult: 0.198
Steps: 1.15e+04
TotalSteps: 3.26e+07
VF_0_ExplainedVarNew: 0.993
VF_0_Ex

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.9577   0.9083   3.8732  23.6511  13.7419   9.6844
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0015   0.0007   0.0028   6.6368   2.2852   2.4929
***** Episode 88892, Mean R = -19.2  Std R = 8.3  Min R = -37.5
PolicyLoss: -0.0182
Policy_Beta: 0.114
Policy_Entropy: 0.165
Policy_KL: 0.00128
Policy_SD: 0.538
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 3.27e+07
VF_0_ExplainedVarNew: 0.988
VF_0_ExplainedVarOld: 0.986
VF_0_Loss : 0.000104


Dynamics: Max Disturbance (m/s^2):  [0.00127313 0.00130788 0.00159816] 0.0024260046138067644
ADV1:  -0.0005885566522250763 0.0093626665352496 0.04846698492550511 -0.07666366183330398
ADV2:  0.023290692274915713 0.8697303564761657 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.2595   1.2611   6.7781  23.6511  13.7419   9.6844
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0005   0.0003   0.0016   6.6368   2.2852   2.4929
***** Episode 88923, Mean R = -18.2  Std R = 4.4  

Dynamics: Max Disturbance (m/s^2):  [0.00127313 0.00130788 0.00159816] 0.0024260046138067644
ADV1:  0.004251445236884182 0.00860937867097382 0.05547024627845987 -0.10463776528373248
ADV2:  -0.015926053981597032 0.8429428583799602 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.3822   0.9425   5.2691  23.6511  13.7419   9.6844
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0063   0.0031   0.0112   6.6368   2.2852   2.4929
***** Episode 89171, Mean R = -17.9  Std R = 5.0  Min R = -34.8
PolicyLoss: -0.0252
Policy_Beta: 0.114
Policy_Entropy: 0.163
Policy_KL: 0.0013
Policy_SD: 0.544
Policy_lr_mult: 0.198
Steps: 1.15e+04
TotalSteps: 3.28e+07
VF_0_ExplainedVarNew: 0.99
VF_0_ExplainedVarOld: 0.986
VF_0_Loss : 0.000136


ADV1:  0.0018505067858009992 0.007799175988472824 0.05475449912442798 -0.0603740569492649
ADV2:  -0.005093244230079691 0.8507745307656415 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.6886   0.8536   3.9669  23.6511  13.7419   9.6844
ValFun  

***** Episode 89419, Mean R = -17.7  Std R = 5.8  Min R = -33.4
PolicyLoss: -0.0182
Policy_Beta: 0.114
Policy_Entropy: 0.162
Policy_KL: 0.00145
Policy_SD: 0.537
Policy_lr_mult: 0.198
Steps: 1.18e+04
TotalSteps: 3.29e+07
VF_0_ExplainedVarNew: 0.969
VF_0_ExplainedVarOld: 0.966
VF_0_Loss : 0.000132


Dynamics: Max Disturbance (m/s^2):  [0.00127313 0.00130788 0.00159816] 0.0024260046138067644
ADV1:  0.0018531943626519942 0.010776714420804748 0.04538521030187567 -0.1399677341864568
ADV2:  0.016240339753760446 0.7874655032110391 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.5050   0.9931   5.3790  23.6511  13.7419   9.6844
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0021   0.0012   0.0049   6.6368   2.2852   2.4929
***** Episode 89450, Mean R = -18.2  Std R = 5.3  Min R = -28.0
PolicyLoss: -0.0319
Policy_Beta: 0.114
Policy_Entropy: 0.161
Policy_KL: 0.00132
Policy_SD: 0.544
Policy_lr_mult: 0.198
Steps: 1.15e+04
TotalSteps: 3.29e+07
VF_0_ExplainedVarNew: 0.981
VF_0_Exp

ADV1:  0.0004891537209902136 0.008603316159790772 0.23127683437902358 -0.050208634084296655
ADV2:  0.0006520093269832511 0.7705442478544482 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.2415   0.5646   2.3767  23.6511  13.7419   9.6844
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0007   0.0004   0.0016   6.6368   2.2852   2.4929
***** Episode 89698, Mean R = -17.4  Std R = 5.7  Min R = -29.3
PolicyLoss: -0.00781
Policy_Beta: 0.114
Policy_Entropy: 0.161
Policy_KL: 0.000906
Policy_SD: 0.544
Policy_lr_mult: 0.198
Steps: 1.14e+04
TotalSteps: 3.3e+07
VF_0_ExplainedVarNew: 0.988
VF_0_ExplainedVarOld: 0.984
VF_0_Loss : 0.000114


ADV1:  0.002419601110807262 0.006309523976723526 0.07338095473962547 -0.06545582191214205
ADV2:  -0.03173583815888695 0.882558214288063 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.9069   1.3605   6.9807  23.6511  13.7419   9.6844
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0032   0.0019   0.0066   6.6368   2.2852   2

Dynamics: Max Disturbance (m/s^2):  [0.00127313 0.00130788 0.00159816] 0.0024260046138067644
ADV1:  -0.0009136130387155286 0.009500252717639211 0.059730612337359434 -0.06587672127205742
ADV2:  0.023034419227129867 0.8576928404307573 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.2181   0.4986   2.4241  23.6511  13.7419   9.6844
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0009   0.0005   0.0026   6.6368   2.2852   2.4929
***** Episode 89977, Mean R = -18.2  Std R = 5.9  Min R = -32.9
PolicyLoss: -0.0198
Policy_Beta: 0.114
Policy_Entropy: 0.16
Policy_KL: 0.000827
Policy_SD: 0.549
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 3.31e+07
VF_0_ExplainedVarNew: 0.983
VF_0_ExplainedVarOld: 0.98
VF_0_Loss : 8.86e-05


ADV1:  0.0021720478668916265 0.008537865617628785 0.0557664069134422 -0.1200992888284893
ADV2:  0.005657224116935158 0.8264593976852181 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.0727   1.3620   6.6172  23.6511  13.7419   9.6844
ValFun

seeker_angles |   -0.00    0.00 |    0.08    0.08 |   -1.00   -0.99 |    0.99    0.97
cs_angles | -0.0001  0.0001 |  0.0842  0.0810 | -0.9976 -0.9907 |  0.9861  0.9749
optical_flow |  0.0001  0.0001 |  0.0266  0.0252 | -1.3952 -0.9544 |  1.1960  1.1996
v_err    | -0.0093 |  0.0545 | -0.4536 |  0.1138
landing_rewards |    9.35 |    2.46 |    0.00 |   10.00
landing_margin |   -0.02 |    0.01 |   -0.06 |    0.02
tracking_rewards |  -22.23 |    4.25 |  -38.72 |  -13.69
steps    |     377 |      19 |     334 |     418
***** Episode 90256, Mean R = -16.9  Std R = 5.3  Min R = -31.2
PolicyLoss: 0.012
Policy_Beta: 0.114
Policy_Entropy: 0.161
Policy_KL: 0.00118
Policy_SD: 0.552
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 3.32e+07
VF_0_ExplainedVarNew: 0.994
VF_0_ExplainedVarOld: 0.991
VF_0_Loss : 0.000145


ADV1:  -0.0006976046206390128 0.006592258153237809 0.03768633979137198 -0.06902619846324075
ADV2:  0.028461108441679133 0.808022534139397 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max

w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.09   -0.06   -0.10 |    0.07    0.07    0.07
a_f      |    0.00    0.05 |    0.66    1.87 |   -1.55   -3.10 |    1.50    3.14
w_f      |    0.00   -0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.02 |    0.04    0.03    0.02
w_rewards |   -0.32 |    0.45 |   -6.00 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.27 |    0.31 |    0.00 |    2.89
seeker_angles |    0.00   -0.00 |    0.08    0.09 |   -0.99   -1.00 |    0.98    0.98
cs_angles |  0.0010 -0.0007 |  0.0833  0.0857 | -0.9900 -0.9957 |  0.9831  0.9754
optical_flow | -0.0000  0.0002 |  0.0237  0.0245 | -1.1438 -1.1481 |  1.0275  1.2904
v_err    | -0.0095 |  0.0557 | -0.5914 |  0.1129
landing_rewards |    9.48 |    2.21 |    0.00 |   10.00
landing_margin |   -0.02 |    0.01 |   -0.06 |    0.02
tracking_rewards |  -22.87 |    5.93 |  -71.11 |  -14.21
steps    |     378 |  

attitude |   -0.13    0.06    0.09 |    1.20    0.64    1.83 |   -3.14   -1.56   -3.14 |    3.14    1.57    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.07   -0.05   -0.05 |    0.09    0.07    0.08
a_f      |    0.06    0.09 |    0.64    1.85 |   -1.47   -3.12 |    1.40    3.12
w_f      |    0.00   -0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.02 |    0.04    0.02    0.02
w_rewards |   -0.34 |    0.28 |   -2.30 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.27 |    0.31 |    0.00 |    2.73
seeker_angles |    0.00    0.00 |    0.09    0.08 |   -0.98   -0.96 |    1.00    0.99
cs_angles |  0.0018  0.0049 |  0.0852  0.0850 | -0.9815 -0.9649 |  0.9963  0.9856
optical_flow | -0.0000  0.0000 |  0.0240  0.0249 | -1.3663 -1.2163 |  1.0784  1.1449
v_err    | -0.0090 |  0.0546 | -0.4525 |  0.1295
landing_rewards |    9.58 |    2.00 |    0.00 |   10.00
landing_margin |   -0

w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.09   -0.05   -0.06 |    0.08    0.07    0.07
a_f      |   -0.00    0.05 |    0.61    1.85 |   -1.44   -3.13 |    1.52    3.14
w_f      |    0.00   -0.00    0.00 |    0.01    0.01    0.01 |   -0.02   -0.02   -0.02 |    0.03    0.02    0.02
w_rewards |   -0.33 |    0.31 |   -2.66 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |   -0.16 |    2.84 |  -50.00 |    0.00
theta_cv |    0.27 |    0.31 |    0.00 |    2.78
seeker_angles |    0.01    0.00 |    0.09    0.08 |   -0.99   -1.00 |    0.98    0.99
cs_angles |  0.0050  0.0033 |  0.0851  0.0849 | -0.9880 -0.9974 |  0.9833  0.9947
optical_flow | -0.0000  0.0001 |  0.0243  0.0251 | -0.9643 -1.0613 |  1.1458  1.1550
v_err    | -0.0089 |  0.0554 | -0.4534 |  0.5055
landing_rewards |    9.48 |    2.21 |    0.00 |   10.00
landing_margin |    1.64 |   29.23 |   -0.07 |  515.53
tracking_rewards |  -22.77 |    6.43 |  -98.82 |  -14.16
steps    |     376 |  

attitude |   -0.01   -0.06    0.02 |    1.17    0.65    1.81 |   -3.14   -1.57   -3.14 |    3.14    1.56    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.07   -0.05   -0.05 |    0.08    0.07    0.07
a_f      |   -0.05   -0.03 |    0.64    1.79 |   -1.48   -3.11 |    1.37    3.12
w_f      |    0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.02 |    0.03    0.02    0.02
w_rewards |   -0.30 |    0.24 |   -1.47 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.26 |    0.30 |    0.00 |    3.12
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -0.97   -0.99 |    0.99    1.00
cs_angles |  0.0033  0.0007 |  0.0835  0.0827 | -0.9707 -0.9896 |  0.9912  0.9996
optical_flow | -0.0000  0.0002 |  0.0248  0.0261 | -1.1119 -1.2452 |  1.2795  1.1551
v_err    | -0.0089 |  0.0546 | -0.4512 |  0.1149
landing_rewards |    9.65 |    1.85 |    0.00 |   10.00
landing_margin |   -0

attitude |    0.05   -0.01   -0.03 |    1.28    0.66    1.91 |   -3.14   -1.57   -3.14 |    3.14    1.55    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.08   -0.05   -0.05 |    0.08    0.07    0.07
a_f      |   -0.01   -0.08 |    0.66    1.89 |   -1.43   -3.14 |    1.48    3.12
w_f      |    0.00   -0.00   -0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.02 |    0.03    0.03    0.02
w_rewards |   -0.33 |    0.28 |   -2.45 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.26 |    0.31 |    0.00 |    2.93
seeker_angles |   -0.00    0.00 |    0.08    0.09 |   -0.99   -0.98 |    0.99    0.99
cs_angles | -0.0011  0.0017 |  0.0828  0.0889 | -0.9871 -0.9807 |  0.9873  0.9863
optical_flow | -0.0000 -0.0000 |  0.0243  0.0262 | -0.9773 -1.1887 |  1.0842  1.1002
v_err    | -0.0091 |  0.0548 | -0.4534 |  0.1240
landing_rewards |    9.55 |    2.08 |    0.00 |   10.00
landing_margin |   -0

attitude |   -0.10   -0.01   -0.02 |    1.31    0.67    1.91 |   -3.14   -1.57   -3.14 |    3.14    1.54    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.07   -0.05   -0.05 |    0.08    0.07    0.07
a_f      |   -0.01   -0.06 |    0.68    1.89 |   -1.48   -3.13 |    1.46    3.09
w_f      |    0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.02 |    0.04    0.03    0.02
w_rewards |   -0.31 |    0.24 |   -1.34 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.27 |    0.30 |    0.00 |    3.12
seeker_angles |    0.00    0.00 |    0.08    0.09 |   -1.00   -0.99 |    1.00    0.99
cs_angles |  0.0015  0.0045 |  0.0837  0.0865 | -0.9971 -0.9922 |  0.9978  0.9867
optical_flow |  0.0000  0.0000 |  0.0242  0.0240 | -1.0687 -1.1626 |  1.2464  1.2276
v_err    | -0.0088 |  0.0546 | -0.4539 |  0.1071
landing_rewards |    9.39 |    2.40 |    0.00 |   10.00
landing_margin |   -0

thrust   |   -0.01   -0.00    0.00 |    0.69    0.67    0.68 |   -3.46   -3.43   -3.42 |    3.44    3.46    3.44
norm_thrust |    0.90 |    0.77 |    0.00 |    3.46
fuel     |    1.52 |    0.19 |    1.06 |    2.23
rewards  |  -17.83 |    5.54 |  -36.19 |   -7.48
fuel_rewards |   -4.36 |    0.54 |   -6.37 |   -3.06
glideslope_rewards |    0.00 |    0.00 |    0.00 |    0.00
glideslope_penalty |    0.00 |    0.00 |    0.00 |    0.00
glideslope |    2.87 |   12.51 |    0.01 |  221.32
norm_af  |    1.75 |    0.93 |    0.04 |    3.38
norm_wf  |    0.01 |    0.01 |    0.00 |    0.04
rh_penalty |    0.00 |    0.00 |    0.00 |    0.00
att_rewards |    0.00 |    0.00 |    0.00 |    0.00
att_penalty |    0.00 |    0.00 |    0.00 |    0.00
attitude |    0.05    0.01    0.19 |    1.24    0.64    1.85 |   -3.14   -1.53   -3.14 |    3.14    1.56    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.08   -0.05   -0.05 |    0.07    0.07    0.07
a_f      |    0.01    0.17 |    0.65

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.1127   0.3607   2.1921  23.6511  13.7419   9.6844
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0009   0.0005   0.0021   6.6368   2.2852   2.4929
Update Cnt = 2990    ET =   1056.0   Stats:  Mean, Std, Min, Max
r_f      |   -5.78    7.61  -12.12 |  196.04  164.33  199.19 | -396.58 -376.90 -385.19 |  374.07  387.69  385.02
v_f      |   -0.00   -0.00    0.00 |    0.04    0.04    0.05 |   -0.11   -0.10   -0.11 |    0.11    0.12    0.09
r_i      |  -26.97    8.93  -28.56 |  697.33  656.57  763.08 |-1301.08-1322.98-1346.55 | 1280.80 1264.68 1315.75
v_i      |    0.00   -0.00    0.00 |    0.04    0.04    0.05 |   -0.09   -0.09   -0.09 |    0.09    0.10    0.10
norm_rf  |    0.21 |    0.09 |    0.03 |    0.46
norm_vf  |    0.08 |    0.01 |    0.04 |    0.12
gs_f     |    1.34 |    2.17 |    0.01 |   19.80
thrust   |    0.00    0.01    0.00 |    0.69    0.67    0.67 |   -3.43   -3.44   -3.46 |    3.44    3.45    3.46
norm_thrust |    

ADV1:  -0.0005925745779434968 0.008486443491354568 0.03394604207925023 -0.05592155291289109
ADV2:  0.0281146303058296 0.8617651244378244 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   3.2303   1.9424   9.7259  23.6511  13.7419   9.6844
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0008   0.0005   0.0017   6.6368   2.2852   2.4929
***** Episode 93015, Mean R = -16.4  Std R = 4.0  Min R = -29.6
PolicyLoss: -0.0274
Policy_Beta: 0.114
Policy_Entropy: 0.168
Policy_KL: 0.00133
Policy_SD: 0.517
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 3.43e+07
VF_0_ExplainedVarNew: 0.984
VF_0_ExplainedVarOld: 0.982
VF_0_Loss : 6.74e-05


ADV1:  -0.0006214240992822956 0.009485965717313131 0.03356026838673337 -0.06914005442177068
ADV2:  0.029267567741739678 0.8529742248610708 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   3.8731   2.5621  10.6509  23.6511  13.7419   9.6844
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0006   0.0004   0.0016   6.6368   2.2852   2.

***** Episode 93263, Mean R = -17.1  Std R = 5.2  Min R = -31.8
PolicyLoss: -0.0281
Policy_Beta: 0.114
Policy_Entropy: 0.166
Policy_KL: 0.00138
Policy_SD: 0.52
Policy_lr_mult: 0.198
Steps: 1.19e+04
TotalSteps: 3.44e+07
VF_0_ExplainedVarNew: 0.982
VF_0_ExplainedVarOld: 0.98
VF_0_Loss : 7.63e-05


ADV1:  -0.0007247967311413493 0.012122148814943692 0.06332768987262244 -0.13137795288760745
ADV2:  0.026516215951747874 0.8384972629621014 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.6310   1.3713   6.2044  23.6511  13.7419   9.6844
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0010   0.0005   0.0022   6.6368   2.2852   2.4929
***** Episode 93294, Mean R = -20.0  Std R = 7.0  Min R = -40.6
PolicyLoss: -0.0265
Policy_Beta: 0.114
Policy_Entropy: 0.168
Policy_KL: 0.00113
Policy_SD: 0.537
Policy_lr_mult: 0.198
Steps: 1.14e+04
TotalSteps: 3.44e+07
VF_0_ExplainedVarNew: 0.979
VF_0_ExplainedVarOld: 0.974
VF_0_Loss : 0.000169


ADV1:  0.00015194264437573462 0.009724139118548853

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.2469   0.5306   2.7095  23.6511  13.7419   9.6844
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0009   0.0004   0.0019   6.6368   2.2852   2.4929
***** Episode 93542, Mean R = -17.3  Std R = 5.7  Min R = -33.4
PolicyLoss: -0.0304
Policy_Beta: 0.114
Policy_Entropy: 0.164
Policy_KL: 0.0012
Policy_SD: 0.538
Policy_lr_mult: 0.198
Steps: 1.14e+04
TotalSteps: 3.45e+07
VF_0_ExplainedVarNew: 0.989
VF_0_ExplainedVarOld: 0.987
VF_0_Loss : 6.23e-05


ADV1:  0.000517301095260273 0.007788211168710145 0.05272482124933758 -0.09257814893986538
ADV2:  0.02112397918437789 0.8051816338951054 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.7537   1.5671   7.5664  23.6511  13.7419   9.6844
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0010   0.0004   0.0019   6.6368   2.2852   2.4929
***** Episode 93573, Mean R = -17.4  Std R = 5.3  Min R = -30.0
PolicyLoss: -0.0307
Policy_Beta: 0.114
Policy_Entropy: 0.165
Policy_KL: 0.00134
P

ADV1:  -0.00310939490015864 0.010112357656724804 0.03468025874714836 -0.07659952839019807
ADV2:  0.0403026434989615 0.8923425527568002 3.0 -3.0
 *** BROKE ***   6 0.004492652602493763
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   7.7469   6.0725  17.8539  23.6511  13.7419   9.6844
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0047   0.0022   0.0081   6.6368   2.2852   2.4929
***** Episode 93821, Mean R = -18.7  Std R = 5.6  Min R = -35.5
PolicyLoss: -0.0168
Policy_Beta: 0.0759
Policy_Entropy: 0.165
Policy_KL: 0.00449
Policy_SD: 0.537
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 3.46e+07
VF_0_ExplainedVarNew: 0.978
VF_0_ExplainedVarOld: 0.977
VF_0_Loss : 0.000127


ADV1:  0.0029321268835143053 0.006642721315454019 0.029832481648683934 -0.0799498985113013
ADV2:  -0.007346138341045844 0.844769027503682 3.0 -3.0
 *** BROKE ***   1 0.006875268649309874
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :  14.2673  10.7067  24.9741  24.9741  14.2673  10.7067
ValFun  Gradients: u

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   7.0494   4.9742  17.3464  37.2774  23.1806  15.1808
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0010   0.0004   0.0016   6.6368   2.2852   2.4929
***** Episode 94069, Mean R = -17.1  Std R = 4.2  Min R = -26.7
PolicyLoss: -0.0195
Policy_Beta: 0.0338
Policy_Entropy: 0.167
Policy_KL: 0.000116
Policy_SD: 0.522
Policy_lr_mult: 0.0878
Steps: 1.16e+04
TotalSteps: 3.47e+07
VF_0_ExplainedVarNew: 0.994
VF_0_ExplainedVarOld: 0.991
VF_0_Loss : 9.64e-05


ADV1:  -0.0008887948350355092 0.010392348645038286 0.06393251730805949 -0.177223772029118
ADV2:  0.036062775949393694 0.6747793949517216 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   6.5349   3.8756  11.7299  37.2774  23.1806  15.1808
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0011   0.0006   0.0023   6.6368   2.2852   2.4929
***** Episode 94100, Mean R = -16.9  Std R = 4.7  Min R = -32.1
PolicyLoss: -0.0327
Policy_Beta: 0.0506
Policy_Entropy: 0.165
Policy_KL: 0.0

ADV1:  -0.000446465189214586 0.00958181162708119 0.04590032075878969 -0.06230867050501869
ADV2:  0.025475404792209503 0.8624970560486772 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.4441   1.0600   4.7617  37.2774  23.1806  15.1808
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0006   0.0003   0.0013   6.6368   2.2852   2.4929
***** Episode 94348, Mean R = -17.6  Std R = 6.1  Min R = -35.0
PolicyLoss: -0.0259
Policy_Beta: 0.114
Policy_Entropy: 0.164
Policy_KL: 0.0011
Policy_SD: 0.542
Policy_lr_mult: 0.0878
Steps: 1.17e+04
TotalSteps: 3.48e+07
VF_0_ExplainedVarNew: 0.98
VF_0_ExplainedVarOld: 0.98
VF_0_Loss : 8.8e-05


ADV1:  0.0011236819449571263 0.008931220583897361 0.0555622845535646 -0.05677857161791484
ADV2:  0.011818913571497041 0.8740665607002055 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   4.1334   1.7407   9.2072  37.2774  23.1806  15.1808
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0014   0.0008   0.0030   6.6368   2.2852   2.4929


***** Episode 94596, Mean R = -18.2  Std R = 4.6  Min R = -28.6
PolicyLoss: -0.00812
Policy_Beta: 0.114
Policy_Entropy: 0.165
Policy_KL: 0.00112
Policy_SD: 0.536
Policy_lr_mult: 0.0878
Steps: 1.17e+04
TotalSteps: 3.49e+07
VF_0_ExplainedVarNew: 0.988
VF_0_ExplainedVarOld: 0.983
VF_0_Loss : 6.45e-05


ADV1:  -0.0001821230713476598 0.009076241036199422 0.04131279401895549 -0.06534835369425113
ADV2:  0.014716147664984228 0.907828944723743 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.7179   0.7100   3.5866  37.2774  23.1806  15.1808
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0005   0.0003   0.0012   6.6368   2.2852   2.4929
***** Episode 94627, Mean R = -17.9  Std R = 4.4  Min R = -28.5
PolicyLoss: -0.0165
Policy_Beta: 0.114
Policy_Entropy: 0.166
Policy_KL: 0.00104
Policy_SD: 0.535
Policy_lr_mult: 0.0878
Steps: 1.17e+04
TotalSteps: 3.49e+07
VF_0_ExplainedVarNew: 0.984
VF_0_ExplainedVarOld: 0.983
VF_0_Loss : 7.56e-05


ADV1:  -0.0006809607800515367 0.00931486332731

cs_angles |  0.0007  0.0008 |  0.0844  0.0825 | -0.9972 -0.9694 |  0.9932  0.9881
optical_flow | -0.0001  0.0002 |  0.0234  0.0246 | -1.1792 -1.1552 |  0.9560  0.9571
v_err    | -0.0095 |  0.0545 | -0.4533 |  0.1047
landing_rewards |    9.52 |    2.15 |    0.00 |   10.00
landing_margin |   -0.02 |    0.01 |   -0.05 |    0.02
tracking_rewards |  -22.14 |    4.13 |  -38.16 |  -14.95
steps    |     376 |      21 |     333 |     419
***** Episode 94906, Mean R = -17.5  Std R = 5.2  Min R = -30.6
PolicyLoss: -0.0285
Policy_Beta: 0.114
Policy_Entropy: 0.164
Policy_KL: 0.00125
Policy_SD: 0.546
Policy_lr_mult: 0.0878
Steps: 1.16e+04
TotalSteps: 3.5e+07
VF_0_ExplainedVarNew: 0.988
VF_0_ExplainedVarOld: 0.986
VF_0_Loss : 5.95e-05


ADV1:  -0.0017603778632513654 0.009147591005135236 0.05690406368351164 -0.07559712161719989
ADV2:  0.03256197495971186 0.854950058999947 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.1946   0.4422   1.9836  37.2774  23.1806  15.1808
ValFun  Gradients: 

w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.08   -0.05   -0.05 |    0.09    0.07    0.07
a_f      |   -0.05   -0.04 |    0.68    1.87 |   -1.49   -3.13 |    1.43    3.13
w_f      |    0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.02 |    0.03    0.02    0.02
w_rewards |   -0.31 |    0.31 |   -2.82 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.27 |    0.31 |    0.00 |    2.86
seeker_angles |    0.00   -0.00 |    0.09    0.09 |   -0.99   -0.96 |    1.00    1.00
cs_angles |  0.0010 -0.0002 |  0.0876  0.0865 | -0.9893 -0.9573 |  0.9977  0.9964
optical_flow | -0.0000 -0.0000 |  0.0246  0.0247 | -1.1486 -0.9019 |  1.3156  1.1116
v_err    | -0.0097 |  0.0545 | -0.4522 |  0.0998
landing_rewards |    9.55 |    2.08 |    0.00 |   10.00
landing_margin |   -0.02 |    0.01 |   -0.06 |    0.02
tracking_rewards |  -22.85 |    4.99 |  -43.20 |  -14.21
steps    |     379 |  

attitude |   -0.07    0.00   -0.00 |    1.17    0.64    1.86 |   -3.14   -1.54   -3.14 |    3.14    1.57    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.08   -0.05   -0.05 |    0.09    0.07    0.07
a_f      |   -0.00    0.00 |    0.65    1.86 |   -1.35   -3.07 |    1.54    3.12
w_f      |    0.00   -0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.02 |    0.03    0.02    0.02
w_rewards |   -0.29 |    0.26 |   -2.18 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.26 |    0.31 |    0.00 |    2.83
seeker_angles |    0.00   -0.00 |    0.09    0.08 |   -0.99   -0.98 |    1.00    0.99
cs_angles |  0.0009 -0.0004 |  0.0851  0.0825 | -0.9898 -0.9753 |  0.9996  0.9893
optical_flow | -0.0000  0.0001 |  0.0243  0.0245 | -1.2928 -1.1599 |  1.1405  1.0590
v_err    | -0.0098 |  0.0546 | -0.4514 |  0.1070
landing_rewards |    9.55 |    2.08 |    0.00 |   10.00
landing_margin |   -0

w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.08   -0.05   -0.05 |    0.09    0.07    0.06
a_f      |    0.04    0.20 |    0.69    1.83 |   -1.49   -3.13 |    1.52    3.11
w_f      |    0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.02 |    0.03    0.02    0.02
w_rewards |   -0.28 |    0.28 |   -2.68 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.26 |    0.31 |    0.00 |    2.92
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -0.99   -0.97 |    1.00    0.99
cs_angles |  0.0045  0.0001 |  0.0832  0.0830 | -0.9899 -0.9676 |  0.9974  0.9869
optical_flow |  0.0000  0.0001 |  0.0240  0.0245 | -1.0677 -1.0581 |  1.1417  1.0831
v_err    | -0.0096 |  0.0542 | -0.4522 |  0.1044
landing_rewards |    9.39 |    2.40 |    0.00 |   10.00
landing_margin |   -0.02 |    0.01 |   -0.06 |    0.03
tracking_rewards |  -22.07 |    4.39 |  -38.31 |  -14.47
steps    |     378 |  

attitude |   -0.07   -0.01   -0.09 |    1.30    0.69    1.86 |   -3.14   -1.54   -3.14 |    3.14    1.57    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.08   -0.05   -0.05 |    0.10    0.07    0.07
a_f      |   -0.02   -0.05 |    0.69    1.86 |   -1.45   -3.12 |    1.46    3.12
w_f      |    0.00   -0.00   -0.00 |    0.01    0.01    0.01 |   -0.02   -0.02   -0.02 |    0.03    0.02    0.03
w_rewards |   -0.29 |    0.29 |   -3.04 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.26 |    0.31 |    0.00 |    3.11
seeker_angles |    0.00    0.00 |    0.09    0.08 |   -1.00   -0.99 |    0.99    0.99
cs_angles |  0.0021  0.0028 |  0.0866  0.0816 | -0.9997 -0.9866 |  0.9880  0.9905
optical_flow |  0.0001 -0.0000 |  0.0240  0.0245 | -0.8777 -1.1719 |  0.9480  1.1757
v_err    | -0.0094 |  0.0545 | -0.4522 |  0.1131
landing_rewards |    9.55 |    2.08 |    0.00 |   10.00
landing_margin |   -0

attitude |   -0.07    0.09   -0.07 |    1.14    0.65    1.84 |   -3.14   -1.57   -3.14 |    3.13    1.55    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.07   -0.05   -0.05 |    0.09    0.07    0.07
a_f      |    0.08   -0.04 |    0.65    1.83 |   -1.39   -3.13 |    1.46    3.13
w_f      |    0.00   -0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.02 |    0.03    0.02    0.02
w_rewards |   -0.29 |    0.29 |   -2.15 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.25 |    0.30 |    0.00 |    2.94
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -0.99   -0.99 |    1.00    0.99
cs_angles |  0.0040  0.0008 |  0.0813  0.0824 | -0.9888 -0.9886 |  0.9963  0.9907
optical_flow | -0.0000 -0.0000 |  0.0249  0.0246 | -1.2024 -1.1819 |  1.1669  1.1763
v_err    | -0.0093 |  0.0544 | -0.4979 |  0.1137
landing_rewards |    9.48 |    2.21 |    0.00 |   10.00
landing_margin |   -0

w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.08   -0.05   -0.05 |    0.08    0.07    0.07
a_f      |    0.01    0.01 |    0.62    1.88 |   -1.48   -3.05 |    1.37    3.13
w_f      |    0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.01 |    0.03    0.02    0.02
w_rewards |   -0.26 |    0.27 |   -2.37 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.26 |    0.31 |    0.00 |    2.92
seeker_angles |   -0.00    0.00 |    0.09    0.08 |   -0.99   -0.98 |    1.00    1.00
cs_angles | -0.0002  0.0032 |  0.0870  0.0824 | -0.9897 -0.9783 |  0.9957  0.9978
optical_flow | -0.0000  0.0001 |  0.0243  0.0251 | -1.1632 -0.9725 |  0.9806  1.1628
v_err    | -0.0088 |  0.0547 | -0.4529 |  0.1021
landing_rewards |    9.71 |    1.68 |    0.00 |   10.00
landing_margin |   -0.02 |    0.01 |   -0.07 |    0.01
tracking_rewards |  -22.45 |    4.35 |  -36.72 |  -13.91
steps    |     377 |  

att_rewards |    0.00 |    0.00 |    0.00 |    0.00
att_penalty |    0.00 |    0.00 |    0.00 |    0.00
attitude |   -0.04    0.00    0.23 |    1.21    0.62    1.82 |   -3.14   -1.56   -3.14 |    3.14    1.53    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.08   -0.05   -0.05 |    0.09    0.07    0.07
a_f      |   -0.00    0.20 |    0.64    1.82 |   -1.40   -3.14 |    1.43    3.14
w_f      |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.02 |    0.04    0.02    0.02
w_rewards |   -0.28 |    0.31 |   -2.68 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.26 |    0.31 |    0.00 |    3.08
seeker_angles |   -0.00    0.00 |    0.09    0.08 |   -0.98   -0.97 |    1.00    1.00
cs_angles | -0.0008  0.0027 |  0.0864  0.0831 | -0.9829 -0.9710 |  0.9980  0.9965
optical_flow |  0.0001  0.0001 |  0.0234  0.0247 | -0.9157 -0.9406 |  1.0748  1.1033
v_err    | -0.0087 |  

w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.08   -0.05   -0.05 |    0.09    0.07    0.07
a_f      |   -0.01    0.07 |    0.67    1.92 |   -1.46   -3.14 |    1.39    3.14
w_f      |    0.00   -0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.02 |    0.03    0.02    0.02
w_rewards |   -0.28 |    0.30 |   -2.47 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.26 |    0.31 |    0.00 |    2.92
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -0.98   -0.99 |    1.00    0.97
cs_angles |  0.0046  0.0024 |  0.0823  0.0829 | -0.9781 -0.9944 |  0.9974  0.9686
optical_flow | -0.0001  0.0000 |  0.0238  0.0252 | -1.1919 -1.1591 |  1.0040  1.1513
v_err    | -0.0090 |  0.0549 | -0.4528 |  0.1104
landing_rewards |    9.45 |    2.28 |    0.00 |   10.00
landing_margin |   -0.02 |    0.01 |   -0.06 |    0.03
tracking_rewards |  -22.11 |    4.60 |  -40.64 |  -13.96
steps    |     376 |  

w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.07   -0.05   -0.05 |    0.08    0.07    0.07
a_f      |    0.04    0.07 |    0.66    1.86 |   -1.53   -3.12 |    1.49    3.14
w_f      |    0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.02 |    0.03    0.02    0.02
w_rewards |   -0.29 |    0.26 |   -1.77 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.26 |    0.31 |    0.00 |    3.01
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -1.00   -0.99 |    0.95    1.00
cs_angles |  0.0020  0.0023 |  0.0842  0.0825 | -0.9963 -0.9938 |  0.9494  0.9998
optical_flow | -0.0000 -0.0000 |  0.0240  0.0246 | -1.0826 -1.0917 |  1.1672  1.1515
v_err    | -0.0089 |  0.0546 | -0.4535 |  0.1132
landing_rewards |    9.48 |    2.21 |    0.00 |   10.00
landing_margin |   -0.02 |    0.01 |   -0.06 |    0.03
tracking_rewards |  -22.28 |    4.69 |  -48.52 |  -13.91
steps    |     377 |  

thrust   |   -0.00    0.00    0.00 |    0.68    0.69    0.69 |   -3.46   -3.44   -3.46 |    3.44    3.43    3.46
norm_thrust |    0.91 |    0.77 |    0.00 |    3.46
fuel     |    1.56 |    0.19 |    1.10 |    2.17
rewards  |  -17.82 |    5.77 |  -43.10 |   -7.21
fuel_rewards |   -4.46 |    0.53 |   -6.21 |   -3.15
glideslope_rewards |    0.00 |    0.00 |    0.00 |    0.00
glideslope_penalty |    0.00 |    0.00 |    0.00 |    0.00
glideslope |    2.93 |   12.49 |    0.01 |  363.00
norm_af  |    1.72 |    0.92 |    0.05 |    3.25
norm_wf  |    0.01 |    0.01 |    0.00 |    0.04
rh_penalty |    0.00 |    0.00 |    0.00 |    0.00
att_rewards |    0.00 |    0.00 |    0.00 |    0.00
att_penalty |    0.00 |    0.00 |    0.00 |    0.00
attitude |    0.03   -0.02   -0.04 |    1.18    0.66    1.81 |   -3.14   -1.56   -3.14 |    3.14    1.56    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.08   -0.05   -0.05 |    0.09    0.08    0.07
a_f      |   -0.01   -0.03 |    0.66

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.3015   1.0756   4.3739  37.2774  23.1806  15.1808
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0012   0.0007   0.0025   6.6368   2.2852   2.4929
Update Cnt = 3170    ET =    946.3   Stats:  Mean, Std, Min, Max
r_f      |   10.09   14.10   -6.23 |  177.52  181.40  200.74 | -387.20 -385.27 -382.94 |  398.09  388.96  391.89
v_f      |   -0.00   -0.00    0.00 |    0.05    0.04    0.05 |   -0.09   -0.10   -0.10 |    0.09    0.09    0.10
r_i      |   37.32   33.90   -0.01 |  683.96  646.20  772.32 |-1306.74-1334.89-1297.23 | 1287.28 1316.27 1266.60
v_i      |   -0.00   -0.00   -0.00 |    0.04    0.04    0.05 |   -0.09   -0.09   -0.10 |    0.09    0.09    0.10
norm_rf  |    0.21 |    0.08 |    0.03 |    0.42
norm_vf  |    0.08 |    0.01 |    0.04 |    0.13
gs_f     |    1.34 |    1.97 |    0.01 |   18.77
thrust   |   -0.00   -0.00    0.00 |    0.69    0.68    0.69 |   -3.43   -3.44   -3.46 |    3.45    3.45    3.46
norm_thrust |    

ADV1:  0.0010480432466014235 0.005253269001286259 0.04799553681376917 -0.033583809631135275
ADV2:  -0.021419151105252575 0.911352308407756 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.8643   0.9840   5.3709  37.2774  23.1806  15.1808
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0013   0.0007   0.0027   6.6368   2.2852   2.4929
***** Episode 98595, Mean R = -16.1  Std R = 4.5  Min R = -27.7
PolicyLoss: 0.00435
Policy_Beta: 0.114
Policy_Entropy: 0.167
Policy_KL: 0.0012
Policy_SD: 0.52
Policy_lr_mult: 0.0878
Steps: 1.16e+04
TotalSteps: 3.64e+07
VF_0_ExplainedVarNew: 0.995
VF_0_ExplainedVarOld: 0.994
VF_0_Loss : 2.38e-05


ADV1:  0.0009456040046995471 0.008145224440724888 0.042941241262872104 -0.13260769188507815
ADV2:  0.022403625046253074 0.7024374703646675 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.6267   0.7924   4.0684  37.2774  23.1806  15.1808
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0013   0.0008   0.0026   6.6368   2.2852   2

***** Episode 98843, Mean R = -17.6  Std R = 5.9  Min R = -35.3
PolicyLoss: -0.0244
Policy_Beta: 0.114
Policy_Entropy: 0.167
Policy_KL: 0.00112
Policy_SD: 0.528
Policy_lr_mult: 0.0878
Steps: 1.18e+04
TotalSteps: 3.65e+07
VF_0_ExplainedVarNew: 0.994
VF_0_ExplainedVarOld: 0.991
VF_0_Loss : 5.11e-05


ADV1:  -0.0024883594924218484 0.009749442887520365 0.04250377261899213 -0.06875964527807027
ADV2:  0.04070000883092979 0.8711591309312816 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.9732   0.5482   2.6789  37.2774  23.1806  15.1808
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0028   0.0018   0.0065   6.6368   2.2852   2.4929
***** Episode 98874, Mean R = -17.8  Std R = 5.9  Min R = -34.5
PolicyLoss: -0.0248
Policy_Beta: 0.114
Policy_Entropy: 0.167
Policy_KL: 0.000737
Policy_SD: 0.532
Policy_lr_mult: 0.0878
Steps: 1.17e+04
TotalSteps: 3.65e+07
VF_0_ExplainedVarNew: 0.98
VF_0_ExplainedVarOld: 0.978
VF_0_Loss : 9.7e-05


ADV1:  0.005118102732624881 0.006228387716569985

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.8467   0.9575   4.6703  37.2774  23.1806  15.1808
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0005   0.0002   0.0009   6.6368   2.2852   2.4929
***** Episode 99122, Mean R = -19.0  Std R = 6.6  Min R = -35.9
PolicyLoss: -0.0258
Policy_Beta: 0.114
Policy_Entropy: 0.168
Policy_KL: 0.00147
Policy_SD: 0.529
Policy_lr_mult: 0.0878
Steps: 1.16e+04
TotalSteps: 3.66e+07
VF_0_ExplainedVarNew: 0.985
VF_0_ExplainedVarOld: 0.982
VF_0_Loss : 8.57e-05


ADV1:  0.0003965330108309042 0.009866248381084453 0.19759751158773275 -0.06865331967016707
ADV2:  0.0008921301524397608 0.8001857353110504 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.6238   1.0139   5.4487  37.2774  23.1806  15.1808
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0006   0.0003   0.0014   6.6368   2.2852   2.4929
***** Episode 99153, Mean R = -18.2  Std R = 6.0  Min R = -31.7
PolicyLoss: -0.00666
Policy_Beta: 0.114
Policy_Entropy: 0.169
Policy_KL: 0.0

ADV1:  0.000252495062326498 0.008085981611371439 0.07115012868778853 -0.08064648795809914
ADV2:  0.019384500144632374 0.8480780336364536 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.8025   0.9083   4.4680  37.2774  23.1806  15.1808
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0004   0.0002   0.0008   6.6368   2.2852   2.4929
***** Episode 99401, Mean R = -15.9  Std R = 4.6  Min R = -25.9
PolicyLoss: -0.0257
Policy_Beta: 0.114
Policy_Entropy: 0.169
Policy_KL: 0.000752
Policy_SD: 0.519
Policy_lr_mult: 0.0878
Steps: 1.19e+04
TotalSteps: 3.67e+07
VF_0_ExplainedVarNew: 0.988
VF_0_ExplainedVarOld: 0.984
VF_0_Loss : 7.09e-05


ADV1:  -0.0006316785311346101 0.007738485714806138 0.0730583764490701 -0.07201957892029331
ADV2:  0.021655063918033506 0.8429521101439292 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.6642   1.5329   8.1521  37.2774  23.1806  15.1808
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0010   0.0005   0.0022   6.6368   2.2852   2

***** Episode 99649, Mean R = -17.8  Std R = 5.0  Min R = -36.3
PolicyLoss: -0.0247
Policy_Beta: 0.114
Policy_Entropy: 0.166
Policy_KL: 0.0009
Policy_SD: 0.546
Policy_lr_mult: 0.0878
Steps: 1.16e+04
TotalSteps: 3.68e+07
VF_0_ExplainedVarNew: 0.984
VF_0_ExplainedVarOld: 0.982
VF_0_Loss : 0.000145


ADV1:  -0.0015957691006776601 0.0080940059997298 0.054715525843035295 -0.06811890146330202
ADV2:  0.025033781900663993 0.8816542552327535 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.3360   1.1321   6.4032  37.2774  23.1806  15.1808
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0028   0.0016   0.0062   6.6368   2.2852   2.4929
***** Episode 99680, Mean R = -17.6  Std R = 5.2  Min R = -30.8
PolicyLoss: -0.0152
Policy_Beta: 0.114
Policy_Entropy: 0.165
Policy_KL: 0.00131
Policy_SD: 0.537
Policy_lr_mult: 0.0878
Steps: 1.17e+04
TotalSteps: 3.68e+07
VF_0_ExplainedVarNew: 0.988
VF_0_ExplainedVarOld: 0.986
VF_0_Loss : 6.73e-05


ADV1:  -0.001143166752014023 0.01075975301486161

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.5466   1.0497   5.3856  37.2774  23.1806  15.1808
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0023   0.0014   0.0051   6.6368   2.2852   2.4929
***** Episode 99928, Mean R = -18.8  Std R = 4.2  Min R = -27.8
PolicyLoss: -0.0239
Policy_Beta: 0.114
Policy_Entropy: 0.166
Policy_KL: 0.00124
Policy_SD: 0.543
Policy_lr_mult: 0.0878
Steps: 1.17e+04
TotalSteps: 3.69e+07
VF_0_ExplainedVarNew: 0.983
VF_0_ExplainedVarOld: 0.979
VF_0_Loss : 0.000101


ADV1:  -0.0005632211909509037 0.007702674576061038 0.05044521732135604 -0.05701203384686293
ADV2:  0.014227011762178388 0.8550927830962317 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.2467   1.2170   5.5345  37.2774  23.1806  15.1808
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0007   0.0004   0.0016   6.6368   2.2852   2.4929
***** Episode 99959, Mean R = -16.7  Std R = 4.6  Min R = -28.2
PolicyLoss: -0.0126
Policy_Beta: 0.114
Policy_Entropy: 0.169
Policy_KL: 0.00

ADV1:  0.0012736000085436894 0.00858088975388517 0.09575068398978248 -0.07339180709479681
ADV2:  0.001434763199321836 0.7986932448247412 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.8530   0.9737   5.2968  37.2774  23.1806  15.1808
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0017   0.0010   0.0041   6.6368   2.2852   2.4929
***** Episode 100207, Mean R = -17.8  Std R = 6.1  Min R = -41.7
PolicyLoss: -0.0167
Policy_Beta: 0.114
Policy_Entropy: 0.168
Policy_KL: 0.00121
Policy_SD: 0.527
Policy_lr_mult: 0.0878
Steps: 1.18e+04
TotalSteps: 3.7e+07
VF_0_ExplainedVarNew: 0.987
VF_0_ExplainedVarOld: 0.985
VF_0_Loss : 0.000162


ADV1:  -0.000576458874222711 0.00860040166236696 0.06441563486926183 -0.05734649781911838
ADV2:  0.01713897645183803 0.8602079549418731 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.1770   1.2466   6.1495  37.2774  23.1806  15.1808
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0009   0.0005   0.0019   6.6368   2.2852   2.49

seeker_angles |   -0.00    0.00 |    0.09    0.08 |   -0.99   -1.00 |    0.95    1.00
cs_angles | -0.0018  0.0010 |  0.0853  0.0827 | -0.9944 -0.9973 |  0.9491  0.9995
optical_flow | -0.0001  0.0000 |  0.0236  0.0238 | -1.1843 -1.1930 |  0.9923  1.3381
v_err    | -0.0091 |  0.0551 | -0.4525 |  0.0976
landing_rewards |    9.55 |    2.08 |    0.00 |   10.00
landing_margin |   -0.02 |    0.01 |   -0.06 |    0.01
tracking_rewards |  -22.37 |    4.46 |  -37.12 |  -13.60
steps    |     377 |      21 |     332 |     418
***** Episode 100486, Mean R = -17.3  Std R = 4.6  Min R = -30.2
PolicyLoss: -0.0221
Policy_Beta: 0.114
Policy_Entropy: 0.169
Policy_KL: 0.0011
Policy_SD: 0.522
Policy_lr_mult: 0.0878
Steps: 1.16e+04
TotalSteps: 3.71e+07
VF_0_ExplainedVarNew: 0.987
VF_0_ExplainedVarOld: 0.986
VF_0_Loss : 0.000241


ADV1:  -0.0016187711521273933 0.007141392117181835 0.08680686296893358 -0.04756017780394123
ADV2:  0.03375722869257977 0.8324468295573553 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/

attitude |    0.09    0.05    0.27 |    1.33    0.63    1.95 |   -3.14   -1.57   -3.14 |    3.14    1.57    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.08   -0.05   -0.05 |    0.09    0.07    0.07
a_f      |    0.05    0.23 |    0.63    1.98 |   -1.24   -3.13 |    1.53    3.13
w_f      |    0.00   -0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.03   -0.02 |    0.03    0.02    0.02
w_rewards |   -0.27 |    0.28 |   -2.32 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.26 |    0.31 |    0.00 |    3.02
seeker_angles |    0.00   -0.00 |    0.09    0.08 |   -1.00   -0.96 |    1.00    1.00
cs_angles |  0.0025 -0.0002 |  0.0857  0.0803 | -0.9983 -0.9558 |  0.9987  0.9958
optical_flow | -0.0000  0.0001 |  0.0236  0.0247 | -1.2747 -1.1907 |  1.1406  1.1177
v_err    | -0.0089 |  0.0548 | -0.4525 |  0.1101
landing_rewards |    9.65 |    1.85 |    0.00 |   10.00
landing_margin |   -0

attitude |    0.07   -0.01    0.09 |    1.14    0.62    1.82 |   -3.14   -1.57   -3.14 |    3.14    1.57    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.09   -0.07   -0.08 |    0.08    0.07    0.07
a_f      |   -0.02    0.09 |    0.63    1.83 |   -1.51   -3.13 |    1.44    3.11
w_f      |    0.00   -0.00    0.00 |    0.01    0.01    0.01 |   -0.02   -0.03   -0.03 |    0.03    0.02    0.02
w_rewards |   -0.30 |    0.43 |   -6.16 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.25 |    0.30 |    0.00 |    2.89
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -1.00   -0.99 |    1.00    0.99
cs_angles |  0.0025  0.0021 |  0.0827  0.0808 | -0.9963 -0.9932 |  0.9976  0.9900
optical_flow |  0.0000  0.0000 |  0.0253  0.0260 | -1.1788 -1.3064 |  1.1329  1.0847
v_err    | -0.0088 |  0.0558 | -0.6587 |  0.1034
landing_rewards |    9.55 |    2.08 |    0.00 |   10.00
landing_margin |   -0

attitude |    0.08   -0.02   -0.15 |    1.14    0.62    1.77 |   -3.14   -1.54   -3.14 |    3.14    1.53    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.08   -0.05   -0.05 |    0.09    0.07    0.07
a_f      |   -0.02   -0.15 |    0.63    1.78 |   -1.45   -3.12 |    1.46    3.14
w_f      |    0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.03   -0.02 |    0.03    0.02    0.02
w_rewards |   -0.28 |    0.32 |   -2.58 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.26 |    0.31 |    0.00 |    3.02
seeker_angles |    0.00    0.00 |    0.09    0.08 |   -1.00   -1.00 |    1.00    0.99
cs_angles |  0.0004  0.0028 |  0.0859  0.0829 | -0.9957 -0.9998 |  0.9968  0.9938
optical_flow |  0.0000 -0.0001 |  0.0256  0.0251 | -1.1618 -1.1997 |  1.1423  1.1943
v_err    | -0.0084 |  0.0547 | -0.4526 |  0.1138
landing_rewards |    9.19 |    2.72 |    0.00 |   10.00
landing_margin |   -0

thrust   |    0.00    0.00   -0.01 |    0.68    0.68    0.69 |   -3.38   -3.46   -3.46 |    3.39    3.44    3.45
norm_thrust |    0.90 |    0.76 |    0.00 |    3.46
fuel     |    1.54 |    0.17 |    1.06 |    2.27
rewards  |  -17.39 |    5.62 |  -57.18 |   -7.79
fuel_rewards |   -4.42 |    0.50 |   -6.51 |   -3.03
glideslope_rewards |    0.00 |    0.00 |    0.00 |    0.00
glideslope_penalty |    0.00 |    0.00 |    0.00 |    0.00
glideslope |    2.78 |   12.45 |    0.01 |  460.90
norm_af  |    1.82 |    0.90 |    0.10 |    3.29
norm_wf  |    0.01 |    0.01 |    0.00 |    0.03
rh_penalty |    0.00 |    0.00 |    0.00 |    0.00
att_rewards |    0.00 |    0.00 |    0.00 |    0.00
att_penalty |    0.00 |    0.00 |    0.00 |    0.00
attitude |   -0.02    0.03    0.08 |    1.29    0.69    1.90 |   -3.14   -1.56   -3.14 |    3.14    1.57    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.07   -0.05   -0.05 |    0.08    0.07    0.07
a_f      |    0.02    0.11 |    0.69

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.8062   0.5586   3.1800  37.2774  23.1806  15.1808
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0022   0.0014   0.0053   6.6368   2.2852   2.4929
Update Cnt = 3290    ET =    941.3   Stats:  Mean, Std, Min, Max
r_f      |    3.15    2.34    1.01 |  188.70  170.40  201.93 | -377.41 -376.52 -388.50 |  396.03  374.46  398.91
v_f      |   -0.00   -0.00   -0.00 |    0.05    0.04    0.05 |   -0.12   -0.09   -0.09 |    0.09    0.10    0.09
r_i      |    1.84   13.76   13.63 |  677.85  679.68  765.14 |-1289.04-1302.23-1297.72 | 1318.53 1267.71 1316.97
v_i      |   -0.00   -0.00    0.00 |    0.04    0.04    0.05 |   -0.09   -0.09   -0.09 |    0.09    0.09    0.10
norm_rf  |    0.20 |    0.08 |    0.03 |    0.47
norm_vf  |    0.08 |    0.01 |    0.04 |    0.14
gs_f     |    1.27 |    2.15 |    0.01 |   20.72
thrust   |    0.00   -0.00    0.00 |    0.68    0.68    0.68 |   -3.38   -3.46   -3.38 |    3.43    3.46    3.45
norm_thrust |    

ADV1:  0.004121577058758274 0.007922741797501954 0.17486451107999457 -0.06381203080017933
ADV2:  -0.019450445660182347 0.8383667842336566 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.2645   0.5786   3.0885  37.2774  23.1806  15.1808
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0042   0.0026   0.0105   6.6368   2.2852   2.4929
***** Episode 102315, Mean R = -17.8  Std R = 7.5  Min R = -45.3
PolicyLoss: -0.0138
Policy_Beta: 0.114
Policy_Entropy: 0.166
Policy_KL: 0.0009
Policy_SD: 0.531
Policy_lr_mult: 0.0878
Steps: 1.17e+04
TotalSteps: 3.78e+07
VF_0_ExplainedVarNew: 0.99
VF_0_ExplainedVarOld: 0.988
VF_0_Loss : 0.00017


ADV1:  0.0013451349242661033 0.006997668572719141 0.0596896960895788 -0.11178355803950346
ADV2:  0.00766899514186164 0.8135793989514576 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.1678   0.5805   2.8891  37.2774  23.1806  15.1808
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0020   0.0011   0.0040   6.6368   2.2852   2.492

***** Episode 102563, Mean R = -17.4  Std R = 5.3  Min R = -31.6
PolicyLoss: -0.0175
Policy_Beta: 0.114
Policy_Entropy: 0.166
Policy_KL: 0.00102
Policy_SD: 0.53
Policy_lr_mult: 0.0878
Steps: 1.16e+04
TotalSteps: 3.79e+07
VF_0_ExplainedVarNew: 0.971
VF_0_ExplainedVarOld: 0.968
VF_0_Loss : 0.000279


ADV1:  0.00469785123534637 0.008816844781174957 0.04300368061051083 -0.05632761564941091
ADV2:  -0.018381628639215768 0.8926598031500039 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.2873   1.0572   5.3136  37.2774  23.1806  15.1808
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0048   0.0030   0.0123   6.6368   2.2852   2.4929
***** Episode 102594, Mean R = -18.0  Std R = 9.9  Min R = -60.3
PolicyLoss: -0.0234
Policy_Beta: 0.114
Policy_Entropy: 0.166
Policy_KL: 0.00123
Policy_SD: 0.536
Policy_lr_mult: 0.0878
Steps: 1.16e+04
TotalSteps: 3.79e+07
VF_0_ExplainedVarNew: 0.991
VF_0_ExplainedVarOld: 0.986
VF_0_Loss : 0.000171


ADV1:  0.0008089804454404081 0.0075654841428834

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.0345   1.0720   4.9713  37.2774  23.1806  15.1808
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0009   0.0005   0.0020   6.6368   2.2852   2.4929
***** Episode 102842, Mean R = -16.9  Std R = 4.2  Min R = -28.8
PolicyLoss: -0.0307
Policy_Beta: 0.114
Policy_Entropy: 0.167
Policy_KL: 0.00087
Policy_SD: 0.537
Policy_lr_mult: 0.0878
Steps: 1.16e+04
TotalSteps: 3.8e+07
VF_0_ExplainedVarNew: 0.989
VF_0_ExplainedVarOld: 0.988
VF_0_Loss : 0.000251


ADV1:  -0.0003653954505502781 0.009022164228164582 0.04999710086235437 -0.062392283028949724
ADV2:  0.02250147941159028 0.8627684804887907 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.0869   0.9878   4.6994  37.2774  23.1806  15.1808
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0003   0.0002   0.0010   6.6368   2.2852   2.4929
***** Episode 102873, Mean R = -17.1  Std R = 4.8  Min R = -27.8
PolicyLoss: -0.024
Policy_Beta: 0.114
Policy_Entropy: 0.166
Policy_KL: 0.00

ADV1:  0.00017889584820409695 0.007502149986086644 0.08191584147491116 -0.0915715277528028
ADV2:  0.023011236998885454 0.7939550778473239 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.2188   1.1705   5.8884  37.2774  23.1806  15.1808
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0002   0.0002   0.0007   6.6368   2.2852   2.4929
***** Episode 103121, Mean R = -17.7  Std R = 6.4  Min R = -36.1
PolicyLoss: -0.029
Policy_Beta: 0.114
Policy_Entropy: 0.167
Policy_KL: 0.001
Policy_SD: 0.538
Policy_lr_mult: 0.0878
Steps: 1.16e+04
TotalSteps: 3.81e+07
VF_0_ExplainedVarNew: 0.991
VF_0_ExplainedVarOld: 0.989
VF_0_Loss : 0.00027


ADV1:  4.990020979575018e-06 0.006793938176757441 0.058670709810819954 -0.07109184879259856
ADV2:  0.010995001769698688 0.8157206076772028 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   5.1542   2.2778  10.8273  37.2774  23.1806  15.1808
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0002   0.0001   0.0004   6.6368   2.2852   2.4

***** Episode 103369, Mean R = -16.4  Std R = 4.6  Min R = -26.1
PolicyLoss: 0.0117
Policy_Beta: 0.114
Policy_Entropy: 0.168
Policy_KL: 0.0011
Policy_SD: 0.523
Policy_lr_mult: 0.0878
Steps: 1.15e+04
TotalSteps: 3.82e+07
VF_0_ExplainedVarNew: 0.994
VF_0_ExplainedVarOld: 0.99
VF_0_Loss : 6.15e-05


ADV1:  -0.002904503272058441 0.008688794981123307 0.04451477296611839 -0.06894061529083592
ADV2:  0.04564350656574233 0.8611427381750294 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.1675   1.0440   5.4073  37.2774  23.1806  15.1808
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0032   0.0020   0.0075   6.6368   2.2852   2.4929
***** Episode 103400, Mean R = -17.1  Std R = 5.1  Min R = -28.3
PolicyLoss: -0.0277
Policy_Beta: 0.114
Policy_Entropy: 0.165
Policy_KL: 0.00109
Policy_SD: 0.537
Policy_lr_mult: 0.0878
Steps: 1.16e+04
TotalSteps: 3.82e+07
VF_0_ExplainedVarNew: 0.984
VF_0_ExplainedVarOld: 0.983
VF_0_Loss : 0.000163


ADV1:  0.0021937911139120365 0.006267861375890102

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.3887   0.5297   2.7237  37.2774  23.1806  15.1808
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0008   0.0005   0.0017   6.6368   2.2852   2.4929
***** Episode 103648, Mean R = -17.9  Std R = 5.5  Min R = -32.9
PolicyLoss: -0.0209
Policy_Beta: 0.114
Policy_Entropy: 0.168
Policy_KL: 0.00121
Policy_SD: 0.536
Policy_lr_mult: 0.0878
Steps: 1.16e+04
TotalSteps: 3.83e+07
VF_0_ExplainedVarNew: 0.986
VF_0_ExplainedVarOld: 0.984
VF_0_Loss : 0.000185


ADV1:  -0.0006920074904423383 0.007991131780234565 0.16948955526172005 -0.0616599309586755
ADV2:  0.020286544331724166 0.8278403274989596 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.6301   1.2244   5.6568  37.2774  23.1806  15.1808
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0009   0.0005   0.0021   6.6368   2.2852   2.4929
***** Episode 103679, Mean R = -17.5  Std R = 5.3  Min R = -32.4
PolicyLoss: -0.0176
Policy_Beta: 0.114
Policy_Entropy: 0.167
Policy_KL: 0.0

ADV1:  -0.0014098688896912787 0.007363190083670326 0.03873938719867953 -0.060283645116923856
ADV2:  0.03687698852197329 0.8530388328593131 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.7466   0.8791   4.2864  37.2774  23.1806  15.1808
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0018   0.0011   0.0037   6.6368   2.2852   2.4929
***** Episode 103927, Mean R = -17.9  Std R = 4.7  Min R = -25.3
PolicyLoss: -0.0276
Policy_Beta: 0.114
Policy_Entropy: 0.169
Policy_KL: 0.00119
Policy_SD: 0.536
Policy_lr_mult: 0.0878
Steps: 1.17e+04
TotalSteps: 3.84e+07
VF_0_ExplainedVarNew: 0.99
VF_0_ExplainedVarOld: 0.989
VF_0_Loss : 0.000123


ADV1:  -0.0004841332931252885 0.01019001594408343 0.06817464994141542 -0.10077319673144491
ADV2:  0.025339982514738273 0.8635731219307389 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.1992   1.0498   4.2370  37.2774  23.1806  15.1808
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0011   0.0006   0.0022   6.6368   2.2852   

seeker_angles |    0.00    0.00 |    0.09    0.08 |   -0.96   -1.00 |    0.99    0.99
cs_angles |  0.0027  0.0010 |  0.0853  0.0821 | -0.9643 -0.9999 |  0.9907  0.9949
optical_flow |  0.0000 -0.0000 |  0.0233  0.0247 | -1.0646 -1.0609 |  0.9695  1.1548
v_err    | -0.0092 |  0.0551 | -0.4536 |  0.1331
landing_rewards |    9.39 |    2.40 |    0.00 |   10.00
landing_margin |   -0.02 |    0.01 |   -0.05 |    0.01
tracking_rewards |  -22.46 |    4.31 |  -39.44 |  -13.65
steps    |     376 |      20 |     333 |     414
***** Episode 104206, Mean R = -19.3  Std R = 7.2  Min R = -38.7
PolicyLoss: -0.015
Policy_Beta: 0.114
Policy_Entropy: 0.17
Policy_KL: 0.000829
Policy_SD: 0.539
Policy_lr_mult: 0.0878
Steps: 1.16e+04
TotalSteps: 3.85e+07
VF_0_ExplainedVarNew: 0.977
VF_0_ExplainedVarOld: 0.973
VF_0_Loss : 0.000302


ADV1:  0.003573779068267247 0.009518057633823549 0.05137185333626809 -0.05117575695201893
ADV2:  -0.01561090420925057 0.8955174581794977 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/M

fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.26 |    0.30 |    0.00 |    3.01
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -0.97   -0.99 |    0.99    0.99
cs_angles |  0.0012  0.0008 |  0.0828  0.0812 | -0.9715 -0.9872 |  0.9908  0.9939
optical_flow |  0.0000  0.0001 |  0.0224  0.0239 | -0.8143 -1.1626 |  1.2268  0.9511
v_err    | -0.0091 |  0.0548 | -0.4532 |  0.1085
landing_rewards |    9.23 |    2.67 |    0.00 |   10.00
landing_margin |   -0.02 |    0.01 |   -0.06 |    0.01
tracking_rewards |  -22.05 |    4.39 |  -40.28 |  -13.84
steps    |     376 |      21 |     330 |     418
***** Episode 104516, Mean R = -18.3  Std R = 6.2  Min R = -32.9
PolicyLoss: -0.0322
Policy_Beta: 0.114
Policy_Entropy: 0.168
Policy_KL: 0.000923
Policy_SD: 0.537
Policy_lr_mult: 0.0878
Steps: 1.17e+04
TotalSteps: 3.86e+07
VF_0_ExplainedVarNew: 0.988
VF_0_ExplainedVarOld: 0.987
VF_0_Loss : 0.000371


ADV1:  -0.0014250226441173102 0.009809365978518308 0.04760719206030156 -0.1004

attitude |    0.00    0.01   -0.22 |    1.14    0.66    1.79 |   -3.14   -1.56   -3.14 |    3.14    1.55    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.08   -0.05   -0.05 |    0.09    0.07    0.08
a_f      |    0.01   -0.32 |    0.66    1.79 |   -1.51   -3.14 |    1.46    3.13
w_f      |    0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.02   -0.02   -0.02 |    0.03    0.02    0.03
w_rewards |   -0.30 |    0.34 |   -2.82 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.27 |    0.31 |    0.00 |    2.81
seeker_angles |    0.00   -0.00 |    0.09    0.08 |   -0.99   -1.00 |    0.96    0.98
cs_angles |  0.0006 -0.0004 |  0.0850  0.0841 | -0.9860 -0.9983 |  0.9635  0.9781
optical_flow |  0.0001  0.0000 |  0.0241  0.0245 | -1.0165 -1.0313 |  1.1304  0.9488
v_err    | -0.0089 |  0.0549 | -0.4754 |  0.1063
landing_rewards |    9.55 |    2.08 |    0.00 |   10.00
landing_margin |   -0

w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.07   -0.05   -0.05 |    0.09    0.07    0.07
a_f      |    0.07    0.16 |    0.60    1.89 |   -1.51   -3.12 |    1.48    3.13
w_f      |    0.00   -0.00    0.00 |    0.01    0.01    0.01 |   -0.02   -0.03   -0.02 |    0.03    0.03    0.02
w_rewards |   -0.32 |    0.30 |   -2.60 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.27 |    0.31 |    0.00 |    2.69
seeker_angles |   -0.00    0.00 |    0.09    0.08 |   -0.99   -0.92 |    1.00    0.99
cs_angles | -0.0016  0.0037 |  0.0890  0.0827 | -0.9879 -0.9242 |  0.9971  0.9917
optical_flow |  0.0000  0.0001 |  0.0234  0.0244 | -0.9704 -1.1379 |  1.1368  1.1552
v_err    | -0.0093 |  0.0547 | -0.4522 |  0.1150
landing_rewards |    9.55 |    2.08 |    0.00 |   10.00
landing_margin |   -0.02 |    0.01 |   -0.06 |    0.02
tracking_rewards |  -22.70 |    5.51 |  -79.15 |  -14.97
steps    |     377 |  

attitude |    0.10    0.00    0.00 |    1.19    0.69    1.81 |   -3.14   -1.56   -3.14 |    3.14    1.56    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.08   -0.05   -0.05 |    0.09    0.07    0.07
a_f      |   -0.01   -0.02 |    0.68    1.79 |   -1.48   -3.13 |    1.32    3.14
w_f      |    0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.02   -0.03   -0.03 |    0.04    0.03    0.02
w_rewards |   -0.30 |    0.34 |   -2.89 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.26 |    0.30 |    0.00 |    2.91
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -0.99   -0.96 |    0.99    1.00
cs_angles |  0.0031  0.0005 |  0.0817  0.0805 | -0.9913 -0.9600 |  0.9932  0.9962
optical_flow | -0.0001 -0.0001 |  0.0247  0.0247 | -1.1153 -1.1806 |  1.0588  0.9183
v_err    | -0.0092 |  0.0548 | -0.4531 |  0.1060
landing_rewards |    9.55 |    2.08 |    0.00 |   10.00
landing_margin |   -0

attitude |   -0.01   -0.02    0.09 |    1.10    0.69    1.74 |   -3.14   -1.54   -3.14 |    3.14    1.54    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.08   -0.05   -0.05 |    0.08    0.07    0.07
a_f      |   -0.02    0.15 |    0.70    1.73 |   -1.53   -3.12 |    1.49    3.13
w_f      |    0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.02   -0.02   -0.02 |    0.03    0.02    0.02
w_rewards |   -0.29 |    0.28 |   -2.60 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.26 |    0.30 |    0.00 |    2.89
seeker_angles |    0.00    0.00 |    0.09    0.08 |   -0.99   -1.00 |    0.99    0.97
cs_angles |  0.0010  0.0008 |  0.0854  0.0832 | -0.9883 -0.9989 |  0.9922  0.9681
optical_flow | -0.0000  0.0001 |  0.0240  0.0236 | -1.0818 -1.0293 |  1.0833  1.0326
v_err    | -0.0093 |  0.0549 | -0.4567 |  0.1098
landing_rewards |    9.58 |    2.00 |    0.00 |   10.00
landing_margin |   -0

w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.07   -0.05   -0.05 |    0.07    0.07    0.08
a_f      |    0.00   -0.08 |    0.67    1.89 |   -1.46   -3.13 |    1.46    3.13
w_f      |    0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.02   -0.02   -0.02 |    0.03    0.02    0.02
w_rewards |   -0.26 |    0.22 |   -1.45 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.25 |    0.30 |    0.00 |    2.74
seeker_angles |   -0.00   -0.00 |    0.08    0.08 |   -1.00   -1.00 |    0.99    1.00
cs_angles | -0.0006 -0.0018 |  0.0840  0.0828 | -0.9990 -0.9982 |  0.9914  0.9980
optical_flow | -0.0000  0.0001 |  0.0243  0.0250 | -1.1321 -1.1902 |  1.1162  1.1052
v_err    | -0.0092 |  0.0549 | -0.4526 |  0.0996
landing_rewards |    9.68 |    1.77 |    0.00 |   10.00
landing_margin |   -0.02 |    0.01 |   -0.06 |    0.03
tracking_rewards |  -22.01 |    4.08 |  -33.28 |  -14.41
steps    |     378 |  

w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.08   -0.05   -0.05 |    0.09    0.07    0.07
a_f      |   -0.02    0.06 |    0.67    1.84 |   -1.49   -3.11 |    1.47    3.13
w_f      |    0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.02   -0.03   -0.02 |    0.03    0.02    0.02
w_rewards |   -0.31 |    0.33 |   -2.31 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.25 |    0.30 |    0.00 |    3.01
seeker_angles |   -0.00   -0.00 |    0.09    0.08 |   -0.98   -1.00 |    0.94    0.99
cs_angles | -0.0008 -0.0003 |  0.0851  0.0836 | -0.9830 -1.0000 |  0.9411  0.9939
optical_flow |  0.0001 -0.0001 |  0.0244  0.0254 | -1.3120 -1.1309 |  1.0291  1.2093
v_err    | -0.0091 |  0.0551 | -0.4566 |  0.1251
landing_rewards |    9.55 |    2.08 |    0.00 |   10.00
landing_margin |   -0.02 |    0.01 |   -0.05 |    0.01
tracking_rewards |  -22.20 |    4.74 |  -49.03 |  -14.17
steps    |     379 |  

attitude |   -0.02    0.03   -0.19 |    1.20    0.64    1.86 |   -3.14   -1.54   -3.14 |    3.14    1.56    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.08   -0.05   -0.05 |    0.09    0.07    0.07
a_f      |    0.03   -0.24 |    0.64    1.87 |   -1.43   -3.13 |    1.55    3.12
w_f      |    0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.02   -0.02   -0.02 |    0.02    0.03    0.02
w_rewards |   -0.30 |    0.29 |   -1.82 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.25 |    0.30 |    0.00 |    3.03
seeker_angles |    0.00   -0.00 |    0.08    0.08 |   -0.98   -0.95 |    0.98    0.99
cs_angles |  0.0019 -0.0003 |  0.0796  0.0830 | -0.9779 -0.9523 |  0.9822  0.9940
optical_flow | -0.0001 -0.0001 |  0.0247  0.0252 | -1.0516 -1.0317 |  1.3245  1.0710
v_err    | -0.0092 |  0.0550 | -0.4532 |  0.1012
landing_rewards |    9.65 |    1.85 |    0.00 |   10.00
landing_margin |   -0

thrust   |   -0.00    0.00    0.00 |    0.68    0.68    0.69 |   -3.42   -3.44   -3.39 |    3.32    3.46    3.43
norm_thrust |    0.90 |    0.76 |    0.00 |    3.46
fuel     |    1.55 |    0.19 |    1.08 |    2.19
rewards  |  -17.05 |    5.39 |  -34.11 |   -7.44
fuel_rewards |   -4.43 |    0.55 |   -6.28 |   -3.09
glideslope_rewards |    0.00 |    0.00 |    0.00 |    0.00
glideslope_penalty |    0.00 |    0.00 |    0.00 |    0.00
glideslope |    2.96 |   13.16 |    0.01 |  309.33
norm_af  |    1.74 |    0.90 |    0.08 |    3.42
norm_wf  |    0.01 |    0.01 |    0.00 |    0.03
rh_penalty |    0.00 |    0.00 |    0.00 |    0.00
att_rewards |    0.00 |    0.00 |    0.00 |    0.00
att_penalty |    0.00 |    0.00 |    0.00 |    0.00
attitude |   -0.06    0.00    0.08 |    1.24    0.70    1.83 |   -3.14   -1.56   -3.14 |    3.14    1.55    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.08   -0.05   -0.05 |    0.10    0.07    0.07
a_f      |   -0.00    0.05 |    0.70

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.9459   1.2098   6.6929  37.2774  23.1806  15.1808
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0018   0.0010   0.0038   6.6368   2.2852   2.4929
Update Cnt = 3460    ET =   1092.7   Stats:  Mean, Std, Min, Max
r_f      |    5.00   10.21    4.27 |  182.90  167.88  208.05 | -387.77 -366.91 -382.73 |  394.85  381.59  390.51
v_f      |   -0.00    0.00   -0.00 |    0.05    0.04    0.05 |   -0.09   -0.09   -0.10 |    0.09    0.10    0.10
r_i      |   16.43   23.05   42.94 |  696.07  637.64  770.29 |-1381.73-1270.35-1264.68 | 1300.25 1260.88 1306.53
v_i      |   -0.00   -0.00   -0.00 |    0.04    0.04    0.05 |   -0.09   -0.09   -0.10 |    0.09    0.09    0.09
norm_rf  |    0.20 |    0.08 |    0.04 |    0.48
norm_vf  |    0.08 |    0.01 |    0.04 |    0.12
gs_f     |    1.13 |    1.32 |    0.01 |   10.79
thrust   |   -0.00    0.00    0.01 |    0.70    0.69    0.70 |   -3.46   -3.42   -3.45 |    3.45    3.44    3.45
norm_thrust |    

ADV1:  -0.0004265263874407279 0.008243118629738984 0.05698316894479616 -0.08341949674261592
ADV2:  0.034108622037785336 0.8001291953200148 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.7482   0.8838   3.7422  37.2774  23.1806  15.1808
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0009   0.0006   0.0019   6.6368   2.2852   2.4929
***** Episode 107585, Mean R = -17.3  Std R = 5.5  Min R = -31.4
PolicyLoss: -0.0349
Policy_Beta: 0.114
Policy_Entropy: 0.166
Policy_KL: 0.00126
Policy_SD: 0.541
Policy_lr_mult: 0.0878
Steps: 1.16e+04
TotalSteps: 3.97e+07
VF_0_ExplainedVarNew: 0.986
VF_0_ExplainedVarOld: 0.985
VF_0_Loss : 0.000114


ADV1:  0.0005683062775384328 0.0065788193759175224 0.034563062923282706 -0.04566991134618466
ADV2:  0.010455364121991753 0.8856448568335032 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.9512   0.9953   4.1959  37.2774  23.1806  15.1808
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0006   0.0003   0.0015   6.6368   2.2852

***** Episode 107833, Mean R = -15.8  Std R = 5.0  Min R = -33.2
PolicyLoss: -0.0265
Policy_Beta: 0.114
Policy_Entropy: 0.167
Policy_KL: 0.00144
Policy_SD: 0.525
Policy_lr_mult: 0.0878
Steps: 1.17e+04
TotalSteps: 3.98e+07
VF_0_ExplainedVarNew: 0.99
VF_0_ExplainedVarOld: 0.989
VF_0_Loss : 5.88e-05


ADV1:  0.00026495664915316574 0.007717785236429038 0.0348905515240332 -0.06602833729479753
ADV2:  0.02149659358507836 0.8503075470986057 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.9986   1.4275   6.1873  37.2774  23.1806  15.1808
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0004   0.0002   0.0008   6.6368   2.2852   2.4929
***** Episode 107864, Mean R = -15.7  Std R = 5.9  Min R = -33.1
PolicyLoss: -0.028
Policy_Beta: 0.114
Policy_Entropy: 0.168
Policy_KL: 0.00101
Policy_SD: 0.528
Policy_lr_mult: 0.0878
Steps: 1.17e+04
TotalSteps: 3.98e+07
VF_0_ExplainedVarNew: 0.987
VF_0_ExplainedVarOld: 0.985
VF_0_Loss : 9.27e-05


ADV1:  0.00040323486756298335 0.0060741553211111

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   3.9684   1.7711   9.2746  37.2774  23.1806  15.1808
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0018   0.0010   0.0034   6.6368   2.2852   2.4929
***** Episode 108112, Mean R = -16.7  Std R = 5.8  Min R = -30.6
PolicyLoss: -0.0282
Policy_Beta: 0.114
Policy_Entropy: 0.167
Policy_KL: 0.00126
Policy_SD: 0.529
Policy_lr_mult: 0.0878
Steps: 1.18e+04
TotalSteps: 3.99e+07
VF_0_ExplainedVarNew: 0.986
VF_0_ExplainedVarOld: 0.984
VF_0_Loss : 9.26e-05


ADV1:  0.0014522689459506417 0.005276213256639537 0.0487028270073242 -0.035509962963961694
ADV2:  -0.0224131299125181 0.9011372716914168 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   5.5916   2.6413  14.0883  37.2774  23.1806  15.1808
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0023   0.0014   0.0045   6.6368   2.2852   2.4929
***** Episode 108143, Mean R = -16.5  Std R = 5.0  Min R = -29.1
PolicyLoss: -0.00167
Policy_Beta: 0.114
Policy_Entropy: 0.166
Policy_KL: 0.0

ADV1:  0.002132127192471689 0.00846266522415989 0.04429715350992225 -0.052699276303129636
ADV2:  0.004842965301501892 0.8881956162618007 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.7740   0.9406   4.9424  37.2774  23.1806  15.1808
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0038   0.0015   0.0060   6.6368   2.2852   2.4929
***** Episode 108391, Mean R = -15.9  Std R = 5.1  Min R = -28.6
PolicyLoss: -0.0218
Policy_Beta: 0.114
Policy_Entropy: 0.17
Policy_KL: 0.000803
Policy_SD: 0.517
Policy_lr_mult: 0.0878
Steps: 1.16e+04
TotalSteps: 4e+07
VF_0_ExplainedVarNew: 0.986
VF_0_ExplainedVarOld: 0.984
VF_0_Loss : 6.84e-05


ADV1:  0.0021189174214879167 0.008871728408247426 0.048797573557039065 -0.18587057939135843
ADV2:  0.003462269843396552 0.8012823036523521 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.3824   1.3374   7.1529  37.2774  23.1806  15.1808
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0028   0.0012   0.0056   6.6368   2.2852   2.4

***** Episode 108639, Mean R = -17.5  Std R = 6.4  Min R = -35.3
PolicyLoss: -0.0151
Policy_Beta: 0.114
Policy_Entropy: 0.168
Policy_KL: 0.00144
Policy_SD: 0.538
Policy_lr_mult: 0.0878
Steps: 1.18e+04
TotalSteps: 4.01e+07
VF_0_ExplainedVarNew: 0.991
VF_0_ExplainedVarOld: 0.99
VF_0_Loss : 6.13e-05


ADV1:  -0.0013731401139440512 0.00926204679982498 0.06722127495761265 -0.05582046479305349
ADV2:  0.024695410508225914 0.8854772365364426 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   3.7199   1.7292   8.6676  37.2774  23.1806  15.1808
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0020   0.0008   0.0036   6.6368   2.2852   2.4929
***** Episode 108670, Mean R = -18.3  Std R = 6.4  Min R = -37.6
PolicyLoss: -0.0175
Policy_Beta: 0.114
Policy_Entropy: 0.17
Policy_KL: 0.00165
Policy_SD: 0.534
Policy_lr_mult: 0.0878
Steps: 1.18e+04
TotalSteps: 4.02e+07
VF_0_ExplainedVarNew: 0.985
VF_0_ExplainedVarOld: 0.983
VF_0_Loss : 8.3e-05


ADV1:  -0.0013813240164026095 0.0097130760692384

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.4372   0.7425   4.1028  37.2774  23.1806  15.1808
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0020   0.0010   0.0039   6.6368   2.2852   2.4929
***** Episode 108918, Mean R = -17.3  Std R = 5.8  Min R = -33.6
PolicyLoss: -0.0353
Policy_Beta: 0.114
Policy_Entropy: 0.168
Policy_KL: 0.000955
Policy_SD: 0.543
Policy_lr_mult: 0.0878
Steps: 1.14e+04
TotalSteps: 4.02e+07
VF_0_ExplainedVarNew: 0.982
VF_0_ExplainedVarOld: 0.98
VF_0_Loss : 8.17e-05


ADV1:  -0.00034299185296837465 0.007382986071538088 0.045192538134659344 -0.055934971051321114
ADV2:  0.01783801831745513 0.850744481310563 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.7178   1.4529   7.1700  37.2774  23.1806  15.1808
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0007   0.0004   0.0015   6.6368   2.2852   2.4929
***** Episode 108949, Mean R = -18.1  Std R = 6.2  Min R = -38.4
PolicyLoss: -0.0186
Policy_Beta: 0.114
Policy_Entropy: 0.168
Policy_KL: 0

ADV1:  0.00021479001166677266 0.009089101582456906 0.058960857503212394 -0.05690091008051883
ADV2:  0.020363318449159038 0.8526880810748446 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   3.5678   1.4546   8.4543  37.2774  23.1806  15.1808
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0003   0.0002   0.0007   6.6368   2.2852   2.4929
***** Episode 109197, Mean R = -17.6  Std R = 6.8  Min R = -37.8
PolicyLoss: -0.026
Policy_Beta: 0.114
Policy_Entropy: 0.166
Policy_KL: 0.00124
Policy_SD: 0.536
Policy_lr_mult: 0.0878
Steps: 1.17e+04
TotalSteps: 4.04e+07
VF_0_ExplainedVarNew: 0.983
VF_0_ExplainedVarOld: 0.981
VF_0_Loss : 0.000126


ADV1:  0.000818770653728087 0.008810776371436057 0.038563019274778246 -0.05861413574334351
ADV2:  0.011793859797278757 0.8868656645687383 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.5084   1.0017   5.1680  37.2774  23.1806  15.1808
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0011   0.0006   0.0022   6.6368   2.2852  

seeker_angles |   -0.00    0.00 |    0.08    0.08 |   -0.99   -1.00 |    0.98    1.00
cs_angles | -0.0007  0.0041 |  0.0807  0.0830 | -0.9932 -0.9977 |  0.9820  0.9982
optical_flow |  0.0001 -0.0000 |  0.0244  0.0249 | -0.9629 -0.9708 |  1.0513  1.1798
v_err    | -0.0086 |  0.0546 | -0.4522 |  0.1043
landing_rewards |    9.55 |    2.08 |    0.00 |   10.00
landing_margin |   -0.02 |    0.01 |   -0.06 |    0.01
tracking_rewards |  -21.83 |    4.37 |  -39.06 |  -13.74
steps    |     377 |      19 |     336 |     412
***** Episode 109476, Mean R = -17.5  Std R = 5.1  Min R = -30.2
PolicyLoss: -0.0175
Policy_Beta: 0.114
Policy_Entropy: 0.167
Policy_KL: 0.00139
Policy_SD: 0.553
Policy_lr_mult: 0.0878
Steps: 1.16e+04
TotalSteps: 4.05e+07
VF_0_ExplainedVarNew: 0.994
VF_0_ExplainedVarOld: 0.993
VF_0_Loss : 4.25e-05


ADV1:  -0.0008575335009544193 0.00873770137682906 0.054213414976735985 -0.05081717838448388
ADV2:  0.020783772199007303 0.8638992588721903 3.0 -3.0
Policy  Gradients: u/sd/Max/C Ma

w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.08   -0.05   -0.05 |    0.09    0.07    0.07
a_f      |   -0.01   -0.13 |    0.66    1.83 |   -1.53   -3.13 |    1.46    3.14
w_f      |    0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.02   -0.03   -0.02 |    0.03    0.03    0.02
w_rewards |   -0.32 |    0.31 |   -2.59 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.26 |    0.31 |    0.00 |    2.79
seeker_angles |   -0.00    0.00 |    0.08    0.08 |   -0.97   -0.98 |    0.98    0.96
cs_angles | -0.0017  0.0009 |  0.0844  0.0817 | -0.9727 -0.9831 |  0.9817  0.9595
optical_flow |  0.0001  0.0001 |  0.0233  0.0235 | -1.2073 -1.0057 |  1.0191  0.9082
v_err    | -0.0085 |  0.0540 | -0.4523 |  0.1001
landing_rewards |    9.39 |    2.40 |    0.00 |   10.00
landing_margin |   -0.02 |    0.01 |   -0.06 |    0.01
tracking_rewards |  -21.98 |    4.46 |  -40.08 |  -13.39
steps    |     378 |  

attitude |    0.06   -0.01   -0.17 |    1.21    0.70    1.78 |   -3.14   -1.57   -3.14 |    3.14    1.57    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.09   -0.05   -0.05 |    0.10    0.07    0.07
a_f      |    0.01   -0.22 |    0.68    1.75 |   -1.49   -3.13 |    1.52    3.10
w_f      |    0.00   -0.00    0.00 |    0.01    0.01    0.01 |   -0.02   -0.02   -0.02 |    0.03    0.02    0.02
w_rewards |   -0.32 |    0.36 |   -3.56 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.26 |    0.31 |    0.00 |    2.91
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -0.99   -1.00 |    0.95    0.99
cs_angles |  0.0005  0.0031 |  0.0848  0.0837 | -0.9939 -0.9951 |  0.9533  0.9895
optical_flow | -0.0001 -0.0001 |  0.0229  0.0233 | -0.8332 -1.1451 |  1.1290  0.8556
v_err    | -0.0085 |  0.0548 | -0.4537 |  0.1314
landing_rewards |    9.48 |    2.21 |    0.00 |   10.00
landing_margin |   -0

w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.08   -0.05   -0.05 |    0.09    0.08    0.07
a_f      |   -0.00   -0.14 |    0.65    1.83 |   -1.47   -3.13 |    1.36    3.10
w_f      |    0.00   -0.00    0.00 |    0.01    0.01    0.01 |   -0.02   -0.03   -0.02 |    0.04    0.02    0.02
w_rewards |   -0.34 |    0.31 |   -2.27 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.27 |    0.31 |    0.00 |    2.96
seeker_angles |    0.00    0.00 |    0.09    0.08 |   -0.97   -0.95 |    1.00    0.99
cs_angles |  0.0001  0.0034 |  0.0870  0.0842 | -0.9661 -0.9454 |  0.9990  0.9943
optical_flow |  0.0001  0.0001 |  0.0229  0.0236 | -0.9824 -1.0041 |  1.0950  1.1362
v_err    | -0.0085 |  0.0544 | -0.4530 |  0.1126
landing_rewards |    9.45 |    2.28 |    0.00 |   10.00
landing_margin |   -0.02 |    0.01 |   -0.06 |    0.03
tracking_rewards |  -22.44 |    4.93 |  -41.26 |  -13.65
steps    |     377 |  

thrust   |   -0.00   -0.01   -0.01 |    0.68    0.68    0.68 |   -3.40   -3.46   -3.40 |    3.42    3.46    3.44
norm_thrust |    0.90 |    0.76 |    0.00 |    3.46
fuel     |    1.52 |    0.17 |    1.14 |    2.17
rewards  |  -17.14 |    5.47 |  -42.35 |   -6.81
fuel_rewards |   -4.36 |    0.48 |   -6.22 |   -3.25
glideslope_rewards |    0.00 |    0.00 |    0.00 |    0.00
glideslope_penalty |    0.00 |    0.00 |    0.00 |    0.00
glideslope |    2.77 |   12.55 |    0.00 |  980.28
norm_af  |    1.71 |    0.89 |    0.06 |    3.24
norm_wf  |    0.01 |    0.01 |    0.00 |    0.03
rh_penalty |    0.00 |    0.00 |    0.00 |    0.00
att_rewards |    0.00 |    0.00 |    0.00 |    0.00
att_penalty |    0.00 |    0.00 |    0.00 |    0.00
attitude |   -0.01   -0.04    0.02 |    1.24    0.67    1.83 |   -3.14   -1.56   -3.14 |    3.14    1.55    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.07   -0.05   -0.05 |    0.09    0.07    0.07
a_f      |   -0.03    0.01 |    0.68

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.6265   1.2413   6.9477  37.2774  23.1806  15.1808
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0025   0.0016   0.0063   6.6368   2.2852   2.4929
Update Cnt = 3580    ET =   1159.4   Stats:  Mean, Std, Min, Max
r_f      |    6.69   -6.45    3.50 |  182.76  167.85  204.03 | -394.34 -383.99 -371.01 |  391.44  374.21  391.70
v_f      |   -0.00    0.00   -0.00 |    0.04    0.04    0.05 |   -0.10   -0.12   -0.11 |    0.11    0.10    0.09
r_i      |   26.94  -30.42    2.01 |  674.35  654.53  773.59 |-1373.00-1307.33-1335.91 | 1285.36 1246.85 1303.06
v_i      |   -0.00    0.00    0.00 |    0.04    0.04    0.05 |   -0.09   -0.10   -0.09 |    0.08    0.09    0.10
norm_rf  |    0.21 |    0.08 |    0.03 |    0.45
norm_vf  |    0.08 |    0.01 |    0.04 |    0.13
gs_f     |    1.23 |    1.51 |    0.01 |    9.83
thrust   |   -0.00    0.00   -0.01 |    0.68    0.68    0.69 |   -3.40   -3.44   -3.46 |    3.42    3.44    3.45
norm_thrust |    

ADV1:  0.0015676977339553584 0.009857693227830644 0.08812207740180272 -0.06657462129657538
ADV2:  -0.0004280368998672329 0.8697259188673867 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.7507   1.0169   5.5717  37.2774  23.1806  15.1808
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0024   0.0014   0.0049   6.6368   2.2852   2.4929
***** Episode 111305, Mean R = -17.1  Std R = 4.1  Min R = -26.0
PolicyLoss: -0.0155
Policy_Beta: 0.114
Policy_Entropy: 0.169
Policy_KL: 0.000741
Policy_SD: 0.539
Policy_lr_mult: 0.0878
Steps: 1.15e+04
TotalSteps: 4.11e+07
VF_0_ExplainedVarNew: 0.983
VF_0_ExplainedVarOld: 0.978
VF_0_Loss : 0.000121


ADV1:  -0.0005125562042348097 0.008637148346110323 0.04077938336157083 -0.12433257167340706
ADV2:  0.028225126260447035 0.8202383513939348 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.1595   1.4661   7.5085  37.2774  23.1806  15.1808
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0009   0.0005   0.0019   6.6368   2.285

***** Episode 111553, Mean R = -16.9  Std R = 5.9  Min R = -29.7
PolicyLoss: -0.0287
Policy_Beta: 0.114
Policy_Entropy: 0.169
Policy_KL: 0.000888
Policy_SD: 0.537
Policy_lr_mult: 0.0878
Steps: 1.16e+04
TotalSteps: 4.12e+07
VF_0_ExplainedVarNew: 0.983
VF_0_ExplainedVarOld: 0.978
VF_0_Loss : 0.000291


ADV1:  0.0019492417766453865 0.012946974187074689 0.3151805627167752 -0.3262199467620851
ADV2:  -0.0030362528081176333 0.580689161701545 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.3521   0.6936   3.8035  37.2774  23.1806  15.1808
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0021   0.0013   0.0050   6.6368   2.2852   2.4929
***** Episode 111584, Mean R = -16.7  Std R = 5.4  Min R = -35.8
PolicyLoss: -0.0106
Policy_Beta: 0.114
Policy_Entropy: 0.168
Policy_KL: 0.00118
Policy_SD: 0.528
Policy_lr_mult: 0.0878
Steps: 1.19e+04
TotalSteps: 4.12e+07
VF_0_ExplainedVarNew: 0.98
VF_0_ExplainedVarOld: 0.965
VF_0_Loss : 0.000308


ADV1:  -0.0009165590024172699 0.01102309747409

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.4436   1.3072   6.8779  37.2774  23.1806  15.1808
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0007   0.0005   0.0019   6.6368   2.2852   2.4929
***** Episode 111832, Mean R = -17.2  Std R = 5.5  Min R = -32.0
PolicyLoss: 0.0187
Policy_Beta: 0.114
Policy_Entropy: 0.17
Policy_KL: 0.00118
Policy_SD: 0.536
Policy_lr_mult: 0.0878
Steps: 1.18e+04
TotalSteps: 4.13e+07
VF_0_ExplainedVarNew: 0.993
VF_0_ExplainedVarOld: 0.988
VF_0_Loss : 0.000201


ADV1:  -0.001637506418269282 0.01600498838814349 0.30376974878789814 -0.14530836050928092
ADV2:  0.04202706124343417 0.6169492492495547 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.3016   0.7097   3.2744  37.2774  23.1806  15.1808
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0026   0.0015   0.0057   6.6368   2.2852   2.4929
***** Episode 111863, Mean R = -19.1  Std R = 10.9  Min R = -70.2
PolicyLoss: -0.0387
Policy_Beta: 0.114
Policy_Entropy: 0.169
Policy_KL: 0.0015

ADV1:  0.0022142301354580738 0.008418945515278067 0.05855555816410851 -0.11893703655682641
ADV2:  0.002480168344518567 0.7932317377864911 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.1028   1.0107   5.5366  37.2774  23.1806  15.1808
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0029   0.0017   0.0060   6.6368   2.2852   2.4929
***** Episode 112111, Mean R = -18.0  Std R = 5.9  Min R = -30.2
PolicyLoss: -0.0275
Policy_Beta: 0.114
Policy_Entropy: 0.167
Policy_KL: 0.00073
Policy_SD: 0.548
Policy_lr_mult: 0.0878
Steps: 1.16e+04
TotalSteps: 4.14e+07
VF_0_ExplainedVarNew: 0.99
VF_0_ExplainedVarOld: 0.987
VF_0_Loss : 0.00045


ADV1:  -0.000575277420277535 0.005846056882642694 0.043114768748499954 -0.08629508549820741
ADV2:  0.012540592902997756 0.8672358142170988 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.7448   1.2657   6.1780  37.2774  23.1806  15.1808
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0007   0.0004   0.0016   6.6368   2.2852   2

***** Episode 112359, Mean R = -16.2  Std R = 5.0  Min R = -30.9
PolicyLoss: -0.0139
Policy_Beta: 0.114
Policy_Entropy: 0.169
Policy_KL: 0.000804
Policy_SD: 0.535
Policy_lr_mult: 0.0878
Steps: 1.16e+04
TotalSteps: 4.15e+07
VF_0_ExplainedVarNew: 0.992
VF_0_ExplainedVarOld: 0.988
VF_0_Loss : 0.000262


ADV1:  -0.002150166910086769 0.00799390748842994 0.04080724379700995 -0.07309119832682615
ADV2:  0.044302321739059285 0.8348715579819498 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.7307   0.8263   4.5468  37.2774  23.1806  15.1808
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0022   0.0013   0.0056   6.6368   2.2852   2.4929
***** Episode 112390, Mean R = -16.4  Std R = 5.4  Min R = -31.1
PolicyLoss: -0.029
Policy_Beta: 0.114
Policy_Entropy: 0.167
Policy_KL: 0.00117
Policy_SD: 0.532
Policy_lr_mult: 0.0878
Steps: 1.17e+04
TotalSteps: 4.15e+07
VF_0_ExplainedVarNew: 0.987
VF_0_ExplainedVarOld: 0.985
VF_0_Loss : 0.000168


ADV1:  0.0010148887297709323 0.006990889760335

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.4936   0.7876   4.4249  37.2774  23.1806  15.1808
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0007   0.0004   0.0015   6.6368   2.2852   2.4929
***** Episode 112638, Mean R = -16.0  Std R = 4.0  Min R = -31.6
PolicyLoss: -0.0212
Policy_Beta: 0.114
Policy_Entropy: 0.169
Policy_KL: 0.000985
Policy_SD: 0.532
Policy_lr_mult: 0.0878
Steps: 1.17e+04
TotalSteps: 4.16e+07
VF_0_ExplainedVarNew: 0.988
VF_0_ExplainedVarOld: 0.987
VF_0_Loss : 0.000119


ADV1:  -0.0006705228704196513 0.007398495711901385 0.0822126982108426 -0.06073836866666017
ADV2:  0.022793372329889518 0.8078557552719633 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.2262   0.5335   2.4573  37.2774  23.1806  15.1808
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0010   0.0005   0.0018   6.6368   2.2852   2.4929
***** Episode 112669, Mean R = -16.4  Std R = 4.5  Min R = -28.3
PolicyLoss: -0.0189
Policy_Beta: 0.114
Policy_Entropy: 0.168
Policy_KL: 0.

ADV1:  -0.0014354914352265739 0.009171350837993367 0.04796141404511994 -0.061375350321072206
ADV2:  0.030440647301128675 0.8670013765331486 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.1584   1.2758   6.5513  37.2774  23.1806  15.1808
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0019   0.0011   0.0038   6.6368   2.2852   2.4929
***** Episode 112917, Mean R = -17.6  Std R = 4.6  Min R = -28.4
PolicyLoss: -0.0232
Policy_Beta: 0.114
Policy_Entropy: 0.168
Policy_KL: 0.000918
Policy_SD: 0.542
Policy_lr_mult: 0.0878
Steps: 1.16e+04
TotalSteps: 4.17e+07
VF_0_ExplainedVarNew: 0.984
VF_0_ExplainedVarOld: 0.982
VF_0_Loss : 0.000114


ADV1:  0.00045160880132365195 0.00951319550701261 0.12826962448284274 -0.10105326042220286
ADV2:  0.020822551588434095 0.8363236513456792 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.5028   1.4462   7.4764  37.2774  23.1806  15.1808
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0004   0.0003   0.0012   6.6368   2.2852

seeker_angles |    0.00    0.00 |    0.09    0.08 |   -0.99   -1.00 |    1.00    1.00
cs_angles |  0.0049  0.0011 |  0.0887  0.0830 | -0.9928 -0.9996 |  0.9995  0.9960
optical_flow | -0.0001 -0.0001 |  0.0255  0.0251 | -1.1507 -1.1670 |  1.2539  1.1322
v_err    | -0.0088 |  0.0548 | -0.4524 |  0.1100
landing_rewards |    9.42 |    2.34 |    0.00 |   10.00
landing_margin |   -0.02 |    0.01 |   -0.06 |    0.04
tracking_rewards |  -22.29 |    5.65 |  -74.71 |  -13.91
steps    |     377 |      20 |     336 |     416
***** Episode 113196, Mean R = -18.4  Std R = 5.8  Min R = -31.9
PolicyLoss: -0.0241
Policy_Beta: 0.114
Policy_Entropy: 0.169
Policy_KL: 0.00112
Policy_SD: 0.541
Policy_lr_mult: 0.0878
Steps: 1.17e+04
TotalSteps: 4.19e+07
VF_0_ExplainedVarNew: 0.99
VF_0_ExplainedVarOld: 0.989
VF_0_Loss : 0.000105


ADV1:  0.0023682368092247546 0.007693812881469013 0.07286083908341157 -0.044284081582945056
ADV2:  -0.008304664818189278 0.9056960854223635 3.0 -3.0
Policy  Gradients: u/sd/Max/C Ma

attitude |   -0.05    0.01   -0.01 |    1.24    0.66    1.90 |   -3.14   -1.57   -3.14 |    3.14    1.55    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.07   -0.05   -0.05 |    0.08    0.07    0.07
a_f      |    0.01   -0.02 |    0.66    1.91 |   -1.54   -3.13 |    1.48    3.13
w_f      |    0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.02   -0.03   -0.01 |    0.04    0.02    0.02
w_rewards |   -0.25 |    0.21 |   -1.18 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.26 |    0.31 |    0.00 |    2.85
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -0.98   -0.97 |    1.00    0.97
cs_angles |  0.0040  0.0015 |  0.0823  0.0844 | -0.9780 -0.9675 |  0.9975  0.9672
optical_flow | -0.0000 -0.0000 |  0.0231  0.0244 | -1.0223 -1.1307 |  1.0537  1.1316
v_err    | -0.0092 |  0.0545 | -0.4533 |  0.1182
landing_rewards |    9.58 |    2.00 |    0.00 |   10.00
landing_margin |   -0

attitude |   -0.00   -0.00   -0.15 |    1.15    0.66    1.79 |   -3.14   -1.56   -3.14 |    3.14    1.57    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.07   -0.05   -0.05 |    0.09    0.07    0.07
a_f      |    0.00   -0.12 |    0.66    1.77 |   -1.42   -3.13 |    1.46    3.14
w_f      |    0.00   -0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.02 |    0.03    0.03    0.02
w_rewards |   -0.27 |    0.30 |   -2.40 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.26 |    0.31 |    0.00 |    2.93
seeker_angles |    0.00   -0.00 |    0.08    0.08 |   -0.96   -1.00 |    1.00    1.00
cs_angles |  0.0036 -0.0009 |  0.0834  0.0808 | -0.9640 -0.9999 |  0.9979  0.9964
optical_flow | -0.0001  0.0001 |  0.0227  0.0249 | -1.0207 -1.0609 |  1.1029  1.1339
v_err    | -0.0089 |  0.0549 | -0.4533 |  0.1052
landing_rewards |    9.48 |    2.21 |    0.00 |   10.00
landing_margin |   -0

thrust   |   -0.01   -0.00    0.00 |    0.69    0.69    0.69 |   -3.46   -3.45   -3.44 |    3.44    3.46    3.44
norm_thrust |    0.91 |    0.77 |    0.00 |    3.46
fuel     |    1.55 |    0.18 |    1.19 |    2.20
rewards  |  -17.12 |    5.39 |  -34.28 |   -8.11
fuel_rewards |   -4.44 |    0.51 |   -6.30 |   -3.39
glideslope_rewards |    0.00 |    0.00 |    0.00 |    0.00
glideslope_penalty |    0.00 |    0.00 |    0.00 |    0.00
glideslope |    2.76 |   12.81 |    0.01 |  351.02
norm_af  |    1.72 |    0.88 |    0.12 |    3.35
norm_wf  |    0.01 |    0.01 |    0.00 |    0.03
rh_penalty |    0.00 |    0.00 |    0.00 |    0.00
att_rewards |    0.00 |    0.00 |    0.00 |    0.00
att_penalty |    0.00 |    0.00 |    0.00 |    0.00
attitude |   -0.09    0.05    0.02 |    1.16    0.67    1.80 |   -3.14   -1.56   -3.14 |    3.14    1.55    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.08   -0.05   -0.05 |    0.09    0.07    0.06
a_f      |    0.06    0.04 |    0.67

ADV1:  -0.0012981750905948837 0.008989749580514914 0.048873740070685234 -0.06607437311370509
ADV2:  0.03602805192972889 0.8391258793288772 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   4.9082   2.1394  10.3057  37.2774  23.1806  15.1808
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0016   0.0010   0.0034   6.6368   2.2852   2.4929
Update Cnt = 3690    ET =   1105.5   Stats:  Mean, Std, Min, Max
r_f      |    0.30   -6.39   -9.94 |  184.05  169.55  204.71 | -380.38 -381.81 -398.01 |  387.31  350.85  377.61
v_f      |   -0.00    0.00    0.00 |    0.04    0.04    0.05 |   -0.10   -0.10   -0.11 |    0.10    0.09    0.10
r_i      |    2.56  -42.59  -37.18 |  700.33  637.78  763.91 |-1279.29-1290.54-1246.20 | 1380.33 1284.16 1292.33
v_i      |   -0.00    0.00    0.00 |    0.04    0.04    0.05 |   -0.10   -0.09   -0.09 |    0.09    0.09    0.10
norm_rf  |    0.20 |    0.08 |    0.04 |    0.51
norm_vf  |    0.08 |    0.01 |    0.04 |    0.12
gs_f     |    1.32 |    1.98 | 

***** Episode 114684, Mean R = -17.4  Std R = 6.2  Min R = -37.5
PolicyLoss: -0.00514
Policy_Beta: 0.114
Policy_Entropy: 0.17
Policy_KL: 0.00098
Policy_SD: 0.538
Policy_lr_mult: 0.0878
Steps: 1.17e+04
TotalSteps: 4.24e+07
VF_0_ExplainedVarNew: 0.995
VF_0_ExplainedVarOld: 0.993
VF_0_Loss : 8.43e-05


ADV1:  -0.0005671616344928508 0.00782201990645132 0.09503953074728028 -0.06838744760261367
ADV2:  0.026399910685960613 0.8161038095624189 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.8107   0.7541   4.0210  37.2774  23.1806  15.1808
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0010   0.0005   0.0018   6.6368   2.2852   2.4929
***** Episode 114715, Mean R = -16.6  Std R = 4.9  Min R = -26.2
PolicyLoss: -0.0253
Policy_Beta: 0.114
Policy_Entropy: 0.169
Policy_KL: 0.00116
Policy_SD: 0.533
Policy_lr_mult: 0.0878
Steps: 1.15e+04
TotalSteps: 4.24e+07
VF_0_ExplainedVarNew: 0.988
VF_0_ExplainedVarOld: 0.987
VF_0_Loss : 7.83e-05


ADV1:  -0.0015479281315908745 0.0086376653567

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   3.1337   1.6590   8.1939  37.2774  23.1806  15.1808
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0037   0.0022   0.0075   6.6368   2.2852   2.4929
***** Episode 114963, Mean R = -16.3  Std R = 4.4  Min R = -26.1
PolicyLoss: -0.0139
Policy_Beta: 0.114
Policy_Entropy: 0.17
Policy_KL: 0.00119
Policy_SD: 0.541
Policy_lr_mult: 0.0878
Steps: 1.16e+04
TotalSteps: 4.25e+07
VF_0_ExplainedVarNew: 0.99
VF_0_ExplainedVarOld: 0.987
VF_0_Loss : 0.000108


ADV1:  -0.001007306562770547 0.0071525695164757035 0.040049606502750246 -0.0813667114572808
ADV2:  0.030092766952974512 0.8510813220275393 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.8394   0.9115   3.9442  37.2774  23.1806  15.1808
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0014   0.0008   0.0027   6.6368   2.2852   2.4929
***** Episode 114994, Mean R = -16.2  Std R = 4.5  Min R = -27.9
PolicyLoss: -0.0247
Policy_Beta: 0.114
Policy_Entropy: 0.17
Policy_KL: 0.001

ADV1:  0.0012703424484118715 0.005540461796584706 0.0728203548010416 -0.04620855153626474
ADV2:  -0.016776103256050952 0.8867940303282532 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   3.0586   1.5776   7.6484  37.2774  23.1806  15.1808
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0017   0.0010   0.0035   6.6368   2.2852   2.4929
***** Episode 115242, Mean R = -15.9  Std R = 4.0  Min R = -26.3
PolicyLoss: -0.00309
Policy_Beta: 0.114
Policy_Entropy: 0.171
Policy_KL: 0.000872
Policy_SD: 0.527
Policy_lr_mult: 0.0878
Steps: 1.17e+04
TotalSteps: 4.26e+07
VF_0_ExplainedVarNew: 0.994
VF_0_ExplainedVarOld: 0.993
VF_0_Loss : 9.68e-05


ADV1:  -0.0022517605812778173 0.008207754634987479 0.07244700949092031 -0.052098044446571075
ADV2:  0.04945131765189375 0.807953000136524 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.8944   0.9554   3.8878  37.2774  23.1806  15.1808
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0036   0.0018   0.0062   6.6368   2.2852 

***** Episode 115490, Mean R = -17.2  Std R = 4.6  Min R = -29.0
PolicyLoss: -0.0198
Policy_Beta: 0.114
Policy_Entropy: 0.169
Policy_KL: 0.000903
Policy_SD: 0.543
Policy_lr_mult: 0.0878
Steps: 1.17e+04
TotalSteps: 4.27e+07
VF_0_ExplainedVarNew: 0.991
VF_0_ExplainedVarOld: 0.988
VF_0_Loss : 0.000242


ADV1:  -0.003529571892039937 0.010260702255066973 0.06528274221247488 -0.07360197571976473
ADV2:  0.04713236188516104 0.8672641874748648 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.7459   1.1254   5.8090  37.2774  23.1806  15.1808
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0037   0.0022   0.0092   6.6368   2.2852   2.4929
***** Episode 115521, Mean R = -18.6  Std R = 6.8  Min R = -30.4
PolicyLoss: -0.0246
Policy_Beta: 0.114
Policy_Entropy: 0.168
Policy_KL: 0.000779
Policy_SD: 0.542
Policy_lr_mult: 0.0878
Steps: 1.18e+04
TotalSteps: 4.27e+07
VF_0_ExplainedVarNew: 0.981
VF_0_ExplainedVarOld: 0.979
VF_0_Loss : 0.000421


ADV1:  0.0013600730759734893 0.0097011786009

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.1779   1.3659   7.3964  37.2774  23.1806  15.1808
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0007   0.0005   0.0017   6.6368   2.2852   2.4929
***** Episode 115769, Mean R = -18.4  Std R = 5.2  Min R = -32.0
PolicyLoss: -0.0263
Policy_Beta: 0.114
Policy_Entropy: 0.169
Policy_KL: 0.000938
Policy_SD: 0.551
Policy_lr_mult: 0.0878
Steps: 1.16e+04
TotalSteps: 4.28e+07
VF_0_ExplainedVarNew: 0.989
VF_0_ExplainedVarOld: 0.988
VF_0_Loss : 0.000148


ADV1:  -0.0005043557559573789 0.006207801223173945 0.03920151398011201 -0.043360384683651
ADV2:  0.01683211129070971 0.879651051456875 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.7570   1.0590   4.3712  37.2774  23.1806  15.1808
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0008   0.0005   0.0017   6.6368   2.2852   2.4929
***** Episode 115800, Mean R = -16.6  Std R = 5.0  Min R = -33.5
PolicyLoss: -0.0147
Policy_Beta: 0.114
Policy_Entropy: 0.17
Policy_KL: 0.0008

ADV1:  0.0010009535042301068 0.00806415719861302 0.052474842290378076 -0.07038173434894733
ADV2:  0.010100199908753287 0.8326183750219078 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.5138   0.8077   4.3811  37.2774  23.1806  15.1808
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0014   0.0008   0.0030   6.6368   2.2852   2.4929
***** Episode 116048, Mean R = -16.9  Std R = 5.6  Min R = -30.1
PolicyLoss: -0.0241
Policy_Beta: 0.114
Policy_Entropy: 0.169
Policy_KL: 0.00109
Policy_SD: 0.55
Policy_lr_mult: 0.0878
Steps: 1.15e+04
TotalSteps: 4.29e+07
VF_0_ExplainedVarNew: 0.988
VF_0_ExplainedVarOld: 0.986
VF_0_Loss : 0.000236


ADV1:  -0.0009190211757761033 0.005271205480840304 0.05043159371865108 -0.0448280534310328
ADV2:  0.012885153627161899 0.9232217190597162 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.4950   0.9779   5.2269  37.2774  23.1806  15.1808
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0013   0.0008   0.0026   6.6368   2.2852   2

***** Episode 116296, Mean R = -17.3  Std R = 5.4  Min R = -33.8
PolicyLoss: -0.0321
Policy_Beta: 0.114
Policy_Entropy: 0.17
Policy_KL: 0.00112
Policy_SD: 0.54
Policy_lr_mult: 0.0878
Steps: 1.16e+04
TotalSteps: 4.3e+07
VF_0_ExplainedVarNew: 0.985
VF_0_ExplainedVarOld: 0.984
VF_0_Loss : 0.000197


ADV1:  0.001465627773754055 0.005797450786949508 0.047392019599448 -0.03529187660410706
ADV2:  -0.01607782246536951 0.905127998912903 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.9900   0.4216   1.9968  37.2774  23.1806  15.1808
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0026   0.0014   0.0046   6.6368   2.2852   2.4929
***** Episode 116327, Mean R = -16.3  Std R = 5.6  Min R = -31.7
PolicyLoss: -0.00181
Policy_Beta: 0.114
Policy_Entropy: 0.169
Policy_KL: 0.000957
Policy_SD: 0.524
Policy_lr_mult: 0.0878
Steps: 1.18e+04
TotalSteps: 4.3e+07
VF_0_ExplainedVarNew: 0.994
VF_0_ExplainedVarOld: 0.993
VF_0_Loss : 0.000177


ADV1:  0.00042650503016648664 0.007070303702535383 

seeker_angles |    0.00   -0.00 |    0.08    0.08 |   -1.00   -0.93 |    1.00    0.99
cs_angles |  0.0004 -0.0005 |  0.0837  0.0832 | -0.9966 -0.9253 |  0.9970  0.9920
optical_flow | -0.0001  0.0003 |  0.0241  0.0248 | -1.1633 -0.9830 |  1.1307  1.2359
v_err    | -0.0092 |  0.0546 | -0.4529 |  0.1049
landing_rewards |    9.71 |    1.68 |    0.00 |   10.00
landing_margin |   -0.02 |    0.01 |   -0.06 |    0.02
tracking_rewards |  -21.93 |    4.90 |  -49.51 |  -13.73
steps    |     379 |      20 |     336 |     417
***** Episode 116606, Mean R = -15.2  Std R = 4.6  Min R = -28.0
PolicyLoss: -0.0183
Policy_Beta: 0.114
Policy_Entropy: 0.169
Policy_KL: 0.0009
Policy_SD: 0.532
Policy_lr_mult: 0.0878
Steps: 1.18e+04
TotalSteps: 4.31e+07
VF_0_ExplainedVarNew: 0.994
VF_0_ExplainedVarOld: 0.993
VF_0_Loss : 0.000181


ADV1:  -0.0021960640827476 0.010075339297812251 0.032185956164992646 -0.06522193875132325
ADV2:  0.037039953882071514 0.8719107835317574 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/M

attitude |    0.04   -0.02    0.14 |    1.11    0.64    1.79 |   -3.14   -1.56   -3.14 |    3.14    1.56    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.08   -0.05   -0.05 |    0.08    0.07    0.07
a_f      |   -0.02    0.11 |    0.63    1.77 |   -1.53   -3.07 |    1.50    3.14
w_f      |    0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.02   -0.03   -0.02 |    0.03    0.02    0.02
w_rewards |   -0.24 |    0.23 |   -1.79 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.26 |    0.31 |    0.00 |    3.04
seeker_angles |    0.00   -0.00 |    0.09    0.08 |   -0.99   -1.00 |    0.98    0.98
cs_angles |  0.0043 -0.0009 |  0.0851  0.0809 | -0.9878 -0.9988 |  0.9765  0.9803
optical_flow |  0.0000  0.0001 |  0.0240  0.0243 | -0.9614 -1.0692 |  1.0316  1.2429
v_err    | -0.0092 |  0.0547 | -0.4532 |  0.1071
landing_rewards |    9.58 |    2.00 |    0.00 |   10.00
landing_margin |   -0

attitude |   -0.02    0.01    0.00 |    1.18    0.68    1.80 |   -3.14   -1.54   -3.14 |    3.14    1.57    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.07   -0.05   -0.05 |    0.10    0.07    0.07
a_f      |    0.01   -0.04 |    0.68    1.79 |   -1.35   -3.13 |    1.52    3.13
w_f      |    0.00   -0.00   -0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.02 |    0.03    0.02    0.02
w_rewards |   -0.25 |    0.33 |   -3.08 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.26 |    0.31 |    0.00 |    3.08
seeker_angles |    0.00   -0.00 |    0.09    0.08 |   -0.96   -1.00 |    1.00    0.99
cs_angles |  0.0010 -0.0009 |  0.0856  0.0814 | -0.9576 -0.9964 |  0.9995  0.9909
optical_flow | -0.0000  0.0002 |  0.0244  0.0235 | -1.1051 -1.2718 |  1.0427  1.1183
v_err    | -0.0090 |  0.0544 | -0.4515 |  0.1060
landing_rewards |    9.48 |    2.21 |    0.00 |   10.00
landing_margin |   -0

attitude |   -0.05   -0.00    0.11 |    1.23    0.67    1.81 |   -3.14   -1.53   -3.14 |    3.14    1.56    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.07   -0.05   -0.05 |    0.08    0.07    0.07
a_f      |   -0.01    0.19 |    0.67    1.82 |   -1.47   -3.10 |    1.48    3.13
w_f      |    0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.02   -0.02   -0.02 |    0.03    0.02    0.02
w_rewards |   -0.24 |    0.22 |   -1.53 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.25 |    0.31 |    0.00 |    3.00
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -1.00   -0.99 |    0.99    1.00
cs_angles |  0.0001  0.0029 |  0.0807  0.0802 | -0.9958 -0.9887 |  0.9903  0.9988
optical_flow | -0.0001  0.0000 |  0.0246  0.0231 | -1.0621 -1.1610 |  1.4061  1.0088
v_err    | -0.0089 |  0.0546 | -0.4524 |  0.1051
landing_rewards |    9.55 |    2.08 |    0.00 |   10.00
landing_margin |   -0

attitude |    0.05   -0.01   -0.11 |    1.19    0.67    1.88 |   -3.14   -1.57   -3.14 |    3.14    1.56    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.08   -0.05   -0.05 |    0.08    0.07    0.07
a_f      |   -0.02   -0.12 |    0.67    1.87 |   -1.50   -3.14 |    1.41    3.10
w_f      |    0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.02   -0.02   -0.02 |    0.04    0.02    0.03
w_rewards |   -0.26 |    0.25 |   -1.67 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.25 |    0.30 |    0.00 |    2.84
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -1.00   -0.99 |    0.99    0.97
cs_angles |  0.0021  0.0035 |  0.0818  0.0825 | -0.9975 -0.9915 |  0.9889  0.9721
optical_flow |  0.0000  0.0000 |  0.0235  0.0240 | -1.0996 -1.2521 |  1.0845  1.1761
v_err    | -0.0089 |  0.0546 | -0.4530 |  0.1071
landing_rewards |    9.29 |    2.57 |    0.00 |   10.00
landing_margin |   -0

w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.07   -0.05   -0.05 |    0.08    0.07    0.07
a_f      |    0.06    0.02 |    0.68    1.82 |   -1.45   -3.11 |    1.56    3.13
w_f      |    0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.02 |    0.03    0.02    0.02
w_rewards |   -0.24 |    0.24 |   -1.93 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.26 |    0.30 |    0.00 |    2.73
seeker_angles |    0.00   -0.00 |    0.08    0.08 |   -0.99   -0.98 |    0.97    0.98
cs_angles |  0.0021 -0.0002 |  0.0812  0.0814 | -0.9943 -0.9761 |  0.9699  0.9761
optical_flow | -0.0001  0.0000 |  0.0233  0.0233 | -1.0599 -1.0274 |  1.0940  1.0368
v_err    | -0.0092 |  0.0544 | -0.4536 |  0.0968
landing_rewards |    9.61 |    1.93 |    0.00 |   10.00
landing_margin |   -0.02 |    0.01 |   -0.06 |    0.02
tracking_rewards |  -21.72 |    4.41 |  -39.06 |  -14.59
steps    |     377 |  

attitude |    0.02   -0.05    0.18 |    1.15    0.65    1.79 |   -3.14   -1.54   -3.14 |    3.14    1.55    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.07   -0.05   -0.05 |    0.07    0.07    0.07
a_f      |   -0.07    0.18 |    0.65    1.79 |   -1.48   -3.12 |    1.49    3.13
w_f      |    0.00   -0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.02 |    0.03    0.03    0.02
w_rewards |   -0.25 |    0.23 |   -1.14 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.26 |    0.31 |    0.00 |    3.03
seeker_angles |    0.00    0.00 |    0.09    0.08 |   -0.96   -0.97 |    0.99    0.97
cs_angles |  0.0019  0.0025 |  0.0852  0.0819 | -0.9602 -0.9656 |  0.9928  0.9696
optical_flow |  0.0000  0.0001 |  0.0228  0.0229 | -0.9631 -0.9312 |  1.2014  1.1925
v_err    | -0.0088 |  0.0546 | -0.4539 |  0.1061
landing_rewards |    9.48 |    2.21 |    0.00 |   10.00
landing_margin |   -0

w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.07   -0.05   -0.05 |    0.07    0.07    0.07
a_f      |    0.01    0.08 |    0.65    1.83 |   -1.41   -3.14 |    1.44    3.14
w_f      |    0.00   -0.00    0.00 |    0.01    0.01    0.01 |   -0.02   -0.02   -0.02 |    0.03    0.03    0.02
w_rewards |   -0.25 |    0.24 |   -1.43 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.26 |    0.30 |    0.00 |    2.82
seeker_angles |   -0.00    0.01 |    0.08    0.08 |   -0.98   -0.95 |    0.99    1.00
cs_angles | -0.0007  0.0056 |  0.0841  0.0811 | -0.9849 -0.9547 |  0.9940  0.9966
optical_flow |  0.0001  0.0000 |  0.0229  0.0236 | -0.9767 -1.1145 |  1.0601  0.9947
v_err    | -0.0091 |  0.0547 | -0.4534 |  0.1078
landing_rewards |    9.65 |    1.85 |    0.00 |   10.00
landing_margin |   -0.02 |    0.01 |   -0.07 |    0.02
tracking_rewards |  -21.83 |    4.40 |  -40.10 |  -13.65
steps    |     377 |  

attitude |    0.03    0.02   -0.19 |    1.20    0.67    1.78 |   -3.14   -1.56   -3.14 |    3.14    1.56    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.07   -0.05   -0.05 |    0.08    0.07    0.07
a_f      |    0.03   -0.21 |    0.68    1.80 |   -1.48   -3.13 |    1.46    3.11
w_f      |    0.00   -0.00    0.00 |    0.01    0.01    0.01 |   -0.02   -0.02   -0.03 |    0.03    0.02    0.02
w_rewards |   -0.29 |    0.26 |   -1.98 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.26 |    0.31 |    0.00 |    2.91
seeker_angles |    0.00    0.00 |    0.08    0.09 |   -0.98   -0.98 |    0.89    0.99
cs_angles |  0.0031  0.0016 |  0.0840  0.0869 | -0.9831 -0.9798 |  0.8867  0.9938
optical_flow | -0.0003  0.0002 |  0.0238  0.0244 | -1.0636 -1.2343 |  0.9776  1.2631
v_err    | -0.0090 |  0.0546 | -0.4524 |  0.1040
landing_rewards |    9.48 |    2.21 |    0.00 |   10.00
landing_margin |   -0

attitude |    0.14   -0.01    0.13 |    1.22    0.65    1.84 |   -3.14   -1.57   -3.14 |    3.14    1.55    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.07   -0.05   -0.05 |    0.09    0.07    0.07
a_f      |   -0.01    0.11 |    0.65    1.86 |   -1.52   -3.13 |    1.43    3.11
w_f      |    0.00   -0.00    0.00 |    0.01    0.01    0.01 |   -0.02   -0.02   -0.02 |    0.03    0.03    0.02
w_rewards |   -0.24 |    0.28 |   -2.87 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.25 |    0.30 |    0.00 |    3.09
seeker_angles |   -0.00    0.00 |    0.08    0.08 |   -0.99   -0.98 |    1.00    0.95
cs_angles | -0.0002  0.0024 |  0.0824  0.0785 | -0.9936 -0.9776 |  0.9976  0.9547
optical_flow | -0.0001  0.0001 |  0.0237  0.0245 | -1.2240 -0.9747 |  1.1258  1.3111
v_err    | -0.0088 |  0.0544 | -0.4525 |  0.1297
landing_rewards |    9.39 |    2.40 |    0.00 |   10.00
landing_margin |   -0

attitude |    0.07    0.03    0.07 |    1.16    0.64    1.81 |   -3.14   -1.54   -3.14 |    3.14    1.56    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.07   -0.05   -0.05 |    0.09    0.07    0.07
a_f      |    0.03    0.06 |    0.64    1.83 |   -1.44   -3.13 |    1.55    3.10
w_f      |    0.00   -0.00    0.00 |    0.01    0.01    0.01 |   -0.02   -0.02   -0.02 |    0.03    0.02    0.02
w_rewards |   -0.25 |    0.25 |   -2.64 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.25 |    0.30 |    0.00 |    2.65
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -1.00   -0.98 |    0.99    0.98
cs_angles |  0.0021  0.0047 |  0.0804  0.0825 | -0.9962 -0.9820 |  0.9859  0.9757
optical_flow | -0.0000 -0.0001 |  0.0250  0.0248 | -1.0737 -1.1503 |  1.1484  1.2060
v_err    | -0.0087 |  0.0544 | -0.4514 |  0.1073
landing_rewards |    9.65 |    1.85 |    0.00 |   10.00
landing_margin |   -0

In [7]:
# Name under which the current policy parameters are saved; handed to
# policy.save_params on the next line.
# NOTE(review): the on-disk location/format is decided inside save_params,
# which is not visible in this notebook — confirm before relying on it.
# NOTE(review): this cell shows execution count 7 while the cells after it
# show 5 and 6, so it was last run out of order; re-check on a fresh
# Restart & Run All that `policy` holds the parameters you intend to save.
fname = "optimize_WATTVW_FOV-AR=5-RPT2"
policy.save_params(fname)


In [5]:
# Evaluate `agent` in `env` through Env.test_policy_batch with test_mode on.
# NOTE(review): presumably 5000 is the number of test episodes and
# print_every=100 the reporting interval — confirm against Env.test_policy_batch.
# The recorded output for this cell ends in KeyboardInterrupt, i.e. the saved
# run was stopped by hand and its statistics are not complete.
env.test_policy_batch(agent,5000,print_every=100,test_mode=True)

worked 1
Dynamics: Max Disturbance (m/s^2):  [0.00127313 0.00130788 0.00159816] 0.0024260046138067644


KeyboardInterrupt: 

In [6]:
# Prints the literal 1 and nothing else.
# NOTE(review): looks like a leftover check that the kernel was responsive
# after the interrupt — consider deleting this cell from the final notebook.
print(1)

1
